Skip to content

Commit 4730f04

Browse files
committed
Change the convert tools.
1 parent 4bfe3d9 commit 4730f04

File tree

2 files changed

+10
-8
lines changed

2 files changed

+10
-8
lines changed

README.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -49,11 +49,11 @@ xFasterTransformer provides a series of APIs, both of C++ and Python, for end us
4949
| ChatGLM3 | ✔ | ✔ | ✔ |
5050
| Llama | ✔ | ✔ | ✔ |
5151
| Llama2 | ✔ | ✔ | ✔ |
52-
| Deepseek-coder | ✔ | ✔ | ✔ |
5352
| Baichuan | ✔ | ✔ | ✔ |
5453
| QWen | ✔ | ✔ | ✔ |
5554
| SecLLM(YaRN-Llama) | ✔ | ✔ | ✔ |
5655
| Opt | ✔ | ✔ | ✔ |
56+
| Deepseek-coder | ✔ | ✔ | ✔ |
5757

5858
### DataType support list
5959

src/xfastertransformer/tools/llama_convert.py

Lines changed: 9 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -125,12 +125,15 @@ def split_and_convert(self, input_dir, output_dir, dtype, processes):
125125
config["llama"]["layernorm_type"] = "pre_layernorm"
126126
config["llama"]["activation_type"] = str(hf_config["hidden_act"])
127127
config["llama"]["rope_theta"] = str(hf_config.get("rope_theta", 10000))
128-
try:
129-
config["llama"]["scaling_factor"] = str(hf_config["rope_scaling"]["factor"])
130-
config["llama"]["rope_type"] = str(hf_config["rope_scaling"]["type"])
131-
except Exception as e:
132-
config["llama"]["scaling_factor"] = 1.0
133-
config["llama"]["rope_type"] = "null"
128+
129+
rope_scaling = hf_config.get("rope_scaling", None)
130+
if rope_scaling:
131+
config["llama"]["scaling_factor"] = str(rope_scaling.get("factor", 1.0))
132+
config["llama"]["rope_type"] = str(rope_scaling.get("type", "null"))
133+
else:
134+
config["llama"]["scaling_factor"] = str(1.0)
135+
config["llama"]["rope_type"] = str("null")
136+
134137
config["llama"]["has_post_decoder_layernorm"] = "1" if has_post_decoder_layernorm else "0"
135138
config["llama"]["vocab_size"] = str(hf_config["vocab_size"])
136139
config["llama"]["start_id"] = str(hf_config["bos_token_id"])
@@ -140,7 +143,6 @@ def split_and_convert(self, input_dir, output_dir, dtype, processes):
140143
config.write(configfile)
141144
except Exception as e:
142145
print("Fail to save the config in config.ini.", str(e))
143-
144146
hf_model_name_pattern = [
145147
"input_layernorm.weight",
146148
"attention.query_key_value.weight",

0 commit comments

Comments (0)