intel · XuehaoSun · Jun 11, 2024 · Jun 7, 2024 · Jun 7, 2024 · Jun 7, 2024
diff --git a/intel_extension_for_transformers/transformers/utils/utility.py b/intel_extension_for_transformers/transformers/utils/utility.py
@@ -462,6 +462,8 @@ def recover_model_from_json(fp32_model_name_or_path, json_file_path, trust_remot
         (object): quantized model
     """
     from transformers import AutoModelForCausalLM
+
+    # The IPEX int8 model recovered from configure.json requires a float32 input model on the CPU device.
     user_model = AutoModelForCausalLM.from_pretrained(fp32_model_name_or_path,
                                                       trust_remote_code=trust_remote_code).float()
     if user_model.config.model_type in IPEX_OPT_LLM_SUPPORTED:
@@ -496,5 +498,9 @@ def recover_model_from_json(fp32_model_name_or_path, json_file_path, trust_remot
     from intel_extension_for_transformers.transformers.llm.evaluation.models import (
         TSModelCausalLMForITREX,
     )
+    origin_model_type = config.model_type
+    if origin_model_type in ["chatglm", "qwen", "baichuan"]:
+        config.model_type = "qwen2"
     user_model = TSModelCausalLMForITREX(user_model, config=config)
+    user_model.config.model_type = origin_model_type
     return user_model