File tree: 1 file changed, +6 -4 lines changed
python/llm/src/ipex_llm/vllm/xpu: 1 file changed, +6 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -93,10 +93,12 @@ def _ipex_llm_load_model(self) -> None:
93
93
vllm_config = new_vllm_config
94
94
)
95
95
if self .vllm_config .model_config .low_bit_model_path is None :
96
- if "qwen" in self .vllm_config .model_config .model .lower () or \
97
- "baichuan" in self .vllm_config .model_config .model .lower () or \
98
- "codegeex4-all" in self .vllm_config .model_config .model .lower () or \
99
- "chatglm" in self .vllm_config .model_config .model .lower ():
96
+ if ("qwen" in self .vllm_config .model_config .model .lower () or
97
+ "baichuan" in self .vllm_config .model_config .model .lower () or
98
+ "codegeex4-all" in self .vllm_config .model_config .model .lower () or
99
+ "chatglm" in self .vllm_config .model_config .model .lower ()) and \
100
+ "gptq" not in self .model_config .model .lower () and \
101
+ "awq" not in self .model_config .model .lower ():
100
102
self .model .apply (padding_mlp )
101
103
from ipex_llm import optimize_model
102
104
not_convert_last_mlp = os .getenv ("IPEX_LLM_NOT_CONVERT_LAST_MLP" , None )
You can’t perform that action at this time.
0 commit comments