Skip to content

Commit dbbdd2c

Browse files
hzjane authored and cranechu0131 committed
vllm update for glm-4 model automatic not_convert (intel#12003)
1 parent 33cba9d commit dbbdd2c

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

python/llm/src/ipex_llm/vllm/xpu/model_convert.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -250,7 +250,8 @@ def _ipex_llm_load_model(self) -> None:
250250
from ipex_llm import optimize_model
251251
import os
252252
not_convert_last_mlp = os.getenv("IPEX_LLM_NOT_CONVERT_LAST_MLP", None)
253-
if not_convert_last_mlp is not None:
253+
is_glm4_model = "glm-4" in self.model_config.model.lower()
254+
if not_convert_last_mlp is not None or is_glm4_model:
254255
# only use to avoid nan value in last mlp forward running glm4-9b-chat
255256
modules = ["35.mlp", "36.mlp", "37.mlp", "38.mlp", "39.mlp"]
256257
else:

0 commit comments

Comments
 (0)