vLLM: do not apply MLP padding to GLM-4 models, to avoid NaN errors (#12062)
* No padding for GLM-4
* Add CodeGeeX
This commit is contained in:
parent
649390c464
commit
c75f3dd874
1 changed file with 2 additions and 1 deletion
|
|
@@ -89,7 +89,8 @@ def get_load_function(low_bit):
|
||||||
)
|
)
|
||||||
if "qwen" in self.model_config.model.lower() or \
|
if "qwen" in self.model_config.model.lower() or \
|
||||||
"baichuan" in self.model_config.model.lower() or \
|
"baichuan" in self.model_config.model.lower() or \
|
||||||
"glm" in self.model_config.model.lower():
|
"codegeex4-all" in self.model_config.model.lower() or \
|
||||||
|
"chatglm" in self.model_config.model.lower():
|
||||||
self.model.apply(padding_mlp)
|
self.model.apply(padding_mlp)
|
||||||
from ipex_llm import optimize_model
|
from ipex_llm import optimize_model
|
||||||
import os
|
import os
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue