LLM: Fix ParallelLMHead convert in vLLM cpu (#11654)
This commit is contained in:
parent
777e61d8c8
commit
4499d25c26
1 changed file with 2 additions and 1 deletion
|
|
@@ -153,8 +153,9 @@ def is_linear_module(module):
|
|||
VLLM_LINEAR_LIST = [
|
||||
ColumnParallelLinear, RowParallelLinear, QKVParallelLinear,
|
||||
MergedColumnParallelLinear,
|
||||
ParallelLMHead
|
||||
]
|
||||
if 'xpu' in _VLLM_VERSION:
|
||||
VLLM_LINEAR_LIST.append(ParallelLMHead)
|
||||
if is_module_in_classes(module, VLLM_LINEAR_LIST):
|
||||
if 'xpu' in _VLLM_VERSION:
|
||||
# For vllm xpu
|
||||
|
|
|
|||
Loading…
Reference in a new issue