LLM: Fix ParallelLMHead convert in vLLM cpu (#11654)
This commit is contained in:
parent
777e61d8c8
commit
4499d25c26
1 changed file with 2 additions and 1 deletion
|
|
@@ -153,8 +153,9 @@ def is_linear_module(module):
|
||||||
VLLM_LINEAR_LIST = [
|
VLLM_LINEAR_LIST = [
|
||||||
ColumnParallelLinear, RowParallelLinear, QKVParallelLinear,
|
ColumnParallelLinear, RowParallelLinear, QKVParallelLinear,
|
||||||
MergedColumnParallelLinear,
|
MergedColumnParallelLinear,
|
||||||
ParallelLMHead
|
|
||||||
]
|
]
|
||||||
|
if 'xpu' in _VLLM_VERSION:
|
||||||
|
VLLM_LINEAR_LIST.append(ParallelLMHead)
|
||||||
if is_module_in_classes(module, VLLM_LINEAR_LIST):
|
if is_module_in_classes(module, VLLM_LINEAR_LIST):
|
||||||
if 'xpu' in _VLLM_VERSION:
|
if 'xpu' in _VLLM_VERSION:
|
||||||
# For vllm xpu
|
# For vllm xpu
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue