LLM: Fix ParallelLMHead conversion in vLLM CPU (#11654)

This commit is contained in:
Xiangyu Tian 2024-07-25 13:07:19 +08:00 committed by GitHub
parent 777e61d8c8
commit 4499d25c26
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -153,8 +153,9 @@ def is_linear_module(module):
 VLLM_LINEAR_LIST = [
     ColumnParallelLinear, RowParallelLinear, QKVParallelLinear,
     MergedColumnParallelLinear,
-    ParallelLMHead
 ]
+if 'xpu' in _VLLM_VERSION:
+    VLLM_LINEAR_LIST.append(ParallelLMHead)
 if is_module_in_classes(module, VLLM_LINEAR_LIST):
     if 'xpu' in _VLLM_VERSION:
         # For vllm xpu