From da08c9ca603e9bc2d2f317f077b9e5e84044160a Mon Sep 17 00:00:00 2001 From: Guancheng Fu <110874468+gc-fu@users.noreply.github.com> Date: Mon, 12 May 2025 09:19:18 +0800 Subject: [PATCH] Update Dockerfile (#13148) --- docker/llm/serving/xpu/docker/Dockerfile | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/docker/llm/serving/xpu/docker/Dockerfile b/docker/llm/serving/xpu/docker/Dockerfile index 9a3d7d4d..e9ca4525 100644 --- a/docker/llm/serving/xpu/docker/Dockerfile +++ b/docker/llm/serving/xpu/docker/Dockerfile @@ -182,8 +182,9 @@ RUN set -eux && \ pip uninstall -y oneccl oneccl-devel && \ rm -rf /llm/vllm_for_multi_arc.patch && \ pip install mpi4py fastapi uvicorn openai && \ - pip install ray numba - + pip install ray numba && \ + # Re-enable sym_int4 + sed -i 's/qtype = ggml_tensor_qtype\["woq_int4"\]/qtype = ggml_tensor_qtype["sym_int4"]/' /usr/local/lib/python3.11/dist-packages/ipex_llm/transformers/convert.py WORKDIR /llm/ ENTRYPOINT ["bash", "/llm/start-vllm-service.sh"]