Update Dockerfile (#13148)

This commit is contained in:
Guancheng Fu 2025-05-12 09:19:18 +08:00 committed by GitHub
parent 0438e39f3e
commit da08c9ca60
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -182,8 +182,9 @@ RUN set -eux && \
pip uninstall -y oneccl oneccl-devel && \
rm -rf /llm/vllm_for_multi_arc.patch && \
pip install mpi4py fastapi uvicorn openai && \
pip install ray numba
pip install ray numba && \
# Re-enable sym_int4
sed -i 's/qtype = ggml_tensor_qtype\["woq_int4"\]/qtype = ggml_tensor_qtype["sym_int4"]/' /usr/local/lib/python3.11/dist-packages/ipex_llm/transformers/convert.py
# Working directory for any later instructions and for the container's main
# process.
WORKDIR /llm/
# Exec-form entrypoint: bash is launched directly (no implicit `/bin/sh -c`
# wrapper) with the start script as its argument.
# NOTE(review): presumably this script launches the vLLM service and was copied
# into /llm/ earlier in the file (not visible in this hunk) — confirm.
ENTRYPOINT ["bash", "/llm/start-vllm-service.sh"]