Update vLLM patch (#13079)

* update vllm patch

* Update Dockerfile
This commit is contained in:
Shaojun Liu 2025-04-15 16:55:29 +08:00 committed by GitHub
parent f5aaa83649
commit fa56212bb3
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
2 changed files with 15 additions and 2 deletions

View file

@ -53,7 +53,7 @@ RUN set -eux && \
dpkg -i *.deb && \
#
# Install Intel PyTorch extension for LLM inference
pip install --pre --upgrade ipex-llm[xpu_2.6] --extra-index-url https://download.pytorch.org/whl/xpu && \
pip install --pre --upgrade ipex-llm[xpu_2.6]==2.3.0b20250407 --extra-index-url https://download.pytorch.org/whl/xpu && \
#
# Build torch-ccl
mkdir -p /build && \
@ -123,7 +123,7 @@ RUN set -eux && \
wget https://bootstrap.pypa.io/get-pip.py -O get-pip.py && \
python3 get-pip.py && rm get-pip.py && \
pip install --upgrade requests argparse urllib3 && \
pip install --pre --upgrade ipex-llm[xpu_2.6] --extra-index-url https://download.pytorch.org/whl/xpu && \
pip install --pre --upgrade ipex-llm[xpu_2.6]==2.3.0b20250407 --extra-index-url https://download.pytorch.org/whl/xpu && \
pip install transformers_stream_generator einops tiktoken && \
pip install --upgrade colorama && \
#

View file

@ -12211,6 +12211,19 @@ index 000000000..75a99ffc1
+# Pass the collected arguments to the main entrypoint
+exec python3 -m vllm.entrypoints.openai.api_server "${ARGS[@]}"
\ No newline at end of file
diff --git a/requirements-common.txt b/requirements-common.txt
index 6c390bcfd..b22364c5a 100644
--- a/requirements-common.txt
+++ b/requirements-common.txt
@@ -21,7 +21,7 @@ tiktoken >= 0.6.0 # Required for DBRX tokenizer
lm-format-enforcer >= 0.10.9, < 0.11
outlines == 0.1.11 # Requires pytorch
lark == 1.2.2
-xgrammar >= 0.1.6; platform_machine == "x86_64"
+xgrammar <= 0.1.17; platform_machine == "x86_64"
typing_extensions >= 4.10
filelock >= 3.16.1 # need to contain https://github.com/tox-dev/filelock/pull/317
partial-json-parser # used for parsing partial JSON outputs
diff --git a/requirements-neuron.txt b/requirements-neuron.txt
index 148fdbe0d..5e08d101f 100644
--- a/requirements-neuron.txt