2 files changed: +15 -2 lines changed
docker/llm/serving/xpu/docker (2 files changed: +15 -2 lines changed)
@@ -53,7 +53,7 @@ RUN set -eux && \
53 53 dpkg -i *.deb && \
54 54 #
55 55 # Install Intel PyTorch extension for LLM inference
56 - pip install --pre --upgrade ipex-llm[xpu_2.6] --extra-index-url https://download.pytorch.org/whl/xpu && \
56 + pip install --pre --upgrade ipex-llm[xpu_2.6]==2.3.0b20250407 --extra-index-url https://download.pytorch.org/whl/xpu && \
57 57 #
58 58 # Build torch-ccl
59 59 mkdir -p /build && \
@@ -123,7 +123,7 @@ RUN set -eux && \
123 123 wget https://bootstrap.pypa.io/get-pip.py -O get-pip.py && \
124 124 python3 get-pip.py && rm get-pip.py && \
125 125 pip install --upgrade requests argparse urllib3 && \
126 - pip install --pre --upgrade ipex-llm[xpu_2.6] --extra-index-url https://download.pytorch.org/whl/xpu && \
126 + pip install --pre --upgrade ipex-llm[xpu_2.6]==2.3.0b20250407 --extra-index-url https://download.pytorch.org/whl/xpu && \
127 127 pip install transformers_stream_generator einops tiktoken && \
128 128 pip install --upgrade colorama && \
129 129 #
@@ -12211,6 +12211,19 @@ index 000000000..75a99ffc1
12211 12211 +# Pass the collected arguments to the main entrypoint
12212 12212 +exec python3 -m vllm.entrypoints.openai.api_server "${ARGS[@]}"
12213 12213 \ No newline at end of file
12214 + diff --git a/requirements-common.txt b/requirements-common.txt
12215 + index 6c390bcfd..b22364c5a 100644
12216 + --- a/requirements-common.txt
12217 + +++ b/requirements-common.txt
12218 + @@ -21,7 +21,7 @@ tiktoken >= 0.6.0 # Required for DBRX tokenizer
12219 + lm-format-enforcer >= 0.10.9, < 0.11
12220 + outlines == 0.1.11 # Requires pytorch
12221 + lark == 1.2.2
12222 + -xgrammar >= 0.1.6; platform_machine == "x86_64"
12223 + +xgrammar <= 0.1.17; platform_machine == "x86_64"
12224 + typing_extensions >= 4.10
12225 + filelock >= 3.16.1 # need to contain https://github.com/tox-dev/filelock/pull/317
12226 + partial-json-parser # used for parsing partial JSON outputs
12214 12227 diff --git a/requirements-neuron.txt b/requirements-neuron.txt
12215 12228 index 148fdbe0d..5e08d101f 100644
12216 12229 --- a/requirements-neuron.txt
You can’t perform that action at this time.
0 commit comments