diff --git a/docker/llm/inference-cpp/Dockerfile b/docker/llm/inference-cpp/Dockerfile
index 2f62b8bf..cb8c2178 100644
--- a/docker/llm/inference-cpp/Dockerfile
+++ b/docker/llm/inference-cpp/Dockerfile
@@ -91,3 +91,5 @@ RUN set -eux && \
     # Clean up unnecessary dependencies to reduce image size
     find /usr/lib/python3/dist-packages/ -name 'blinker*' -exec rm -rf {} + && \
     rm -rf /root/.cache/Cypress
+
+WORKDIR /llm/
diff --git a/docker/llm/inference-cpp/benchmark_llama-cpp.sh b/docker/llm/inference-cpp/benchmark_llama-cpp.sh
index 17bd6a5f..4cd01fd2 100644
--- a/docker/llm/inference-cpp/benchmark_llama-cpp.sh
+++ b/docker/llm/inference-cpp/benchmark_llama-cpp.sh
@@ -6,13 +6,10 @@ init-llama-cpp
 # change the model_path to run
 if [[ "$DEVICE" == "Arc" || "$DEVICE" == "ARC" ]]; then
     source ipex-llm-init -g --device Arc
-    python run.py
 elif [[ "$DEVICE" == "Flex" || "$DEVICE" == "FLEX" ]]; then
     source ipex-llm-init -g --device Flex
-    python run.py
 elif [[ "$DEVICE" == "Max" || "$DEVICE" == "MAX" ]]; then
     source ipex-llm-init -g --device Max
-    python run.py
 else
     echo "Invalid DEVICE specified."
 fi