diff --git a/docker/llm/serving/cpu/docker/entrypoint.sh b/docker/llm/serving/cpu/docker/entrypoint.sh index ca0edead..da2ad7de 100644 --- a/docker/llm/serving/cpu/docker/entrypoint.sh +++ b/docker/llm/serving/cpu/docker/entrypoint.sh @@ -171,6 +171,8 @@ else else # Logic for non-controller(worker) mode worker_address="http://$worker_host:$worker_port" + # Apply optimizations from bigdl-llm + source bigdl-llm-init -t # First check if user have set OMP_NUM_THREADS by themselves if [[ -n "${omp_num_threads}" ]]; then echo "Setting OMP_NUM_THREADS to its original value: $omp_num_threads"