From b23b91407cd6a627702fbf35f03d380c6eaa235e Mon Sep 17 00:00:00 2001
From: Heyang Sun <60865256+Uxito-Ada@users.noreply.github.com>
Date: Fri, 10 Nov 2023 13:51:24 +0800
Subject: [PATCH] fix llm-init on deepspeed missing lib (#9419)

---
 python/llm/dev/benchmark/all-in-one/run-deepspeed-spr.sh | 3 ++-
 python/llm/example/CPU/Deepspeed-AutoTP/run.sh           | 3 ++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/python/llm/dev/benchmark/all-in-one/run-deepspeed-spr.sh b/python/llm/dev/benchmark/all-in-one/run-deepspeed-spr.sh
index 6dd42ed2..25bded0b 100644
--- a/python/llm/dev/benchmark/all-in-one/run-deepspeed-spr.sh
+++ b/python/llm/dev/benchmark/all-in-one/run-deepspeed-spr.sh
@@ -1,7 +1,8 @@
 #!/bin/bash
-source bigdl-nano-init
+source bigdl-llm-init
 unset OMP_NUM_THREADS # deepspeed will set it for each instance automatically
 source /opt/intel/oneccl/env/setvars.sh
+export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:$CONDA_PREFIX/lib
 export WORLD_SIZE=2 # run 1 instance per SPR socket, thus 2 instances on 2 sockets, 96 cores
 export MASTER_ADDR=127.0.0.1
 export CCL_ZE_IPC_EXCHANGE=sockets
diff --git a/python/llm/example/CPU/Deepspeed-AutoTP/run.sh b/python/llm/example/CPU/Deepspeed-AutoTP/run.sh
index f06c4453..1eb07388 100644
--- a/python/llm/example/CPU/Deepspeed-AutoTP/run.sh
+++ b/python/llm/example/CPU/Deepspeed-AutoTP/run.sh
@@ -1,7 +1,8 @@
 #/bin/bash
-source bigdl-nano-init
+source bigdl-llm-init
 unset OMP_NUM_THREADS # deepspeed will set it for each instance automatically
 source /opt/intel/oneccl/env/setvars.sh
+export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:$CONDA_PREFIX/lib
 export WORLD_SIZE=2 # run 1 instance per SPR socket, thus 2 instances on 2 sockets, 96 cores
 export MASTER_ADDR=127.0.0.1
 export CCL_ZE_IPC_EXCHANGE=sockets