30 lines
902 B
Bash
30 lines
902 B
Bash
#!/bin/bash
#
# Runs the GPU inference layer tests (attention, MLP, RMSNorm) filtered to the
# "Mistral" test cases, and reports the elapsed wall-clock time.
#
# Required environment:
#   ANALYTICS_ZOO_ROOT  Root of the repository checkout; the source and test
#                       directories below are derived from it.
#
# Exit status: non-zero as soon as any pytest invocation fails (set -e).

# Fail fast with a clear message instead of silently building paths such as
# "/python/llm/..." when the root is unset or empty.
: "${ANALYTICS_ZOO_ROOT:?ANALYTICS_ZOO_ROOT must be set to the repository root}"

export ANALYTICS_ZOO_ROOT
export LLM_HOME="${ANALYTICS_ZOO_ROOT}/python/llm/src"
export LLM_INFERENCE_TEST_DIR="${ANALYTICS_ZOO_ROOT}/python/llm/test/inference_gpu"

# Runtime settings exported to the test processes.
export USE_XETLA=OFF
export SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS=1
export DEVICE='xpu'

# Abort on the first failing command so a failed test file fails the script.
set -e

echo "# Start testing inference"
start=$(date "+%s")

# Thread-count override, currently disabled:
# if [ -z "$THREAD_NUM" ]; then
#   THREAD_NUM=2
# fi
# export OMP_NUM_THREADS=$THREAD_NUM

# BIGDL_LLM_XMX_DISABLED is exported only while these test files run and is
# removed from the environment again afterwards.
export BIGDL_LLM_XMX_DISABLED=1
for test_file in \
  test_transformers_api_attention.py \
  test_transformers_api_mlp.py \
  test_transformers_api_RMSNorm.py; do
  # Quoted so a test directory containing spaces or glob characters is passed
  # to pytest as a single argument.
  pytest "${LLM_INFERENCE_TEST_DIR}/${test_file}" -v -s -k "Mistral"
done
unset BIGDL_LLM_XMX_DISABLED

now=$(date "+%s")
elapsed=$((now - start))

echo "Bigdl-llm gpu inference tests for transformers 4.34.0 finished"
echo "Time used:${elapsed} seconds"