- Add correctness test on Arc for the LLaMA model
- Modify layer name
- Add Falcon unit test
- Refactor and add unit test for the Falcon model
- Modify lambda positions and update docs
- Replace loading pre-input with the last decoder layer's output
- Switch lower bound to a single model instead of using the common one
- Simplify the code implementation
- Fix GPU action memory-allocation issue
25 lines
530 B
Bash
25 lines
530 B
Bash
#!/bin/bash
# Run the bigdl-llm GPU (Intel XPU) inference test suite with pytest and
# report the elapsed wall-clock time.
#
# Required environment:
#   ANALYTICS_ZOO_ROOT  repository root; all test paths derive from it.
# Optional environment:
#   THREAD_NUM          OpenMP thread count (default: 2).

set -e

# Fail fast with a clear message instead of letting pytest run against an
# empty path when the repo root is not configured.
: "${ANALYTICS_ZOO_ROOT:?ANALYTICS_ZOO_ROOT must be set}"
export ANALYTICS_ZOO_ROOT
export LLM_HOME=${ANALYTICS_ZOO_ROOT}/python/llm/src
export LLM_INFERENCE_TEST_DIR=${ANALYTICS_ZOO_ROOT}/python/llm/test/inference_gpu

# Intel GPU runtime configuration for the test run.
export USE_XETLA=OFF
export DEVICE='xpu'

echo "# Start testing inference"
start=$(date "+%s")

# Default to 2 OpenMP threads unless the caller overrides THREAD_NUM.
export OMP_NUM_THREADS=${THREAD_NUM:-2}

# Quote the directory so a path containing spaces does not word-split.
pytest "${LLM_INFERENCE_TEST_DIR}" -v -s

now=$(date "+%s")
# 'elapsed' rather than 'time', which shadows the shell's time keyword.
elapsed=$((now - start))

echo "Bigdl-llm gpu tests finished"
echo "Time used:$elapsed seconds"