* first draft * fix * add readme for transformer_int4_gpu * fix doc * check device_map * add arc ut test * fix ut test * fix langchain ut * Refine README * fix gpu mem too high * fix ut test --------- Co-authored-by: Ariadne <wyn2000330@126.com>
22 lines
No EOL
518 B
Bash
22 lines
No EOL
518 B
Bash
#!/bin/bash
#
# Runs the bigdl-llm langchain GPU tests with pytest and prints how many
# seconds the run took.
#
# Required environment:
#   ANALYTICS_ZOO_ROOT  Base directory under which python/llm/src and
#                       python/llm/test/langchain_gpu are resolved.
#
# Exit status: non-zero if ANALYTICS_ZOO_ROOT is missing or if pytest fails.

# Abort with a clear message instead of silently building paths rooted at "/"
# when the base directory is unset or empty.
: "${ANALYTICS_ZOO_ROOT:?ANALYTICS_ZOO_ROOT must be set}"

export ANALYTICS_ZOO_ROOT
export LLM_HOME="${ANALYTICS_ZOO_ROOT}/python/llm/src"
export LLM_INFERENCE_TEST_DIR="${ANALYTICS_ZOO_ROOT}/python/llm/test/langchain_gpu"

# Settings exported into the environment of the test process; their effect is
# defined by the libraries that read them, not by this script.
export USE_XETLA=OFF
export SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS=1
export DEVICE='xpu'

# Stop at the first failing command so a pytest failure fails the script.
set -e

echo "# Start testing inference"
start=$(date "+%s")

# Quoted so that a checkout path containing spaces or glob characters is
# passed to pytest as a single argument.
python -m pytest -s "${LLM_INFERENCE_TEST_DIR}"

now=$(date "+%s")
elapsed_seconds=$((now - start))

echo "Bigdl-llm langchain gpu tests finished"
echo "Time used:${elapsed_seconds} seconds"