From 94723bb0b13e11b5fda63cdc7d59b00701453cbd Mon Sep 17 00:00:00 2001
From: pengyb2001 <284261055@qq.com>
Date: Tue, 6 Feb 2024 14:09:14 +0800
Subject: [PATCH] add retry in run llm install part;test arc05 with llama2

---
Review notes (ignored by `git am`):
- `./.github/actions/llm/setup-llm-env` is a local action referenced with
  `uses:`, so it cannot be executed with `bash` from a `run:` script. The
  retry is instead expressed as a second `uses:` step that only runs when
  the first attempt failed.
- This patch was edited by hand: the post-image hash on the `index` line is
  stale, and hunk indentation was reconstructed -- verify the context lines
  against the target file before applying.

 .github/workflows/llm-harness-evaluation.yml | 13 ++++++++++++-
 1 file changed, 12 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/llm-harness-evaluation.yml b/.github/workflows/llm-harness-evaluation.yml
index 59f588db..d270c300 100644
--- a/.github/workflows/llm-harness-evaluation.yml
+++ b/.github/workflows/llm-harness-evaluation.yml
@@ -68,7 +68,7 @@ jobs:
           PR_MATRIX_MODEL_NAME: '["Llama2-7b-guanaco-dolphin-500"]'
           PR_MATRIX_TASK: '["truthfulqa"]'
           PR_MATRIX_PRECISION: '["fp8"]'
-          PR_LABELS: '["self-hosted", "llm", "temp-arc01"]'
+          PR_LABELS: '["self-hosted", "llm", "accuracy2", "accuracy-nightly"]'
         run: |
           echo "model_name=$PR_MATRIX_MODEL_NAME" >> $GITHUB_ENV
           echo "precision=$PR_MATRIX_PRECISION" >> $GITHUB_ENV
@@ -135,9 +135,20 @@ jobs:
         uses: ./.github/actions/llm/download-llm-binary
 
       - name: Run LLM install (all) test
+        # First attempt. A failure here must not fail the job, because the
+        # next step repeats the install once when this attempt did not
+        # succeed.
+        id: llm-install
+        continue-on-error: true
         uses: ./.github/actions/llm/setup-llm-env
         with:
           extra-dependency: "xpu_2.1"
 
+      - name: Run LLM install (all) test (retry)
+        if: steps.llm-install.outcome == 'failure'
+        uses: ./.github/actions/llm/setup-llm-env
+        with:
+          extra-dependency: "xpu_2.1"
+
       - name: Install harness
         working-directory: ${{ github.workspace }}/python/llm/dev/benchmark/harness/