Add check in iGPU perf workflow for results integrity (#11616)
* Add csv check for igpu benchmark workflow (#11610) * add csv check for igpu benchmark workflow * ready to test --------- Co-authored-by: ATMxsp01 <shou.xu@intel.com> * Restore the temporarily removed models in iGPU-perf (#11615) Co-authored-by: ATMxsp01 <shou.xu@intel.com> --------- Co-authored-by: Xu, Shuo <100334393+ATMxsp01@users.noreply.github.com> Co-authored-by: ATMxsp01 <shou.xu@intel.com>
This commit is contained in:
parent
4594a3dd6c
commit
2478e2c14b
2 changed files with 100 additions and 0 deletions
30
.github/workflows/llm_performance_tests.yml
vendored
30
.github/workflows/llm_performance_tests.yml
vendored
|
|
@ -659,6 +659,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\32-32_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -682,6 +684,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\32-32_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test2
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -705,6 +709,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\32-32_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 if %ERRORLEVEL% neq -1073740791 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test3
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -750,6 +756,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -773,6 +781,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test2
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -796,6 +806,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test3
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -840,6 +852,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\2048-256_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -863,6 +877,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\2048-256_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test2
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -886,6 +902,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\2048-256_int4_fp16\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test3
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -930,6 +948,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128_int4_fp16_loadlowbit\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -953,6 +973,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128_int4_fp16_loadlowbit\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test2
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -976,6 +998,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128_int4_fp16_loadlowbit\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test3
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -1019,6 +1043,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -1042,6 +1068,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test2
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
@ -1065,6 +1093,8 @@ jobs:
|
|||
set PYTHONIOENCODING=utf-8
|
||||
python run.py >> %CSV_SAVE_PATH%\1024-128\log\%LOG_FILE% 2>&1
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
python ..\..\..\test\benchmark\igpu-perf\check_csv_results.py --yaml-file config.yaml --suffix test3
|
||||
if %ERRORLEVEL% neq 0 (exit /b 1)
|
||||
|
||||
call conda deactivate
|
||||
|
||||
|
|
|
|||
70
python/llm/test/benchmark/igpu-perf/check_csv_results.py
Normal file
70
python/llm/test/benchmark/igpu-perf/check_csv_results.py
Normal file
|
|
@ -0,0 +1,70 @@
|
|||
#
|
||||
# Copyright 2016 The BigDL Authors.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
#
|
||||
|
||||
# Python program to check if the number of lines in html meets expectation
|
||||
|
||||
import os
|
||||
import sys
|
||||
import argparse
|
||||
import pandas as pd
|
||||
from omegaconf import OmegaConf
|
||||
from datetime import date
|
||||
|
||||
def main():
|
||||
parser = argparse.ArgumentParser(description="check if the number of lines in html meets expectation")
|
||||
parser.add_argument("-y", "--yaml-file", type=str, dest="yaml_name", help="name of yaml", required=True)
|
||||
parser.add_argument("--suffix", type=str, dest="file_suffix", help="the suffix of the csv_file")
|
||||
args = parser.parse_args()
|
||||
|
||||
all_csv_files:list[str] = [file for file in os.listdir() if file.endswith('.csv')]
|
||||
|
||||
conf = OmegaConf.load(args.yaml_name)
|
||||
test_apis : list[str] = conf['test_api']
|
||||
in_out_pairs : list[str] = conf['in_out_pairs']
|
||||
for api in test_apis:
|
||||
for in_out in in_out_pairs:
|
||||
csv_name_info:str = f"{in_out}-{api}-results-"
|
||||
csv_file = [file for file in all_csv_files if (csv_name_info in file) and file.endswith(f"_{args.file_suffix}.csv")][0]
|
||||
|
||||
csv_dataframe = pd.read_csv(csv_file, index_col=0)
|
||||
actual_test_num = len(csv_dataframe)
|
||||
actual_test_cases = []
|
||||
for index, row in csv_dataframe.iterrows():
|
||||
actual_test_cases.append(row['model'] + ":" + row['input/output tokens'].split('-')[0] + ":" + str(row['batch_size']))
|
||||
|
||||
|
||||
all_test_cases = []
|
||||
for model in conf.repo_id:
|
||||
if not OmegaConf.is_list(conf["batch_size"]):
|
||||
batch_list = [conf["batch_size"]]
|
||||
else:
|
||||
batch_list = conf["batch_size"]
|
||||
for batch_size in batch_list:
|
||||
model_id_input = model + ':' + in_out.split('-')[0] + ':' + str(batch_size)
|
||||
all_test_cases.append(model_id_input)
|
||||
exclude_test_cases = []
|
||||
if 'exclude' in conf and conf['exclude'] is not None:
|
||||
exclude_test_cases = conf['exclude']
|
||||
expected_test_num = len(all_test_cases) - len(exclude_test_cases)
|
||||
if actual_test_num != expected_test_num:
|
||||
print("---------------The test cases should be tested!------------")
|
||||
for test_case in all_test_cases:
|
||||
if test_case not in actual_test_cases and test_case not in exclude_test_cases:
|
||||
print(test_case)
|
||||
raise ValueError("The above tests failed. Please check the errors in the log.")
|
||||
|
||||
if __name__ == "__main__":
|
||||
sys.exit(main())
|
||||
Loading…
Reference in a new issue