Patch for python/llm/test/benchmark/arc-perf-test.yaml.

Hunk 1 appends 'baichuan-inc/Baichuan2-13B-Chat' to the repo_id list
(after the existing Baichuan2-7B-Chat entry).
Hunk 2 appends 'baichuan-inc/Baichuan2-13B-Chat:2048' to the exclude list.

NOTE(review): the leading whitespace of the YAML list items below was
reconstructed as a two-space indent; confirm against the target file
(or apply with whitespace-tolerant options) before relying on it.

diff --git a/python/llm/test/benchmark/arc-perf-test.yaml b/python/llm/test/benchmark/arc-perf-test.yaml
index a5fbe22f..81c80a27 100644
--- a/python/llm/test/benchmark/arc-perf-test.yaml
+++ b/python/llm/test/benchmark/arc-perf-test.yaml
@@ -13,6 +13,7 @@ repo_id:
   - 'Qwen/Qwen-7B-Chat'
   - 'BAAI/AquilaChat-7B'
   - 'baichuan-inc/Baichuan2-7B-Chat'
+  - 'baichuan-inc/Baichuan2-13B-Chat'
   - 'bigscience/bloomz-7b1'
   - 'fnlp/moss-moon-003-sft'
 local_model_hub: '/mnt/disk1/models'
@@ -30,3 +31,4 @@ cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu w
 exclude:
   - 'fnlp/moss-moon-003-sft:1024'
   - 'fnlp/moss-moon-003-sft:2048'
+  - 'baichuan-inc/Baichuan2-13B-Chat:2048'