Modify arc nightly perf to fp16 (#11275)

* change api
* move to pr mode and remove the build
* add batch4 yaml and remove the bigcode
* remove batch4
* revert the starcode
* remove the exclude
* revert

---------

Co-authored-by: Yishuo Wang <yishuo.wang@intel.com>
2024-06-17 13:47:22 +08:00 · 2024-06-17 13:47:22 +08:00 · bca5cbd96c
commit bca5cbd96c
parent a2a5890b48
4 changed files with 4 additions and 4 deletions
--- a/python/llm/test/benchmark/arc-perf-test-batch2.yaml
+++ b/python/llm/test/benchmark/arc-perf-test-batch2.yaml
@@ -29,7 +29,7 @@ in_out_pairs:
  - '1024-128'
  - '2048-256'
 test_api:
-  - "transformer_int4_gpu"  # on Intel GPU
+  - "transformer_int4_fp16_gpu"  # on Intel GPU
 cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api)
 exclude:
  - 'bigcode/starcoder-15.5b-4bit:2048'
--- a/python/llm/test/benchmark/arc-perf-test.yaml
+++ b/python/llm/test/benchmark/arc-perf-test.yaml
@@ -29,7 +29,7 @@ in_out_pairs:
  - '1024-128'
  - '2048-256'
 test_api:
-  - "transformer_int4_gpu"  # on Intel GPU
+  - "transformer_int4_fp16_gpu"  # on Intel GPU
 cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api)
 exclude:
 #  - 'fnlp/moss-moon-003-sft-4bit:1024'
--- a/python/llm/test/benchmark/arc-perf-transformers-437-batch2.yaml
+++ b/python/llm/test/benchmark/arc-perf-transformers-437-batch2.yaml
@@ -15,5 +15,5 @@ in_out_pairs:
  - '1024-128'
  - '2048-256'
 test_api:
-  - "transformer_int4_gpu"  # on Intel GPU
+  - "transformer_int4_fp16_gpu"  # on Intel GPU
 cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api)
--- a/python/llm/test/benchmark/arc-perf-transformers-437.yaml
+++ b/python/llm/test/benchmark/arc-perf-transformers-437.yaml
@@ -15,5 +15,5 @@ in_out_pairs:
  - '1024-128'
  - '2048-256'
 test_api:
-  - "transformer_int4_gpu"  # on Intel GPU
+  - "transformer_int4_fp16_gpu"  # on Intel GPU
 cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api)