From f597a9d4f51e4c51944d0082cc5b23a9cf84e9e4 Mon Sep 17 00:00:00 2001
From: binbin Deng <108676127+plusbang@users.noreply.github.com>
Date: Wed, 25 Oct 2023 12:35:48 +0800
Subject: [PATCH] LLM: update perf test configuration (#9264)

---
 python/llm/test/benchmark/arc-perf-test.yaml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/python/llm/test/benchmark/arc-perf-test.yaml b/python/llm/test/benchmark/arc-perf-test.yaml
index 9b5246bd..580adc50 100644
--- a/python/llm/test/benchmark/arc-perf-test.yaml
+++ b/python/llm/test/benchmark/arc-perf-test.yaml
@@ -8,6 +8,7 @@ local_model_hub: '/mnt/disk1/models'
 warm_up: 1
 num_trials: 3
 num_beams: 1 # default to greedy search
+low_bit: 'sym_int4' # default to use 'sym_int4' (i.e. symmetric int4)
 in_out_pairs:
   - '32-32'
   - '1024-128'