From d8a01d7c4fbfc71e0fea1cfc2a00173e5ac812ea Mon Sep 17 00:00:00 2001
From: Xin Qiu <qiuxin2012@users.noreply.github.com>
Date: Thu, 7 Sep 2023 16:44:10 +0800
Subject: [PATCH] fix chatglm in run.py (#8919)

---
 python/llm/dev/benchmark/all-in-one/run.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/python/llm/dev/benchmark/all-in-one/run.py b/python/llm/dev/benchmark/all-in-one/run.py
index 56d45796..138adc48 100644
--- a/python/llm/dev/benchmark/all-in-one/run.py
+++ b/python/llm/dev/benchmark/all-in-one/run.py
@@ -127,6 +127,8 @@ def run_transformer_int4(repo_id,
             # slice the input_ids to ensure the prompt length is required length.
             input_ids = tokenizer.encode(input_str, return_tensors="pt")
             input_ids = input_ids[:, :in_len]
+            true_str = tokenizer.batch_decode(input_ids)[0]
+            input_ids = tokenizer.encode(true_str, return_tensors="pt")
             result[in_out] = []
             for i in range(num_trials + warm_up):
                 st = time.perf_counter()