diff --git a/python/llm/src/ipex_llm/transformers/models/baichuan.py b/python/llm/src/ipex_llm/transformers/models/baichuan.py index d91eb1e7..9d4688df 100644 --- a/python/llm/src/ipex_llm/transformers/models/baichuan.py +++ b/python/llm/src/ipex_llm/transformers/models/baichuan.py @@ -277,8 +277,8 @@ def baichuan_attention_forward_7b( else: enough_kv_room = is_enough_kv_cache_room_4_36(past_key_value, - self.layer_idx, - q_len) + self.layer_idx, + q_len) key_states, value_states = past_key_value.update( key_states, value_states, self.layer_idx, query_states, attention_mask, 1,