[NPU] fix transpose_value = False for NPU optimize_model=True (#12525)
This commit is contained in:
parent
588bfa24dc
commit
41ef4974ab
1 changed file with 1 addition and 0 deletions
|
|
@@ -225,6 +225,7 @@ class LLMBaseNNFactory(NNFactory):
|
|||
head_dim=head_dim,
|
||||
)
|
||||
new_key_states = key_states
|
||||
new_value_states = value_states
|
||||
|
||||
if mode == "decode":
|
||||
key_states = self.concat(past_key, key_states, axis=-2)
|
||||
|
|
|
|||
Loading…
Reference in a new issue