[NPU] fix transpose_value = False for NPU optimize_model=True (#12525)
This commit is contained in:
parent
588bfa24dc
commit
41ef4974ab
1 changed file with 1 addition and 0 deletions
|
|
@@ -225,6 +225,7 @@ class LLMBaseNNFactory(NNFactory):
|
||||||
head_dim=head_dim,
|
head_dim=head_dim,
|
||||||
)
|
)
|
||||||
new_key_states = key_states
|
new_key_states = key_states
|
||||||
|
new_value_states = value_states
|
||||||
|
|
||||||
if mode == "decode":
|
if mode == "decode":
|
||||||
key_states = self.concat(past_key, key_states, axis=-2)
|
key_states = self.concat(past_key, key_states, axis=-2)
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue