hot-fix mistral kv_cache (#9528)
This commit is contained in:
parent
42b7a16bc5
commit
3d24823cda
1 changed file with 5 additions and 0 deletions
|
|
@@ -114,6 +114,11 @@ def mistral_attention_forward(
|
|||
dtype=cache_k.dtype,
|
||||
device=device)
|
||||
|
||||
new_cache_k[:] = cache_k
|
||||
new_cache_v[:] = cache_v
|
||||
cache_k = new_cache_k
|
||||
cache_v = new_cache_v
|
||||
|
||||
key_states, value_states = append_kv_cache(cache_k, cache_v, key_states, value_states)
|
||||
|
||||
elif use_cache:
|
||||
|
|
|
|||
Loading…
Reference in a new issue