fix a typo in yuan (#10503)

This commit is contained in:
Yishuo Wang 2024-03-22 09:40:04 +08:00 committed by GitHub
parent a7d38bee94
commit f0f317b6cf

View file

@@ -394,7 +394,7 @@ def yuan_attention_forward_origin(
self.head_dim, self.head_dim,
cache_k.size(2), cache_k.size(2),
kv_seq_len + KV_CACHE_ALLOC_BLOCK_LENGTH, kv_seq_len + KV_CACHE_ALLOC_BLOCK_LENGTH,
dtype=cache_k.d_type, dtype=cache_k.dtype,
device=device) device=device)
new_cache_k[:] = cache_k new_cache_k[:] = cache_k
new_cache_v[:] = cache_v new_cache_v[:] = cache_v