Fix run_decoders bug (#11871)
This commit is contained in:
parent
32f0a77846
commit
bdaeee1d63
1 changed file with 1 addition and 1 deletion
|
|
@@ -601,7 +601,7 @@ class FusedLlamaLowBitMultiDecoderlayer(torch.nn.Module):
|
||||||
x_np[2].ctypes.data_as(ctypes.c_void_p),
|
x_np[2].ctypes.data_as(ctypes.c_void_p),
|
||||||
)
|
)
|
||||||
t0 = time.perf_counter()
|
t0 = time.perf_counter()
|
||||||
backend_lib.run_decoders(models_ptr, inputs_ptr, 2, 3)
|
backend_lib.run_decoders(models_ptr, inputs_ptr, self.intra_stages, 3)
|
||||||
t1 = time.perf_counter()
|
t1 = time.perf_counter()
|
||||||
|
|
||||||
hidden_states = self.backend_decoders[-1].torch_out[0]
|
hidden_states = self.backend_decoders[-1].torch_out[0]
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue