parent
7a97fbb779
commit
6bf5a8c230
1 changed files with 1 additions and 1 deletions
|
|
@ -234,7 +234,7 @@ class LowBitQwenMultiDecoderlayer(LLMBaseNNFactory):
|
||||||
print(f"{mode} start compiling")
|
print(f"{mode} start compiling")
|
||||||
if (
|
if (
|
||||||
group_size != 0
|
group_size != 0
|
||||||
and (mode == "prefill" or num_layers == 2)
|
and (mode == "prefill" or num_layers == 2 or num_layers == 3)
|
||||||
and os.environ.get("IPEX_LLM_NPU_DISABLE_COMPILE_OPT", "0") != "1"
|
and os.environ.get("IPEX_LLM_NPU_DISABLE_COMPILE_OPT", "0") != "1"
|
||||||
):
|
):
|
||||||
self.compile(npu_dpu_groups=6)
|
self.compile(npu_dpu_groups=6)
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue