change xmx condition (#10000)

2024-01-25 17:48:11 +08:00 · 2024-01-25 17:48:11 +08:00 · 24b34b6e46
commit 24b34b6e46
parent 8b08ad408b
1 changed files with 3 additions and 4 deletions
--- a/python/llm/src/bigdl/llm/transformers/models/utils.py
+++ b/python/llm/src/bigdl/llm/transformers/models/utils.py
@@ -291,14 +291,13 @@ def mlp_fusion_check(x, qtype, training):
 def use_xmx(x: torch.Tensor, qtype: int):
    device = get_xpu_device_type(x)
    return (
-        device in ["arc", "flex", "pvc"]
+        os.environ.get("BIGDL_LLM_XMX_DISABLED", "0") != "1"
        and device in ["arc", "flex", "pvc"]
        and qtype in [SYM_INT4, SYM_INT8, FP8]
        and (
            (device == "pvc" and 1 < x.size(0) <= 16)
            or
-            (device != "pvc" and x.dtype == torch.float32 and 1 < x.size(0) <= 64)
+            (device != "pvc" and 1 < x.size(0) <= 64)
            or
            1 < x.size(0) <= 8
        )
    )