ipex-llm/python/llm/src/ipex_llm/transformers/bmm.py
Yina Chen b6b70d1ba0
Divide core-xe packages (#11131)
* temp

* add batch

* fix style

* update package name

* fix style

* add workflow

* use temp version to run uts

* trigger performance test

* trigger win igpu perf

* revert workflow & setup
2024-05-28 12:00:18 +08:00

45 lines
1.2 KiB
Python

#
# Copyright 2016 The BigDL Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
import torch
import xe_linear
# Handle on whatever torch.bmm is at import time, captured before any patching
# done by this module, so the wrapper below can always reach it.
torch_bmm_old_ = torch.bmm


def torch_bmm(a, b):
    """Batched matrix multiply that routes non-CPU inputs through ``xe_linear``.

    Dispatch is decided by ``a``:

    * ``a`` on CPU: the call is forwarded unchanged to the saved ``torch.bmm``.
    * ``a`` on any other device with exactly one row per batch
      (``a.size(1) == 1``): the saved ``torch.bmm`` is used, writing into a
      freshly allocated output buffer via ``out=``.
    * otherwise: ``xe_linear.bmm`` is called with contiguous versions of both
      operands and the output buffer.

    Args:
        a: left operand; must be 3-D (its size is unpacked into three values).
        b: right operand; its third dimension sets the output's last dimension.

    Returns:
        The result of the saved ``torch.bmm`` on the CPU path, otherwise the
        output buffer of shape ``(a.size(0), a.size(1), b.size(2))`` on
        ``a.device``.

    Raises:
        ValueError: on the non-CPU path, if ``a`` does not have exactly three
            dimensions (the size unpacking fails).
    """
    if a.device.type != 'cpu':
        n_batch, n_rows, _ = a.size()
        n_cols = b.size(2)
        # NOTE(review): no dtype is passed, so the buffer uses torch's default
        # dtype rather than a.dtype -- confirm this is what both consumers
        # below expect for half-precision inputs.
        result = torch.empty((n_batch, n_rows, n_cols), device=a.device)
        if n_rows == 1:
            torch_bmm_old_(a, b, out=result)
        else:
            # Presumably xe_linear.bmm fills `result` in place (its return
            # value is not used here) -- verify against the xe_linear API.
            xe_linear.bmm(a.contiguous(), b.contiguous(), result)
        return result

    return torch_bmm_old_(a, b)
class SafeBMM:
    """Context manager that installs ``torch_bmm`` as ``torch.bmm`` for a ``with`` block.

    On entry the function currently bound to ``torch.bmm`` is remembered and
    replaced by ``torch_bmm``; on exit the remembered function is put back.
    Because the binding is captured at entry time (not at import time), nested
    ``with SafeBMM():`` blocks unwind correctly: leaving an inner block keeps
    the patch active for the outer one, and a ``torch.bmm`` replacement made by
    other code before entry is preserved afterwards.

    Note that the patch is a process-wide rebinding of the ``torch.bmm``
    attribute, so it affects every caller while the block is active.
    """

    def __init__(self):
        # Fallback restore target, used only if __exit__ runs without a
        # matching __enter__ (keeps the previous attribute for compatibility).
        self._old_bmm = torch_bmm_old_
        # One saved binding per active entry, so the same instance can be
        # entered more than once and still unwind in order.
        self._saved_bmm = []

    def __enter__(self):
        """Patch ``torch.bmm`` and return this manager."""
        self._saved_bmm.append(torch.bmm)
        torch.bmm = torch_bmm
        return self

    def __exit__(self, *args, **kwargs):
        """Restore the binding that was active at the matching entry.

        Returns ``None``, so an exception raised inside the block propagates.
        """
        if self._saved_bmm:
            torch.bmm = self._saved_bmm.pop()
        else:
            torch.bmm = self._old_bmm