Files
DeepSpeed/op_builder/xpu/inference.py
Yizhou Wang b81b197ec3 [XPU] API align with new intel pytorch extension release (#6395)
With the new intel_extension_for_pytorch release, the DeepSpeed kernel API
changed, so the upstream DeepSpeed XPU op builder needs to be aligned with it.

Co-authored-by: Logan Adams <114770087+loadams@users.noreply.github.com>
2024-08-22 17:24:38 +00:00

40 lines
1.1 KiB
Python

# Copyright (c) Microsoft Corporation.
# SPDX-License-Identifier: Apache-2.0
# DeepSpeed Team
from .builder import SYCLOpBuilder
class InferenceBuilder(SYCLOpBuilder):
    """Op builder for the ``transformer_inference`` op on the SYCL/XPU backend.

    Every build-input hook on this class (sources, include paths, linker
    flags, compiler flags) is empty, and :meth:`load` returns kernels that are
    looked up inside ``intel_extension_for_pytorch`` rather than built here.
    """

    BUILD_VAR = "DS_BUILD_TRANSFORMER_INFERENCE"
    NAME = "transformer_inference"

    def __init__(self, name=None):
        """Create the builder, falling back to ``NAME`` when ``name`` is None."""
        name = self.NAME if name is None else name
        super().__init__(name=name)

    def absolute_name(self) -> str:
        """Return the dotted module path for this op, derived from ``NAME``."""
        return f'deepspeed.ops.transformer.inference.{self.NAME}_op'

    def sources(self) -> list:
        """Return the source files to compile: none for this builder.

        An empty list (rather than ``None``) keeps this hook consistent with
        the other build-input hooks below and safe for callers to iterate.
        """
        return []

    def include_paths(self) -> list:
        """Return extra include directories: none for this builder."""
        return []

    def extra_ldflags(self) -> list:
        """Return extra linker flags: none for this builder."""
        return []

    def cxx_args(self) -> list:
        """Return extra C++ compiler arguments: none for this builder."""
        return []

    def load(self):
        """Return the DeepSpeed inference kernels exposed by IPEX.

        If ``intel_extension_for_pytorch`` has a top-level ``deepspeed``
        attribute, the kernels are taken from
        ``deepspeed.transformer_inference.transformer_inference``; otherwise
        the lookup falls back to ``xpu.deepspeed``.
        NOTE(review): presumably these are the newer and older IPEX layouts
        respectively -- confirm against the IPEX release notes.

        Raises:
            ImportError: if ``intel_extension_for_pytorch`` cannot be
                imported, or an ImportError surfaces during the lookup. The
                original error is attached as the cause.
        """
        try:
            import intel_extension_for_pytorch as ipex

            if hasattr(ipex, "deepspeed"):
                return ipex.deepspeed.transformer_inference.transformer_inference
            return ipex.xpu.deepspeed
        except ImportError as err:
            # Chain explicitly so the underlying import failure stays visible
            # as the direct cause of the user-facing message.
            raise ImportError(
                "Please install intel-extension-for-pytorch >= 2.1.30 to include DeepSpeed kernels.") from err