mirror of
https://github.com/deepspeedai/DeepSpeed.git
synced 2025-10-21 08:43:50 +08:00
With the new intel_extension_for_pytorch release, the DeepSpeed kernel API changed, so the XPU op builder needs to be aligned with the upstream DeepSpeed XPU op builder. Co-authored-by: Logan Adams <114770087+loadams@users.noreply.github.com>
40 lines
1.1 KiB
Python
40 lines
1.1 KiB
Python
# Copyright (c) Microsoft Corporation.
# SPDX-License-Identifier: Apache-2.0

# DeepSpeed Team

from .builder import SYCLOpBuilder
|
|
|
|
|
|
class InferenceBuilder(SYCLOpBuilder):
    """Op builder for the XPU ``transformer_inference`` op.

    Every build hook on this class (sources, include paths, linker flags,
    C++ flags) reports an empty list, and :meth:`load` returns an object
    taken from the ``intel_extension_for_pytorch`` package instead of a
    module built from local sources.
    """

    BUILD_VAR = "DS_BUILD_TRANSFORMER_INFERENCE"
    NAME = "transformer_inference"

    def __init__(self, name=None):
        """Create the builder.

        Args:
            name: Op name passed to the parent constructor. Falls back to
                :attr:`NAME` when ``None``.
        """
        name = self.NAME if name is None else name
        super().__init__(name=name)

    def absolute_name(self):
        """Return the dotted name string derived from :attr:`NAME`."""
        return f'deepspeed.ops.transformer.inference.{self.NAME}_op'

    def sources(self):
        """Return the list of source files for this op (always empty).

        An empty list is returned rather than ``None`` so the result has the
        same type as the other build hooks and can be iterated safely.
        """
        return []

    def include_paths(self):
        """Return the list of include directories (always empty)."""
        return []

    def extra_ldflags(self):
        """Return the list of extra linker flags (always empty)."""
        return []

    def cxx_args(self):
        """Return the list of extra C++ compiler flags (always empty)."""
        return []

    def load(self):
        """Return the kernel object provided by ``intel_extension_for_pytorch``.

        If the package exposes a top-level ``deepspeed`` attribute, the object
        at ``deepspeed.transformer_inference.transformer_inference`` is
        returned; otherwise ``xpu.deepspeed`` is returned.

        Raises:
            ImportError: If an ``ImportError`` occurs while importing or
                resolving the package; the original error is attached as the
                cause.
        """
        try:
            import intel_extension_for_pytorch as ipex

            if hasattr(ipex, "deepspeed"):
                return ipex.deepspeed.transformer_inference.transformer_inference
            # No top-level ``deepspeed`` attribute: fall back to the ``xpu`` namespace.
            return ipex.xpu.deepspeed
        except ImportError as err:
            # Chain explicitly so the underlying import failure stays visible.
            raise ImportError(
                "Please install intel-extension-for-pytorch >= 2.1.30 to include DeepSpeed kernels.") from err
|