1234567891011121314151617181920212223242526272829303132333435363738394041424344 |
- """
- Copyright 2020 The Microsoft DeepSpeed Team
- """
- from .builder import CUDAOpBuilder
- class TransformerBuilder(CUDAOpBuilder):
- BUILD_VAR = "DS_BUILD_TRANSFORMER"
- NAME = "transformer"
- def __init__(self, name=None):
- name = self.NAME if name is None else name
- super().__init__(name=name)
- def absolute_name(self):
- return f'deepspeed.ops.transformer.{self.NAME}_op'
- def extra_ldflags(self):
- if not self.is_rocm_pytorch():
- return ['-lcurand']
- else:
- return []
- def sources(self):
- return [
- 'csrc/transformer/ds_transformer_cuda.cpp',
- 'csrc/transformer/cublas_wrappers.cu',
- 'csrc/transformer/transform_kernels.cu',
- 'csrc/transformer/gelu_kernels.cu',
- 'csrc/transformer/dropout_kernels.cu',
- 'csrc/transformer/normalize_kernels.cu',
- 'csrc/transformer/softmax_kernels.cu',
- 'csrc/transformer/general_kernels.cu'
- ]
- def include_paths(self):
- includes = ['csrc/includes']
- if self.is_rocm_pytorch():
- from torch.utils.cpp_extension import ROCM_HOME
- includes += [
- '{}/hiprand/include'.format(ROCM_HOME),
- '{}/rocrand/include'.format(ROCM_HOME)
- ]
- return includes
|