Jeff Rasley 3fbd01ccca FP [6,8,12] quantizer op (#5336) 6 月之前
..
StopWatch.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
Timer.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
activation_type.h 38b41dffa1 DeepSpeed-FastGen (#4604) 11 月之前
compat.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
context.h 46bb08c2df Include cublas error details when getting cublas handle fails (#3695) 1 年之前
conversion_utils.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
cpu_adagrad.h d873ce6159 [NPU] Fix npu offload bug (#4883) 9 月之前
cpu_adam.h d873ce6159 [NPU] Fix npu offload bug (#4883) 9 月之前
cpu_lion.h d873ce6159 [NPU] Fix npu offload bug (#4883) 9 月之前
cublas_wrappers.h 869629c210 Add missing RocBlas include (#4557) 1 年之前
custom_cuda_layers.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
dequantization_utils.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
dropout.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
ds_kernel_utils.h 38b41dffa1 DeepSpeed-FastGen (#4604) 11 月之前
ds_transformer_cuda.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
feed_forward.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
gelu.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
gemm_test.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
general_kernels.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
memory_access_utils.h 3fbd01ccca FP [6,8,12] quantizer op (#5336) 6 月之前
normalize_layer.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
quantization.h 6c86ff393f adding 8bit dequantization kernel for asym fine-grained block quantization in zero-inference (#4450) 1 年之前
quantization_utils.h 48297c4841 improving int4 asymmetric quantization accuracy (#3190) 1 年之前
quantizer.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
reduction_utils.h 3fbd01ccca FP [6,8,12] quantizer op (#5336) 6 月之前
simd.h f517903162 Fix confusing width in simd_load (#4714) 9 月之前
softmax.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
strided_batch_gemm.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
type_shim.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前