Logan Adams 297a6840e1 Update clang-format version from 16 to 18. (#5839) 2 月之前
..
StopWatch.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
Timer.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
activation_type.h 38b41dffa1 DeepSpeed-FastGen (#4604) 11 月之前
compat.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
context.h 46bb08c2df Include cublas error details when getting cublas handle fails (#3695) 1 年之前
conversion_utils.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
cpu_adagrad.h 69af361167 CPUAdam fp16 and bf16 support (#5409) 5 月之前
cpu_adam.h 69af361167 CPUAdam fp16 and bf16 support (#5409) 5 月之前
cpu_lion.h 69af361167 CPUAdam fp16 and bf16 support (#5409) 5 月之前
cublas_wrappers.h d3dd8e7454 rocblas -> hipblas changes for ROCm (#5401) 5 月之前
custom_cuda_layers.h 69af361167 CPUAdam fp16 and bf16 support (#5409) 5 月之前
dequantization_utils.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
dropout.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
ds_kernel_utils.h 76c9c69fb1 Rocm warp size fix (#5402) 5 月之前
ds_transformer_cuda.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
feed_forward.h d3dd8e7454 rocblas -> hipblas changes for ROCm (#5401) 5 月之前
gelu.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
gemm_test.h d3dd8e7454 rocblas -> hipblas changes for ROCm (#5401) 5 月之前
general_kernels.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
memory_access_utils.h 3fbd01ccca FP [6,8,12] quantizer op (#5336) 6 月之前
normalize_layer.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
quantization.h 6c86ff393f adding 8bit dequantization kernel for asym fine-grained block quantization in zero-inference (#4450) 1 年之前
quantization_utils.h 48297c4841 improving int4 asymmetric quantization accuracy (#3190) 1 年之前
quantizer.h c7724c6181 Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539) 1 年之前
reduction_utils.h 3fbd01ccca FP [6,8,12] quantizer op (#5336) 6 月之前
simd.h 297a6840e1 Update clang-format version from 16 to 18. (#5839) 2 月之前
softmax.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前
strided_batch_gemm.h d3dd8e7454 rocblas -> hipblas changes for ROCm (#5401) 5 月之前
type_shim.h b361c72761 Update DeepSpeed copyright license to Apache 2.0 (#3111) 1 年之前