.. |
StopWatch.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
Timer.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
activation_type.h
|
38b41dffa1
DeepSpeed-FastGen (#4604)
|
11 月之前 |
compat.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
context.h
|
46bb08c2df
Include cublas error details when getting cublas handle fails (#3695)
|
1 年之前 |
conversion_utils.h
|
c7724c6181
Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539)
|
1 年之前 |
cpu_adagrad.h
|
d873ce6159
[NPU] Fix npu offload bug (#4883)
|
9 月之前 |
cpu_adam.h
|
d873ce6159
[NPU] Fix npu offload bug (#4883)
|
9 月之前 |
cpu_lion.h
|
d873ce6159
[NPU] Fix npu offload bug (#4883)
|
9 月之前 |
cublas_wrappers.h
|
869629c210
Add missing RocBlas include (#4557)
|
1 年之前 |
custom_cuda_layers.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
dequantization_utils.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
dropout.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
ds_kernel_utils.h
|
38b41dffa1
DeepSpeed-FastGen (#4604)
|
11 月之前 |
ds_transformer_cuda.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
feed_forward.h
|
c7724c6181
Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539)
|
1 年之前 |
gelu.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
gemm_test.h
|
c7724c6181
Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539)
|
1 年之前 |
general_kernels.h
|
c7724c6181
Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539)
|
1 年之前 |
memory_access_utils.h
|
3fbd01ccca
FP [6,8,12] quantizer op (#5336)
|
6 月之前 |
normalize_layer.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
quantization.h
|
6c86ff393f
adding 8bit dequantization kernel for asym fine-grained block quantization in zero-inference (#4450)
|
1 年之前 |
quantization_utils.h
|
48297c4841
improving int4 asymmetric quantization accuracy (#3190)
|
1 年之前 |
quantizer.h
|
c7724c6181
Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539)
|
1 年之前 |
reduction_utils.h
|
3fbd01ccca
FP [6,8,12] quantizer op (#5336)
|
6 月之前 |
simd.h
|
f517903162
Fix confusing width in simd_load (#4714)
|
9 月之前 |
softmax.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |
strided_batch_gemm.h
|
c7724c6181
Switch from HIP_PLATFORM_HCC to HIP_PLATFORM_AMD (#4539)
|
1 年之前 |
type_shim.h
|
b361c72761
Update DeepSpeed copyright license to Apache 2.0 (#3111)
|
1 年之前 |