# Site navigation data: two link lists, `main` and `lnav`.
# Every entry is a mapping with a display `title` and a target `url`
# (site-relative path or absolute URL). An entry may also carry a
# `children` list of entries with the same shape.

# Flat list of links, including the external docs and GitHub URLs.
# NOTE(review): presumably rendered as the top/masthead navigation -- confirm
# against the theme's templates.
main:
  - title: "Getting Started"
    url: /getting-started/
  - title: "News"
    url: /news/
  - title: "Tutorials"
    url: /tutorials/
  - title: "Documentation"
    url: https://deepspeed.readthedocs.io/
  - title: "GitHub"
    url: https://github.com/microsoft/DeepSpeed

# Two-level list: top-level sections, some with `children` sub-links.
# NOTE(review): presumably rendered as the left sidebar navigation -- confirm
# against the theme's templates.
lnav:
  - title: "Feature Overview"
    url: /features/
  - title: "Getting Started"
    url: /getting-started/
    # Children are in-page anchors on the Getting Started page.
    children:
      - title: "Installation"
        url: /getting-started/#installation
      - title: "Writing models"
        url: /getting-started/#writing-deepspeed-models
      - title: "Training"
        url: /getting-started/#training
      - title: "Launching"
        url: /getting-started/#launching-deepspeed-training
  - title: "Configuration"
    url: /docs/config-json/
    # Children are in-page anchors on the config-json page.
    children:
      - title: "Batch size"
        url: /docs/config-json/#batch-size-related-parameters
      - title: "Optimizer"
        url: /docs/config-json/#optimizer-parameters
      - title: "Scheduler"
        url: /docs/config-json/#scheduler-parameters
      - title: "Communication"
        url: /docs/config-json/#communication-options
      - title: "FP16"
        url: /docs/config-json/#fp16-training-options
      - title: "ZeRO optimizations"
        url: /docs/config-json/#zero-optimizations-for-fp16-training
      - title: "Logging"
        url: /docs/config-json/#logging
      - title: "Activation checkpointing"
        url: /docs/config-json/#activation-checkpointing
  - title: "Tutorials"
    url: /tutorials/
    # Children are separate tutorial pages; the first one links back to the
    # Getting Started page rather than a page under /tutorials/.
    children:
      - title: "Getting started"
        url: /getting-started/
      - title: "Getting started on Azure"
        url: /tutorials/azure/
      - title: "CIFAR-10"
        url: /tutorials/cifar-10/
      - title: "BERT Pre-training"
        url: /tutorials/bert-pretraining/
      - title: "BingBertSQuAD Fine-tuning"
        url: /tutorials/bert-finetuning/
      - title: "DeepSpeed Transformer Kernel"
        url: /tutorials/transformer_kernel/
      - title: "Megatron-LM GPT2"
        url: /tutorials/megatron/
      - title: "1-Cycle Schedule"
        url: /tutorials/1Cycle/
      - title: "Learning Rate Range Test"
        url: /tutorials/lrrt/
      - title: "DeepSpeed Sparse Attention"
        url: /tutorials/sparse-attention/
      - title: "ZeRO-Offload"
        url: /tutorials/zero-offload/
      - title: "ZeRO Redundancy Optimizer (ZeRO)"
        url: /tutorials/zero/
      - title: "DeepSpeed with 1-bit Adam"
        url: /tutorials/onebit-adam/
      - title: "Pipeline Parallelism"
        url: /tutorials/pipeline/
  # NOTE(review): placed at the top level because its URL is not under
  # /tutorials/ -- confirm it is not meant to be a Tutorials child.
  - title: "Contributing"
    url: /contributing/