ds_config_perf_bs32.json 326 B

{
  "train_batch_size": 32,
  "gradient_accumulation_steps": 1,
  "steps_per_print": 1,
  "zero_optimization": {
    "stage": 1
  },
  "disable_allgather": true,
  "gradient_clipping": 1.0,
  "fp16": {
    "enabled": true,
    "loss_scale": 0,
    "loss_scale_window": 1000,
    "hysteresis": 2,
    "min_loss_scale": 1
  }
}