ds_config_func_scheduler.json 449 B

{
  "train_batch_size": 4,
  "gradient_accumulation_steps": 1,
  "steps_per_print": 1,
  "zero_optimization": {
    "stage": 2
  },
  "gradient_clipping": 1.0,
  "scheduler": {
    "type": "WarmupLR",
    "params": {
      "warmup_min_lr": 0,
      "warmup_max_lr": 0.001,
      "warmup_num_steps": 10
    }
  },
  "fp16": {
    "enabled": true,
    "loss_scale": 0,
    "loss_scale_window": 1000,
    "hysteresis": 2,
    "min_loss_scale": 1
  }
}