ds_config_func_bs4_zero2.json 397 B

{
  "train_batch_size": 4,
  "gradient_accumulation_steps": 1,
  "steps_per_print": 1,
  "zero_optimization": {
    "stage": 2,
    "reduce_bucket_size": 7000000,
    "allgather_bucket_size": 7000000,
    "reduce_scatter": true
  },
  "gradient_clipping": 1.0,
  "fp16": {
    "enabled": true,
    "loss_scale": 0,
    "loss_scale_window": 1000,
    "hysteresis": 2,
    "min_loss_scale": 1
  }
}