deepspeed_bsz24_fp16_zero2_config.json 344 B

1234567891011121314151617181920
  1. {
  2. "train_batch_size": 24,
  3. "train_micro_batch_size_per_gpu": 3,
  4. "steps_per_print": 1,
  5. "optimizer": {
  6. "type": "Adam",
  7. "params": {
  8. "lr": 3e-5,
  9. "weight_decay": 0.0,
  10. "bias_correction": false
  11. }
  12. },
  13. "gradient_clipping": 1.0,
  14. "fp16": {
  15. "enabled": true
  16. },
  17. "zero_optimization": {
  18. "stage": 2
  19. }
  20. }