deepspeed_bsz24_fp32_config.json 298 B

1234567891011121314151617
  1. {
  2. "train_batch_size": 24,
  3. "train_micro_batch_size_per_gpu": 3,
  4. "steps_per_print": 1,
  5. "optimizer": {
  6. "type": "Adam",
  7. "params": {
  8. "lr": 3e-5,
  9. "weight_decay": 0.0,
  10. "bias_correction": false
  11. }
  12. },
  13. "gradient_clipping": 1.0,
  14. "fp16": {
  15. "enabled": false
  16. }
  17. }