ds_batch_config.json 262 B

123456789101112131415
  1. {
  2. "train_batch_size": 2,
  3. "gradient_accumulation_steps": 1,
  4. "optimizer": {
  5. "type": "Adam",
  6. "params": {
  7. "lr": 0.00015
  8. }
  9. },
  10. "gradient_clipping": 1.0,
  11. "fp16": {
  12. "enabled": true,
  13. "loss_scale": 0
  14. }
  15. }