ds_config.json 336 B

12345678910111213141516171819
  1. {
  2. "train_batch_size": 1,
  3. "gradient_accumulation_steps": 1,
  4. "steps_per_print": 1,
  5. "optimizer": {
  6. "type": "Adam",
  7. "params": {
  8. "lr": 0.00015,
  9. "weight_decay": 1e-2
  10. }
  11. },
  12. "fp16": {
  13. "enabled": false,
  14. "loss_scale": 0,
  15. "loss_scale_window": 1000,
  16. "hysteresis": 2,
  17. "min_loss_scale": 1
  18. }
  19. }