template_zero3.json 485 B

{
  "zero_optimization": {
    "stage": 3,
    "allgather_partitions": true,
    "allgather_bucket_size": 5e8,
    "overlap_comm": false,
    "reduce_scatter": true,
    "reduce_bucket_size": 5e8,
    "contiguous_gradients": false,
    "stage3_max_live_parameters": 1e9,
    "stage3_max_reuse_distance": 1e9,
    "stage3_prefetch_bucket_size": 5e8,
    "stage3_param_persistence_threshold": 1e6,
    "stage3_gather_16bit_weights_on_model_save": false,
    "sub_group_size": 1e12
  }
}