Skip to content

Commit

Permalink
Fix train_batch size
Browse files (browse the repository at this point in the history)
  • Loading branch information
workingloong committed Jan 2, 2024
1 parent faa5b4f commit caf96e4
Showing 1 changed file with 18 additions and 18 deletions.
36 changes: 18 additions & 18 deletions examples/pytorch/nanogpt/ds_config.json
Original file line number | Diff line number | Diff line change
@@ -1,21 +1,21 @@
 {
 "zero_optimization": {
-"stage": 1,
-"overlap_comm": true,
-"contiguous_gradients": true,
-"sub_group_size": 1e9,
-"reduce_bucket_size": "auto",
-"stage3_prefetch_bucket_size": "auto",
-"stage3_param_persistence_threshold": "auto",
-"stage3_max_live_parameters": 1e9,
-"stage3_max_reuse_distance": 1e9,
-"stage3_gather_fp16_weights_on_model_save": true
-},
+"stage": 1,
+"overlap_comm": true,
+"contiguous_gradients": true,
+"sub_group_size": 1e9,
+"reduce_bucket_size": "auto",
+"stage3_prefetch_bucket_size": "auto",
+"stage3_param_persistence_threshold": "auto",
+"stage3_max_live_parameters": 1e9,
+"stage3_max_reuse_distance": 1e9,
+"stage3_gather_fp16_weights_on_model_save": true
+},

-"gradient_accumulation_steps": 1,
-"gradient_clipping": 0.1,
-"steps_per_print": 100,
-"train_batch_size": 32,
-"train_micro_batch_size_per_gpu": 16,
-"wall_clock_breakdown": false
-}
+"gradient_accumulation_steps": 1,
+"gradient_clipping": 0.1,
+"steps_per_print": 100,
+"train_batch_size": 256,
+"train_micro_batch_size_per_gpu": 16,
+"wall_clock_breakdown": false
+}

0 comments on commit caf96e4

Please sign in to comment.