File tree Expand file tree Collapse file tree 4 files changed +8
-8
lines changed
launcher_scripts/conf/training/gpt3 Expand file tree Collapse file tree 4 files changed +8
-8
lines changed Original file line number Diff line number Diff line change @@ -47,7 +47,7 @@ exp_manager:
4747 buffer_size : 5
4848
4949model :
50- micro_batch_size : 4
50+ micro_batch_size : 2
5151 global_batch_size : 512
5252 tensor_model_parallel_size : 1
5353 pipeline_model_parallel_size : 1
Original file line number Diff line number Diff line change @@ -13,7 +13,7 @@ trainer:
1313 enable_checkpointing : False
1414 replace_sampler_ddp : False
1515 max_epochs : null
16- max_steps : 200000 # consumed_samples = global_step * global_batch_size
16+ max_steps : 100000 # consumed_samples = global_step * global_batch_size
1717 max_time : " 6:11:00:00" # days:hours:minutes:seconds
1818 log_every_n_steps : 10
1919 val_check_interval : 2000
@@ -48,9 +48,9 @@ exp_manager:
4848
4949model :
5050 micro_batch_size : 2
51- global_batch_size : 768
52- tensor_model_parallel_size : 4
53- pipeline_model_parallel_size : 4
51+ global_batch_size : 1536
52+ tensor_model_parallel_size : 8
53+ pipeline_model_parallel_size : 2
5454 virtual_pipeline_model_parallel_size : null
5555 encoder_seq_length : 2048
5656 max_position_embeddings : 2048
Original file line number Diff line number Diff line change @@ -47,7 +47,7 @@ exp_manager:
4747 buffer_size : 5
4848
4949model :
50- micro_batch_size : 2
50+ micro_batch_size : 4
5151 global_batch_size : 256
5252 tensor_model_parallel_size : 1
5353 pipeline_model_parallel_size : 1
@@ -207,4 +207,4 @@ model:
207207 - .0333
208208 - ${data_dir}/my-gpt3_28_text_document
209209 - .0334
210- - ${data_dir}/my-gpt3_29_text_document
210+ - ${data_dir}/my-gpt3_29_text_document
Original file line number Diff line number Diff line change @@ -47,7 +47,7 @@ exp_manager:
4747 buffer_size : 5
4848
4949model :
50- micro_batch_size : 4
50+ micro_batch_size : 2
5151 global_batch_size : 512
5252 tensor_model_parallel_size : 2
5353 pipeline_model_parallel_size : 1
You can’t perform that action at this time.
0 commit comments