mtasic85 committed on
Commit
f607f01
·
1 Parent(s): fe695cb

pretrain core 4

Browse files
Files changed (1) hide show
  1. scripts/pretrain_core_model_4.yaml +2 -1
scripts/pretrain_core_model_4.yaml CHANGED
@@ -59,7 +59,8 @@ train:
59
 
60
  # Number of samples between optimizer steps across data-parallel ranks (type: int, default: 512)
61
  # global_batch_size: 512
62
- global_batch_size: 256
 
63
 
64
  # Number of samples per data-parallel rank (type: int, default: 4)
65
  micro_batch_size: 1
 
59
 
60
  # Number of samples between optimizer steps across data-parallel ranks (type: int, default: 512)
61
  # global_batch_size: 512
62
+ # global_batch_size: 256
63
+ global_batch_size: 250
64
 
65
  # Number of samples per data-parallel rank (type: int, default: 4)
66
  micro_batch_size: 1