mtasic85 committed on
Commit
7c5858c
·
1 Parent(s): 199602f

pretrain core 4

Browse files
Files changed (1) hide show
  1. scripts/pretrain_core_model_4.yaml +2 -2
scripts/pretrain_core_model_4.yaml CHANGED
@@ -136,10 +136,10 @@ eval:
136
 
137
  optimizer:
138
  # class_path: torch.optim.AdamW
139
- class_path: torchao.prototype.low_bit_optim.AdamW8bit
140
  # class_path: torchao.prototype.low_bit_optim.AdamW4bit
141
  # class_path: bitsandbytes.optim.AdamW8bit
142
- # class_path: bitsandbytes.optim.PagedAdamW8bit
143
  init_args:
144
  # (type: float, default: 0.001)
145
  lr: 1e-4
 
136
 
137
  optimizer:
138
  # class_path: torch.optim.AdamW
139
+ # class_path: torchao.prototype.low_bit_optim.AdamW8bit
140
  # class_path: torchao.prototype.low_bit_optim.AdamW4bit
141
  # class_path: bitsandbytes.optim.AdamW8bit
142
+ class_path: bitsandbytes.optim.PagedAdamW8bit
143
  init_args:
144
  # (type: float, default: 0.001)
145
  lr: 1e-4