pretrain core 4
Browse files
scripts/pretrain_core_model_4.yaml
CHANGED
@@ -136,10 +136,10 @@ eval:
|
|
136 |
|
137 |
optimizer:
|
138 |
# class_path: torch.optim.AdamW
|
139 |
-
class_path: torchao.prototype.low_bit_optim.AdamW8bit
|
140 |
# class_path: torchao.prototype.low_bit_optim.AdamW4bit
|
141 |
# class_path: bitsandbytes.optim.AdamW8bit
|
142 |
-
|
143 |
init_args:
|
144 |
# (type: float, default: 0.001)
|
145 |
lr: 1e-4
|
|
|
136 |
|
137 |
optimizer:
|
138 |
# class_path: torch.optim.AdamW
|
139 |
+
# class_path: torchao.prototype.low_bit_optim.AdamW8bit
|
140 |
# class_path: torchao.prototype.low_bit_optim.AdamW4bit
|
141 |
# class_path: bitsandbytes.optim.AdamW8bit
|
142 |
+
class_path: bitsandbytes.optim.PagedAdamW8bit
|
143 |
init_args:
|
144 |
# (type: float, default: 0.001)
|
145 |
lr: 1e-4
|