pretrain core 4
Browse files
scripts/pretrain_core_model_4.yaml
CHANGED
|
@@ -136,10 +136,10 @@ eval:
|
|
| 136 |
|
| 137 |
optimizer:
|
| 138 |
# class_path: torch.optim.AdamW
|
| 139 |
-
class_path: torchao.prototype.low_bit_optim.AdamW8bit
|
| 140 |
# class_path: torchao.prototype.low_bit_optim.AdamW4bit
|
| 141 |
# class_path: bitsandbytes.optim.AdamW8bit
|
| 142 |
-
|
| 143 |
init_args:
|
| 144 |
# (type: float, default: 0.001)
|
| 145 |
lr: 1e-4
|
|
|
|
| 136 |
|
| 137 |
optimizer:
|
| 138 |
# class_path: torch.optim.AdamW
|
| 139 |
+
# class_path: torchao.prototype.low_bit_optim.AdamW8bit
|
| 140 |
# class_path: torchao.prototype.low_bit_optim.AdamW4bit
|
| 141 |
# class_path: bitsandbytes.optim.AdamW8bit
|
| 142 |
+
class_path: bitsandbytes.optim.PagedAdamW8bit
|
| 143 |
init_args:
|
| 144 |
# (type: float, default: 0.001)
|
| 145 |
lr: 1e-4
|