Upload policy with preprocessor, postprocessor, and model card
Browse files
- config.json +1 -1
- model.safetensors +1 -1
- train_config.json +3 -3
config.json
CHANGED
|
@@ -46,7 +46,7 @@
|
|
| 46 |
]
|
| 47 |
}
|
| 48 |
},
|
| 49 |
-
"device": "cuda
|
| 50 |
"use_amp": false,
|
| 51 |
"push_to_hub": true,
|
| 52 |
"repo_id": "sengi/rabc_pi05",
|
|
|
|
| 46 |
]
|
| 47 |
}
|
| 48 |
},
|
| 49 |
+
"device": "cuda",
|
| 50 |
"use_amp": false,
|
| 51 |
"push_to_hub": true,
|
| 52 |
"repo_id": "sengi/rabc_pi05",
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7473096344
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b64f48176cde4efbe3cd657213f4334a35fb44c46cb1c3ce686968d42acb49ef
|
| 3 |
size 7473096344
|
train_config.json
CHANGED
|
@@ -131,7 +131,7 @@
|
|
| 131 |
]
|
| 132 |
}
|
| 133 |
},
|
| 134 |
-
"device": "cuda
|
| 135 |
"use_amp": false,
|
| 136 |
"compiled": false,
|
| 137 |
"push_to_hub": true,
|
|
@@ -185,13 +185,13 @@
|
|
| 185 |
"compile": true,
|
| 186 |
"strict": true,
|
| 187 |
"loss_threshold": 3.0,
|
| 188 |
-
"output_dir": "outputs/train/2026-02-20/
|
| 189 |
"job_name": "rabc_pi05_finetuning",
|
| 190 |
"resume": false,
|
| 191 |
"resume_scheduler": true,
|
| 192 |
"seed": 3407,
|
| 193 |
"num_workers": 4,
|
| 194 |
-
"batch_size":
|
| 195 |
"gradient_accumulation_steps": 1,
|
| 196 |
"steps": 10000,
|
| 197 |
"eval_freq": 20000,
|
|
|
|
| 131 |
]
|
| 132 |
}
|
| 133 |
},
|
| 134 |
+
"device": "cuda",
|
| 135 |
"use_amp": false,
|
| 136 |
"compiled": false,
|
| 137 |
"push_to_hub": true,
|
|
|
|
| 185 |
"compile": true,
|
| 186 |
"strict": true,
|
| 187 |
"loss_threshold": 3.0,
|
| 188 |
+
"output_dir": "outputs/train/2026-02-20/19-39-30_rabc_pi05_finetuning",
|
| 189 |
"job_name": "rabc_pi05_finetuning",
|
| 190 |
"resume": false,
|
| 191 |
"resume_scheduler": true,
|
| 192 |
"seed": 3407,
|
| 193 |
"num_workers": 4,
|
| 194 |
+
"batch_size": 24,
|
| 195 |
"gradient_accumulation_steps": 1,
|
| 196 |
"steps": 10000,
|
| 197 |
"eval_freq": 20000,
|