stage2: Epoch 0/10 - Latest checkpoint
Browse files- statistics.json +3 -17
statistics.json
CHANGED
|
@@ -17,31 +17,17 @@
|
|
| 17 |
"language_4bit_quantized": false,
|
| 18 |
"memory_158bit_quantized": true,
|
| 19 |
"estimated_model_size_mb": 1026.85,
|
| 20 |
-
"epoch":
|
| 21 |
"total_epochs": 10,
|
| 22 |
"stage": "stage2",
|
| 23 |
-
"timestamp": "2025-12-
|
| 24 |
"training_history": [
|
| 25 |
{
|
| 26 |
"epoch": 0,
|
| 27 |
-
"train_loss": 1.
|
| 28 |
"alignment_loss": 0,
|
| 29 |
"learning_rate": 9.786403637412737e-05,
|
| 30 |
"gradient_norm": 0
|
| 31 |
-
},
|
| 32 |
-
{
|
| 33 |
-
"epoch": 1,
|
| 34 |
-
"train_loss": 1.4130540664910034,
|
| 35 |
-
"alignment_loss": 0,
|
| 36 |
-
"learning_rate": 9.098753048166504e-05,
|
| 37 |
-
"gradient_norm": 0
|
| 38 |
-
},
|
| 39 |
-
{
|
| 40 |
-
"epoch": 2,
|
| 41 |
-
"train_loss": 1.353085695717397,
|
| 42 |
-
"alignment_loss": 0,
|
| 43 |
-
"learning_rate": 8.00400991267938e-05,
|
| 44 |
-
"gradient_norm": 0
|
| 45 |
}
|
| 46 |
]
|
| 47 |
}
|
|
|
|
| 17 |
"language_4bit_quantized": false,
|
| 18 |
"memory_158bit_quantized": true,
|
| 19 |
"estimated_model_size_mb": 1026.85,
|
| 20 |
+
"epoch": 0,
|
| 21 |
"total_epochs": 10,
|
| 22 |
"stage": "stage2",
|
| 23 |
+
"timestamp": "2025-12-19T21:35:56.376020",
|
| 24 |
"training_history": [
|
| 25 |
{
|
| 26 |
"epoch": 0,
|
| 27 |
+
"train_loss": 1.7373690557870052,
|
| 28 |
"alignment_loss": 0,
|
| 29 |
"learning_rate": 9.786403637412737e-05,
|
| 30 |
"gradient_norm": 0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
}
|
| 32 |
]
|
| 33 |
}
|