Upload metrics.json
Browse files- metrics.json +9 -9
metrics.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"config": {
|
| 3 |
"model_name": "deepseek-ai/DeepSeek-OCR",
|
| 4 |
"output_dir": "/app/trained_model",
|
| 5 |
-
"batch_size":
|
| 6 |
"num_epochs": 3,
|
| 7 |
-
"gradient_accumulation_steps":
|
| 8 |
"max_length": 512,
|
| 9 |
"mixed_precision": "bf16",
|
| 10 |
"optimizer": {
|
|
@@ -63,15 +63,15 @@
|
|
| 63 |
"use_text_projection": false
|
| 64 |
},
|
| 65 |
"metrics": {
|
| 66 |
-
"train_loss": 2.
|
| 67 |
"train_loss_per_epoch": [
|
| 68 |
-
2.
|
| 69 |
-
2.
|
| 70 |
-
2.
|
| 71 |
],
|
| 72 |
"epochs": 3,
|
| 73 |
-
"total_steps":
|
| 74 |
-
"eval_loss": 2.
|
| 75 |
-
"eval_perplexity": 16.
|
| 76 |
}
|
| 77 |
}
|
|
|
|
| 2 |
"config": {
|
| 3 |
"model_name": "deepseek-ai/DeepSeek-OCR",
|
| 4 |
"output_dir": "/app/trained_model",
|
| 5 |
+
"batch_size": 6,
|
| 6 |
"num_epochs": 3,
|
| 7 |
+
"gradient_accumulation_steps": 2,
|
| 8 |
"max_length": 512,
|
| 9 |
"mixed_precision": "bf16",
|
| 10 |
"optimizer": {
|
|
|
|
| 63 |
"use_text_projection": false
|
| 64 |
},
|
| 65 |
"metrics": {
|
| 66 |
+
"train_loss": 2.176753851794596,
|
| 67 |
"train_loss_per_epoch": [
|
| 68 |
+
2.334065725453685,
|
| 69 |
+
2.2217297172861037,
|
| 70 |
+
2.176753851794596
|
| 71 |
],
|
| 72 |
"epochs": 3,
|
| 73 |
+
"total_steps": 10002,
|
| 74 |
+
"eval_loss": 2.795014963263557,
|
| 75 |
+
"eval_perplexity": 16.362873593315534
|
| 76 |
}
|
| 77 |
}
|