Upload checkpoint checkpoint-50
Browse files
checkpoint-50/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 614801160
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ebca23c43e2da93412879287d3ecb22ba143e75a2600955a24c9739b83be1507
|
| 3 |
size 614801160
|
checkpoint-50/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 312742204
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bfa314ed8ffe2040322876ac873f864979ab880ac758867620937ebd26730858
|
| 3 |
size 312742204
|
checkpoint-50/trainer_state.json
CHANGED
|
@@ -13,35 +13,35 @@
|
|
| 13 |
"epoch": 0.05235602094240838,
|
| 14 |
"grad_norm": NaN,
|
| 15 |
"learning_rate": 0.0,
|
| 16 |
-
"loss": 9.
|
| 17 |
"step": 10
|
| 18 |
},
|
| 19 |
{
|
| 20 |
"epoch": 0.10471204188481675,
|
| 21 |
-
"grad_norm":
|
| 22 |
"learning_rate": 3.1413612565445024e-08,
|
| 23 |
-
"loss": 9.
|
| 24 |
"step": 20
|
| 25 |
},
|
| 26 |
{
|
| 27 |
"epoch": 0.15706806282722513,
|
| 28 |
-
"grad_norm":
|
| 29 |
"learning_rate": 1.3612565445026178e-07,
|
| 30 |
-
"loss": 3.
|
| 31 |
"step": 30
|
| 32 |
},
|
| 33 |
{
|
| 34 |
"epoch": 0.2094240837696335,
|
| 35 |
-
"grad_norm":
|
| 36 |
"learning_rate": 2.4083769633507854e-07,
|
| 37 |
-
"loss": 3.
|
| 38 |
"step": 40
|
| 39 |
},
|
| 40 |
{
|
| 41 |
"epoch": 0.2617801047120419,
|
| 42 |
-
"grad_norm":
|
| 43 |
"learning_rate": 3.4554973821989523e-07,
|
| 44 |
-
"loss": 3.
|
| 45 |
"step": 50
|
| 46 |
}
|
| 47 |
],
|
|
|
|
| 13 |
"epoch": 0.05235602094240838,
|
| 14 |
"grad_norm": NaN,
|
| 15 |
"learning_rate": 0.0,
|
| 16 |
+
"loss": 9.7408,
|
| 17 |
"step": 10
|
| 18 |
},
|
| 19 |
{
|
| 20 |
"epoch": 0.10471204188481675,
|
| 21 |
+
"grad_norm": 202209.765625,
|
| 22 |
"learning_rate": 3.1413612565445024e-08,
|
| 23 |
+
"loss": 9.1548,
|
| 24 |
"step": 20
|
| 25 |
},
|
| 26 |
{
|
| 27 |
"epoch": 0.15706806282722513,
|
| 28 |
+
"grad_norm": 27189.787109375,
|
| 29 |
"learning_rate": 1.3612565445026178e-07,
|
| 30 |
+
"loss": 3.8451,
|
| 31 |
"step": 30
|
| 32 |
},
|
| 33 |
{
|
| 34 |
"epoch": 0.2094240837696335,
|
| 35 |
+
"grad_norm": 10457.34765625,
|
| 36 |
"learning_rate": 2.4083769633507854e-07,
|
| 37 |
+
"loss": 3.267,
|
| 38 |
"step": 40
|
| 39 |
},
|
| 40 |
{
|
| 41 |
"epoch": 0.2617801047120419,
|
| 42 |
+
"grad_norm": 8087.2939453125,
|
| 43 |
"learning_rate": 3.4554973821989523e-07,
|
| 44 |
+
"loss": 3.0939,
|
| 45 |
"step": 50
|
| 46 |
}
|
| 47 |
],
|