Training in progress, step 10000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/rng_state_4.pth +1 -1
- last-checkpoint/rng_state_5.pth +1 -1
- last-checkpoint/rng_state_6.pth +1 -1
- last-checkpoint/rng_state_7.pth +1 -1
- last-checkpoint/text_renderer_config.json +17 -5
- last-checkpoint/trainer_state.json +93 -93
- last-checkpoint/training_args.bin +1 -1
- pytorch_model.bin +1 -1
- text_renderer_config.json +17 -5
- training_args.bin +1 -1
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 202193937
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec52caad045b3f34632491a3e60266fca49fb4a8996857ded69858dac82d39b4
|
| 3 |
size 202193937
|
last-checkpoint/pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 102501541
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4934ec353ee8c0b201d8896e01193b73d8d525ed3d2c04d990e1d6af1e4f1ff
|
| 3 |
size 102501541
|
last-checkpoint/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
| 3 |
size 14503
|
last-checkpoint/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
| 3 |
size 14503
|
last-checkpoint/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
| 3 |
size 14503
|
last-checkpoint/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
| 3 |
size 14503
|
last-checkpoint/rng_state_4.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
| 3 |
size 14503
|
last-checkpoint/rng_state_5.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
| 3 |
size 14503
|
last-checkpoint/rng_state_6.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
| 3 |
size 14503
|
last-checkpoint/rng_state_7.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
| 3 |
size 14503
|
last-checkpoint/text_renderer_config.json
CHANGED
|
@@ -16,18 +16,20 @@
|
|
| 16 |
"Nimbus Roman",
|
| 17 |
"Nimbus Sans",
|
| 18 |
"Nimbus Sans Narrow",
|
|
|
|
|
|
|
| 19 |
"Noto Kufi Arabic",
|
| 20 |
-
"Noto Looped Lao",
|
| 21 |
-
"Noto Looped Lao UI",
|
| 22 |
"Noto Music",
|
| 23 |
"Noto Naskh Arabic",
|
| 24 |
"Noto Naskh Arabic UI",
|
| 25 |
"Noto Nastaliq Urdu",
|
| 26 |
"Noto Rashi Hebrew",
|
|
|
|
| 27 |
"Noto Sans Adlam",
|
| 28 |
"Noto Sans Adlam Unjoined",
|
| 29 |
"Noto Sans Anatolian Hieroglyphs",
|
| 30 |
"Noto Sans Arabic",
|
|
|
|
| 31 |
"Noto Sans Armenian",
|
| 32 |
"Noto Sans Avestan",
|
| 33 |
"Noto Sans Balinese",
|
|
@@ -86,12 +88,16 @@
|
|
| 86 |
"Noto Sans Kaithi",
|
| 87 |
"Noto Sans Kannada",
|
| 88 |
"Noto Sans Kannada UI",
|
|
|
|
| 89 |
"Noto Sans Kayah Li",
|
| 90 |
"Noto Sans Kharoshthi",
|
| 91 |
"Noto Sans Khmer",
|
| 92 |
"Noto Sans Khmer UI",
|
|
|
|
| 93 |
"Noto Sans Khudawadi",
|
| 94 |
"Noto Sans Lao",
|
|
|
|
|
|
|
| 95 |
"Noto Sans Lao UI",
|
| 96 |
"Noto Sans Lepcha",
|
| 97 |
"Noto Sans Limbu",
|
|
@@ -123,13 +129,15 @@
|
|
| 123 |
"Noto Sans Myanmar UI",
|
| 124 |
"Noto Sans NKo",
|
| 125 |
"Noto Sans Nabataean",
|
|
|
|
| 126 |
"Noto Sans Nandinagari",
|
| 127 |
"Noto Sans New Tai Lue",
|
| 128 |
"Noto Sans Newa",
|
| 129 |
"Noto Sans Nushu",
|
| 130 |
"Noto Sans Ogham",
|
| 131 |
-
"Noto Sans
|
| 132 |
"Noto Sans Old Hungarian",
|
|
|
|
| 133 |
"Noto Sans Old North Arabian",
|
| 134 |
"Noto Sans Old Permic",
|
| 135 |
"Noto Sans Old Persian",
|
|
@@ -142,7 +150,7 @@
|
|
| 142 |
"Noto Sans Pahawh Hmong",
|
| 143 |
"Noto Sans Palmyrene",
|
| 144 |
"Noto Sans Pau Cin Hau",
|
| 145 |
-
"Noto Sans
|
| 146 |
"Noto Sans Phoenician",
|
| 147 |
"Noto Sans Psalter Pahlavi",
|
| 148 |
"Noto Sans Rejang",
|
|
@@ -156,11 +164,15 @@
|
|
| 156 |
"Noto Sans Sinhala",
|
| 157 |
"Noto Sans Sinhala UI",
|
| 158 |
"Noto Sans Sogdian",
|
|
|
|
| 159 |
"Noto Sans Soyombo",
|
|
|
|
| 160 |
"Noto Sans Syloti Nagri",
|
| 161 |
"Noto Sans Symbols",
|
| 162 |
-
"Noto Sans
|
| 163 |
"Noto Sans Syriac",
|
|
|
|
|
|
|
| 164 |
"Noto Sans Tagalog",
|
| 165 |
"Noto Sans Tagbanwa",
|
| 166 |
"Noto Sans Tai Le",
|
|
|
|
| 16 |
"Nimbus Roman",
|
| 17 |
"Nimbus Sans",
|
| 18 |
"Nimbus Sans Narrow",
|
| 19 |
+
"Noto Fangsong KSS Rotated",
|
| 20 |
+
"Noto Fangsong KSS Vertical",
|
| 21 |
"Noto Kufi Arabic",
|
|
|
|
|
|
|
| 22 |
"Noto Music",
|
| 23 |
"Noto Naskh Arabic",
|
| 24 |
"Noto Naskh Arabic UI",
|
| 25 |
"Noto Nastaliq Urdu",
|
| 26 |
"Noto Rashi Hebrew",
|
| 27 |
+
"Noto Sans",
|
| 28 |
"Noto Sans Adlam",
|
| 29 |
"Noto Sans Adlam Unjoined",
|
| 30 |
"Noto Sans Anatolian Hieroglyphs",
|
| 31 |
"Noto Sans Arabic",
|
| 32 |
+
"Noto Sans Arabic UI",
|
| 33 |
"Noto Sans Armenian",
|
| 34 |
"Noto Sans Avestan",
|
| 35 |
"Noto Sans Balinese",
|
|
|
|
| 88 |
"Noto Sans Kaithi",
|
| 89 |
"Noto Sans Kannada",
|
| 90 |
"Noto Sans Kannada UI",
|
| 91 |
+
"Noto Sans Kawi",
|
| 92 |
"Noto Sans Kayah Li",
|
| 93 |
"Noto Sans Kharoshthi",
|
| 94 |
"Noto Sans Khmer",
|
| 95 |
"Noto Sans Khmer UI",
|
| 96 |
+
"Noto Sans Khojki",
|
| 97 |
"Noto Sans Khudawadi",
|
| 98 |
"Noto Sans Lao",
|
| 99 |
+
"Noto Sans Lao Looped",
|
| 100 |
+
"Noto Sans Lao Looped UI",
|
| 101 |
"Noto Sans Lao UI",
|
| 102 |
"Noto Sans Lepcha",
|
| 103 |
"Noto Sans Limbu",
|
|
|
|
| 129 |
"Noto Sans Myanmar UI",
|
| 130 |
"Noto Sans NKo",
|
| 131 |
"Noto Sans Nabataean",
|
| 132 |
+
"Noto Sans Nag Mundari",
|
| 133 |
"Noto Sans Nandinagari",
|
| 134 |
"Noto Sans New Tai Lue",
|
| 135 |
"Noto Sans Newa",
|
| 136 |
"Noto Sans Nushu",
|
| 137 |
"Noto Sans Ogham",
|
| 138 |
+
"Noto Sans Ol Chiki",
|
| 139 |
"Noto Sans Old Hungarian",
|
| 140 |
+
"Noto Sans Old Italic",
|
| 141 |
"Noto Sans Old North Arabian",
|
| 142 |
"Noto Sans Old Permic",
|
| 143 |
"Noto Sans Old Persian",
|
|
|
|
| 150 |
"Noto Sans Pahawh Hmong",
|
| 151 |
"Noto Sans Palmyrene",
|
| 152 |
"Noto Sans Pau Cin Hau",
|
| 153 |
+
"Noto Sans Phags-Pa",
|
| 154 |
"Noto Sans Phoenician",
|
| 155 |
"Noto Sans Psalter Pahlavi",
|
| 156 |
"Noto Sans Rejang",
|
|
|
|
| 164 |
"Noto Sans Sinhala",
|
| 165 |
"Noto Sans Sinhala UI",
|
| 166 |
"Noto Sans Sogdian",
|
| 167 |
+
"Noto Sans Sora Sompeng",
|
| 168 |
"Noto Sans Soyombo",
|
| 169 |
+
"Noto Sans Sundanese",
|
| 170 |
"Noto Sans Syloti Nagri",
|
| 171 |
"Noto Sans Symbols",
|
| 172 |
+
"Noto Sans Symbols 2",
|
| 173 |
"Noto Sans Syriac",
|
| 174 |
+
"Noto Sans Syriac Eastern",
|
| 175 |
+
"Noto Sans Syriac Western",
|
| 176 |
"Noto Sans Tagalog",
|
| 177 |
"Noto Sans Tagbanwa",
|
| 178 |
"Noto Sans Tai Le",
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,216 +1,216 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
-
"epoch":
|
| 5 |
"global_step": 10000,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
| 9 |
"log_history": [
|
| 10 |
{
|
| 11 |
-
"epoch": 0.
|
| 12 |
"learning_rate": 5.999999999999999e-06,
|
| 13 |
-
"loss": 0.
|
| 14 |
"step": 500
|
| 15 |
},
|
| 16 |
{
|
| 17 |
-
"epoch": 0.
|
| 18 |
"learning_rate": 1.1999999999999999e-05,
|
| 19 |
-
"loss": 0.
|
| 20 |
"step": 1000
|
| 21 |
},
|
| 22 |
{
|
| 23 |
-
"epoch": 0.
|
| 24 |
-
"eval_loss": 0.
|
| 25 |
-
"eval_runtime": 1.
|
| 26 |
-
"eval_samples_per_second":
|
| 27 |
-
"eval_steps_per_second":
|
| 28 |
"step": 1000
|
| 29 |
},
|
| 30 |
{
|
| 31 |
-
"epoch": 0.
|
| 32 |
"learning_rate": 1.7999999999999997e-05,
|
| 33 |
-
"loss": 0.
|
| 34 |
"step": 1500
|
| 35 |
},
|
| 36 |
{
|
| 37 |
-
"epoch": 0.
|
| 38 |
"learning_rate": 2.3999999999999997e-05,
|
| 39 |
-
"loss": 0.
|
| 40 |
"step": 2000
|
| 41 |
},
|
| 42 |
{
|
| 43 |
-
"epoch": 0.
|
| 44 |
-
"eval_loss": 0.
|
| 45 |
-
"eval_runtime": 1.
|
| 46 |
-
"eval_samples_per_second":
|
| 47 |
-
"eval_steps_per_second":
|
| 48 |
"step": 2000
|
| 49 |
},
|
| 50 |
{
|
| 51 |
-
"epoch": 0.
|
| 52 |
"learning_rate": 2.9999999999999997e-05,
|
| 53 |
-
"loss": 0.
|
| 54 |
"step": 2500
|
| 55 |
},
|
| 56 |
{
|
| 57 |
-
"epoch": 0.
|
| 58 |
"learning_rate": 3.5999999999999994e-05,
|
| 59 |
-
"loss": 0.
|
| 60 |
"step": 3000
|
| 61 |
},
|
| 62 |
{
|
| 63 |
-
"epoch": 0.
|
| 64 |
-
"eval_loss": 0.
|
| 65 |
-
"eval_runtime": 1.
|
| 66 |
-
"eval_samples_per_second":
|
| 67 |
-
"eval_steps_per_second":
|
| 68 |
"step": 3000
|
| 69 |
},
|
| 70 |
{
|
| 71 |
-
"epoch":
|
| 72 |
"learning_rate": 4.2e-05,
|
| 73 |
-
"loss": 0.
|
| 74 |
"step": 3500
|
| 75 |
},
|
| 76 |
{
|
| 77 |
-
"epoch":
|
| 78 |
"learning_rate": 4.7999999999999994e-05,
|
| 79 |
-
"loss": 0.
|
| 80 |
"step": 4000
|
| 81 |
},
|
| 82 |
{
|
| 83 |
-
"epoch":
|
| 84 |
-
"eval_loss": 0.
|
| 85 |
-
"eval_runtime": 1.
|
| 86 |
-
"eval_samples_per_second":
|
| 87 |
-
"eval_steps_per_second":
|
| 88 |
"step": 4000
|
| 89 |
},
|
| 90 |
{
|
| 91 |
-
"epoch":
|
| 92 |
"learning_rate": 5.399999999999999e-05,
|
| 93 |
-
"loss": 0.
|
| 94 |
"step": 4500
|
| 95 |
},
|
| 96 |
{
|
| 97 |
-
"epoch":
|
| 98 |
"learning_rate": 5.9999999999999995e-05,
|
| 99 |
-
"loss": 0.
|
| 100 |
"step": 5000
|
| 101 |
},
|
| 102 |
{
|
| 103 |
-
"epoch":
|
| 104 |
-
"eval_loss": 0.
|
| 105 |
-
"eval_runtime": 1.
|
| 106 |
-
"eval_samples_per_second":
|
| 107 |
-
"eval_steps_per_second":
|
| 108 |
"step": 5000
|
| 109 |
},
|
| 110 |
{
|
| 111 |
-
"epoch":
|
| 112 |
"learning_rate": 6.599999999999999e-05,
|
| 113 |
-
"loss": 0.
|
| 114 |
"step": 5500
|
| 115 |
},
|
| 116 |
{
|
| 117 |
-
"epoch":
|
| 118 |
"learning_rate": 7.199999999999999e-05,
|
| 119 |
-
"loss": 0.
|
| 120 |
"step": 6000
|
| 121 |
},
|
| 122 |
{
|
| 123 |
-
"epoch":
|
| 124 |
-
"eval_loss": 0.
|
| 125 |
-
"eval_runtime": 1.
|
| 126 |
-
"eval_samples_per_second":
|
| 127 |
-
"eval_steps_per_second":
|
| 128 |
"step": 6000
|
| 129 |
},
|
| 130 |
{
|
| 131 |
-
"epoch":
|
| 132 |
"learning_rate": 7.8e-05,
|
| 133 |
-
"loss": 0.
|
| 134 |
"step": 6500
|
| 135 |
},
|
| 136 |
{
|
| 137 |
-
"epoch":
|
| 138 |
"learning_rate": 8.4e-05,
|
| 139 |
-
"loss": 0.
|
| 140 |
"step": 7000
|
| 141 |
},
|
| 142 |
{
|
| 143 |
-
"epoch":
|
| 144 |
-
"eval_loss": 0.
|
| 145 |
-
"eval_runtime": 1.
|
| 146 |
-
"eval_samples_per_second":
|
| 147 |
-
"eval_steps_per_second":
|
| 148 |
"step": 7000
|
| 149 |
},
|
| 150 |
{
|
| 151 |
-
"epoch":
|
| 152 |
"learning_rate": 8.999999999999999e-05,
|
| 153 |
-
"loss": 0.
|
| 154 |
"step": 7500
|
| 155 |
},
|
| 156 |
{
|
| 157 |
-
"epoch":
|
| 158 |
"learning_rate": 9.599999999999999e-05,
|
| 159 |
-
"loss": 0.
|
| 160 |
"step": 8000
|
| 161 |
},
|
| 162 |
{
|
| 163 |
-
"epoch":
|
| 164 |
-
"eval_loss": 0.
|
| 165 |
-
"eval_runtime": 1.
|
| 166 |
-
"eval_samples_per_second":
|
| 167 |
-
"eval_steps_per_second":
|
| 168 |
"step": 8000
|
| 169 |
},
|
| 170 |
{
|
| 171 |
-
"epoch":
|
| 172 |
"learning_rate": 0.000102,
|
| 173 |
-
"loss": 0.
|
| 174 |
"step": 8500
|
| 175 |
},
|
| 176 |
{
|
| 177 |
-
"epoch":
|
| 178 |
"learning_rate": 0.00010799999999999998,
|
| 179 |
-
"loss": 0.
|
| 180 |
"step": 9000
|
| 181 |
},
|
| 182 |
{
|
| 183 |
-
"epoch":
|
| 184 |
-
"eval_loss": 0.
|
| 185 |
-
"eval_runtime": 1.
|
| 186 |
-
"eval_samples_per_second":
|
| 187 |
-
"eval_steps_per_second":
|
| 188 |
"step": 9000
|
| 189 |
},
|
| 190 |
{
|
| 191 |
-
"epoch":
|
| 192 |
"learning_rate": 0.00011399999999999999,
|
| 193 |
-
"loss": 0.
|
| 194 |
"step": 9500
|
| 195 |
},
|
| 196 |
{
|
| 197 |
-
"epoch":
|
| 198 |
"learning_rate": 0.00011999999999999999,
|
| 199 |
-
"loss": 0.
|
| 200 |
"step": 10000
|
| 201 |
},
|
| 202 |
{
|
| 203 |
-
"epoch":
|
| 204 |
-
"eval_loss": 0.
|
| 205 |
-
"eval_runtime": 1.
|
| 206 |
-
"eval_samples_per_second":
|
| 207 |
-
"eval_steps_per_second":
|
| 208 |
"step": 10000
|
| 209 |
}
|
| 210 |
],
|
| 211 |
"max_steps": 500000,
|
| 212 |
-
"num_train_epochs":
|
| 213 |
-
"total_flos": 3.
|
| 214 |
"trial_name": null,
|
| 215 |
"trial_params": null
|
| 216 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
+
"epoch": 0.22305496074232692,
|
| 5 |
"global_step": 10000,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
| 9 |
"log_history": [
|
| 10 |
{
|
| 11 |
+
"epoch": 0.01,
|
| 12 |
"learning_rate": 5.999999999999999e-06,
|
| 13 |
+
"loss": 0.9165,
|
| 14 |
"step": 500
|
| 15 |
},
|
| 16 |
{
|
| 17 |
+
"epoch": 0.02,
|
| 18 |
"learning_rate": 1.1999999999999999e-05,
|
| 19 |
+
"loss": 0.7051,
|
| 20 |
"step": 1000
|
| 21 |
},
|
| 22 |
{
|
| 23 |
+
"epoch": 0.02,
|
| 24 |
+
"eval_loss": 0.6818633079528809,
|
| 25 |
+
"eval_runtime": 1.9324,
|
| 26 |
+
"eval_samples_per_second": 1188.697,
|
| 27 |
+
"eval_steps_per_second": 18.63,
|
| 28 |
"step": 1000
|
| 29 |
},
|
| 30 |
{
|
| 31 |
+
"epoch": 0.03,
|
| 32 |
"learning_rate": 1.7999999999999997e-05,
|
| 33 |
+
"loss": 0.6818,
|
| 34 |
"step": 1500
|
| 35 |
},
|
| 36 |
{
|
| 37 |
+
"epoch": 0.04,
|
| 38 |
"learning_rate": 2.3999999999999997e-05,
|
| 39 |
+
"loss": 0.6808,
|
| 40 |
"step": 2000
|
| 41 |
},
|
| 42 |
{
|
| 43 |
+
"epoch": 0.04,
|
| 44 |
+
"eval_loss": 0.6788448691368103,
|
| 45 |
+
"eval_runtime": 1.762,
|
| 46 |
+
"eval_samples_per_second": 1303.62,
|
| 47 |
+
"eval_steps_per_second": 20.431,
|
| 48 |
"step": 2000
|
| 49 |
},
|
| 50 |
{
|
| 51 |
+
"epoch": 0.06,
|
| 52 |
"learning_rate": 2.9999999999999997e-05,
|
| 53 |
+
"loss": 0.6804,
|
| 54 |
"step": 2500
|
| 55 |
},
|
| 56 |
{
|
| 57 |
+
"epoch": 0.07,
|
| 58 |
"learning_rate": 3.5999999999999994e-05,
|
| 59 |
+
"loss": 0.6803,
|
| 60 |
"step": 3000
|
| 61 |
},
|
| 62 |
{
|
| 63 |
+
"epoch": 0.07,
|
| 64 |
+
"eval_loss": 0.678871750831604,
|
| 65 |
+
"eval_runtime": 1.9035,
|
| 66 |
+
"eval_samples_per_second": 1206.735,
|
| 67 |
+
"eval_steps_per_second": 18.913,
|
| 68 |
"step": 3000
|
| 69 |
},
|
| 70 |
{
|
| 71 |
+
"epoch": 0.08,
|
| 72 |
"learning_rate": 4.2e-05,
|
| 73 |
+
"loss": 0.6801,
|
| 74 |
"step": 3500
|
| 75 |
},
|
| 76 |
{
|
| 77 |
+
"epoch": 0.09,
|
| 78 |
"learning_rate": 4.7999999999999994e-05,
|
| 79 |
+
"loss": 0.68,
|
| 80 |
"step": 4000
|
| 81 |
},
|
| 82 |
{
|
| 83 |
+
"epoch": 0.09,
|
| 84 |
+
"eval_loss": 0.6781899333000183,
|
| 85 |
+
"eval_runtime": 1.9139,
|
| 86 |
+
"eval_samples_per_second": 1200.176,
|
| 87 |
+
"eval_steps_per_second": 18.81,
|
| 88 |
"step": 4000
|
| 89 |
},
|
| 90 |
{
|
| 91 |
+
"epoch": 0.1,
|
| 92 |
"learning_rate": 5.399999999999999e-05,
|
| 93 |
+
"loss": 0.6798,
|
| 94 |
"step": 4500
|
| 95 |
},
|
| 96 |
{
|
| 97 |
+
"epoch": 0.11,
|
| 98 |
"learning_rate": 5.9999999999999995e-05,
|
| 99 |
+
"loss": 0.6796,
|
| 100 |
"step": 5000
|
| 101 |
},
|
| 102 |
{
|
| 103 |
+
"epoch": 0.11,
|
| 104 |
+
"eval_loss": 0.6784412860870361,
|
| 105 |
+
"eval_runtime": 1.8311,
|
| 106 |
+
"eval_samples_per_second": 1254.405,
|
| 107 |
+
"eval_steps_per_second": 19.66,
|
| 108 |
"step": 5000
|
| 109 |
},
|
| 110 |
{
|
| 111 |
+
"epoch": 0.12,
|
| 112 |
"learning_rate": 6.599999999999999e-05,
|
| 113 |
+
"loss": 0.6792,
|
| 114 |
"step": 5500
|
| 115 |
},
|
| 116 |
{
|
| 117 |
+
"epoch": 0.13,
|
| 118 |
"learning_rate": 7.199999999999999e-05,
|
| 119 |
+
"loss": 0.6788,
|
| 120 |
"step": 6000
|
| 121 |
},
|
| 122 |
{
|
| 123 |
+
"epoch": 0.13,
|
| 124 |
+
"eval_loss": 0.67804354429245,
|
| 125 |
+
"eval_runtime": 1.8509,
|
| 126 |
+
"eval_samples_per_second": 1240.986,
|
| 127 |
+
"eval_steps_per_second": 19.449,
|
| 128 |
"step": 6000
|
| 129 |
},
|
| 130 |
{
|
| 131 |
+
"epoch": 0.14,
|
| 132 |
"learning_rate": 7.8e-05,
|
| 133 |
+
"loss": 0.6783,
|
| 134 |
"step": 6500
|
| 135 |
},
|
| 136 |
{
|
| 137 |
+
"epoch": 0.16,
|
| 138 |
"learning_rate": 8.4e-05,
|
| 139 |
+
"loss": 0.678,
|
| 140 |
"step": 7000
|
| 141 |
},
|
| 142 |
{
|
| 143 |
+
"epoch": 0.16,
|
| 144 |
+
"eval_loss": 0.6776260733604431,
|
| 145 |
+
"eval_runtime": 1.8893,
|
| 146 |
+
"eval_samples_per_second": 1215.825,
|
| 147 |
+
"eval_steps_per_second": 19.055,
|
| 148 |
"step": 7000
|
| 149 |
},
|
| 150 |
{
|
| 151 |
+
"epoch": 0.17,
|
| 152 |
"learning_rate": 8.999999999999999e-05,
|
| 153 |
+
"loss": 0.6778,
|
| 154 |
"step": 7500
|
| 155 |
},
|
| 156 |
{
|
| 157 |
+
"epoch": 0.18,
|
| 158 |
"learning_rate": 9.599999999999999e-05,
|
| 159 |
+
"loss": 0.678,
|
| 160 |
"step": 8000
|
| 161 |
},
|
| 162 |
{
|
| 163 |
+
"epoch": 0.18,
|
| 164 |
+
"eval_loss": 0.6782737374305725,
|
| 165 |
+
"eval_runtime": 1.8707,
|
| 166 |
+
"eval_samples_per_second": 1227.889,
|
| 167 |
+
"eval_steps_per_second": 19.244,
|
| 168 |
"step": 8000
|
| 169 |
},
|
| 170 |
{
|
| 171 |
+
"epoch": 0.19,
|
| 172 |
"learning_rate": 0.000102,
|
| 173 |
+
"loss": 0.6783,
|
| 174 |
"step": 8500
|
| 175 |
},
|
| 176 |
{
|
| 177 |
+
"epoch": 0.2,
|
| 178 |
"learning_rate": 0.00010799999999999998,
|
| 179 |
+
"loss": 0.6672,
|
| 180 |
"step": 9000
|
| 181 |
},
|
| 182 |
{
|
| 183 |
+
"epoch": 0.2,
|
| 184 |
+
"eval_loss": 0.6526092290878296,
|
| 185 |
+
"eval_runtime": 1.8141,
|
| 186 |
+
"eval_samples_per_second": 1266.219,
|
| 187 |
+
"eval_steps_per_second": 19.845,
|
| 188 |
"step": 9000
|
| 189 |
},
|
| 190 |
{
|
| 191 |
+
"epoch": 0.21,
|
| 192 |
"learning_rate": 0.00011399999999999999,
|
| 193 |
+
"loss": 0.6453,
|
| 194 |
"step": 9500
|
| 195 |
},
|
| 196 |
{
|
| 197 |
+
"epoch": 0.22,
|
| 198 |
"learning_rate": 0.00011999999999999999,
|
| 199 |
+
"loss": 0.632,
|
| 200 |
"step": 10000
|
| 201 |
},
|
| 202 |
{
|
| 203 |
+
"epoch": 0.22,
|
| 204 |
+
"eval_loss": 0.6212196350097656,
|
| 205 |
+
"eval_runtime": 1.9366,
|
| 206 |
+
"eval_samples_per_second": 1186.109,
|
| 207 |
+
"eval_steps_per_second": 18.589,
|
| 208 |
"step": 10000
|
| 209 |
}
|
| 210 |
],
|
| 211 |
"max_steps": 500000,
|
| 212 |
+
"num_train_epochs": 12,
|
| 213 |
+
"total_flos": 3.194871387745e+20,
|
| 214 |
"trial_name": null,
|
| 215 |
"trial_params": null
|
| 216 |
}
|
last-checkpoint/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3311
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:229efc1d49e061de5d19e6e496114be212e29dd2150b027ea46959c2a5a56c0b
|
| 3 |
size 3311
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 102501541
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4934ec353ee8c0b201d8896e01193b73d8d525ed3d2c04d990e1d6af1e4f1ff
|
| 3 |
size 102501541
|
text_renderer_config.json
CHANGED
|
@@ -16,18 +16,20 @@
|
|
| 16 |
"Nimbus Roman",
|
| 17 |
"Nimbus Sans",
|
| 18 |
"Nimbus Sans Narrow",
|
|
|
|
|
|
|
| 19 |
"Noto Kufi Arabic",
|
| 20 |
-
"Noto Looped Lao",
|
| 21 |
-
"Noto Looped Lao UI",
|
| 22 |
"Noto Music",
|
| 23 |
"Noto Naskh Arabic",
|
| 24 |
"Noto Naskh Arabic UI",
|
| 25 |
"Noto Nastaliq Urdu",
|
| 26 |
"Noto Rashi Hebrew",
|
|
|
|
| 27 |
"Noto Sans Adlam",
|
| 28 |
"Noto Sans Adlam Unjoined",
|
| 29 |
"Noto Sans Anatolian Hieroglyphs",
|
| 30 |
"Noto Sans Arabic",
|
|
|
|
| 31 |
"Noto Sans Armenian",
|
| 32 |
"Noto Sans Avestan",
|
| 33 |
"Noto Sans Balinese",
|
|
@@ -86,12 +88,16 @@
|
|
| 86 |
"Noto Sans Kaithi",
|
| 87 |
"Noto Sans Kannada",
|
| 88 |
"Noto Sans Kannada UI",
|
|
|
|
| 89 |
"Noto Sans Kayah Li",
|
| 90 |
"Noto Sans Kharoshthi",
|
| 91 |
"Noto Sans Khmer",
|
| 92 |
"Noto Sans Khmer UI",
|
|
|
|
| 93 |
"Noto Sans Khudawadi",
|
| 94 |
"Noto Sans Lao",
|
|
|
|
|
|
|
| 95 |
"Noto Sans Lao UI",
|
| 96 |
"Noto Sans Lepcha",
|
| 97 |
"Noto Sans Limbu",
|
|
@@ -123,13 +129,15 @@
|
|
| 123 |
"Noto Sans Myanmar UI",
|
| 124 |
"Noto Sans NKo",
|
| 125 |
"Noto Sans Nabataean",
|
|
|
|
| 126 |
"Noto Sans Nandinagari",
|
| 127 |
"Noto Sans New Tai Lue",
|
| 128 |
"Noto Sans Newa",
|
| 129 |
"Noto Sans Nushu",
|
| 130 |
"Noto Sans Ogham",
|
| 131 |
-
"Noto Sans
|
| 132 |
"Noto Sans Old Hungarian",
|
|
|
|
| 133 |
"Noto Sans Old North Arabian",
|
| 134 |
"Noto Sans Old Permic",
|
| 135 |
"Noto Sans Old Persian",
|
|
@@ -142,7 +150,7 @@
|
|
| 142 |
"Noto Sans Pahawh Hmong",
|
| 143 |
"Noto Sans Palmyrene",
|
| 144 |
"Noto Sans Pau Cin Hau",
|
| 145 |
-
"Noto Sans
|
| 146 |
"Noto Sans Phoenician",
|
| 147 |
"Noto Sans Psalter Pahlavi",
|
| 148 |
"Noto Sans Rejang",
|
|
@@ -156,11 +164,15 @@
|
|
| 156 |
"Noto Sans Sinhala",
|
| 157 |
"Noto Sans Sinhala UI",
|
| 158 |
"Noto Sans Sogdian",
|
|
|
|
| 159 |
"Noto Sans Soyombo",
|
|
|
|
| 160 |
"Noto Sans Syloti Nagri",
|
| 161 |
"Noto Sans Symbols",
|
| 162 |
-
"Noto Sans
|
| 163 |
"Noto Sans Syriac",
|
|
|
|
|
|
|
| 164 |
"Noto Sans Tagalog",
|
| 165 |
"Noto Sans Tagbanwa",
|
| 166 |
"Noto Sans Tai Le",
|
|
|
|
| 16 |
"Nimbus Roman",
|
| 17 |
"Nimbus Sans",
|
| 18 |
"Nimbus Sans Narrow",
|
| 19 |
+
"Noto Fangsong KSS Rotated",
|
| 20 |
+
"Noto Fangsong KSS Vertical",
|
| 21 |
"Noto Kufi Arabic",
|
|
|
|
|
|
|
| 22 |
"Noto Music",
|
| 23 |
"Noto Naskh Arabic",
|
| 24 |
"Noto Naskh Arabic UI",
|
| 25 |
"Noto Nastaliq Urdu",
|
| 26 |
"Noto Rashi Hebrew",
|
| 27 |
+
"Noto Sans",
|
| 28 |
"Noto Sans Adlam",
|
| 29 |
"Noto Sans Adlam Unjoined",
|
| 30 |
"Noto Sans Anatolian Hieroglyphs",
|
| 31 |
"Noto Sans Arabic",
|
| 32 |
+
"Noto Sans Arabic UI",
|
| 33 |
"Noto Sans Armenian",
|
| 34 |
"Noto Sans Avestan",
|
| 35 |
"Noto Sans Balinese",
|
|
|
|
| 88 |
"Noto Sans Kaithi",
|
| 89 |
"Noto Sans Kannada",
|
| 90 |
"Noto Sans Kannada UI",
|
| 91 |
+
"Noto Sans Kawi",
|
| 92 |
"Noto Sans Kayah Li",
|
| 93 |
"Noto Sans Kharoshthi",
|
| 94 |
"Noto Sans Khmer",
|
| 95 |
"Noto Sans Khmer UI",
|
| 96 |
+
"Noto Sans Khojki",
|
| 97 |
"Noto Sans Khudawadi",
|
| 98 |
"Noto Sans Lao",
|
| 99 |
+
"Noto Sans Lao Looped",
|
| 100 |
+
"Noto Sans Lao Looped UI",
|
| 101 |
"Noto Sans Lao UI",
|
| 102 |
"Noto Sans Lepcha",
|
| 103 |
"Noto Sans Limbu",
|
|
|
|
| 129 |
"Noto Sans Myanmar UI",
|
| 130 |
"Noto Sans NKo",
|
| 131 |
"Noto Sans Nabataean",
|
| 132 |
+
"Noto Sans Nag Mundari",
|
| 133 |
"Noto Sans Nandinagari",
|
| 134 |
"Noto Sans New Tai Lue",
|
| 135 |
"Noto Sans Newa",
|
| 136 |
"Noto Sans Nushu",
|
| 137 |
"Noto Sans Ogham",
|
| 138 |
+
"Noto Sans Ol Chiki",
|
| 139 |
"Noto Sans Old Hungarian",
|
| 140 |
+
"Noto Sans Old Italic",
|
| 141 |
"Noto Sans Old North Arabian",
|
| 142 |
"Noto Sans Old Permic",
|
| 143 |
"Noto Sans Old Persian",
|
|
|
|
| 150 |
"Noto Sans Pahawh Hmong",
|
| 151 |
"Noto Sans Palmyrene",
|
| 152 |
"Noto Sans Pau Cin Hau",
|
| 153 |
+
"Noto Sans Phags-Pa",
|
| 154 |
"Noto Sans Phoenician",
|
| 155 |
"Noto Sans Psalter Pahlavi",
|
| 156 |
"Noto Sans Rejang",
|
|
|
|
| 164 |
"Noto Sans Sinhala",
|
| 165 |
"Noto Sans Sinhala UI",
|
| 166 |
"Noto Sans Sogdian",
|
| 167 |
+
"Noto Sans Sora Sompeng",
|
| 168 |
"Noto Sans Soyombo",
|
| 169 |
+
"Noto Sans Sundanese",
|
| 170 |
"Noto Sans Syloti Nagri",
|
| 171 |
"Noto Sans Symbols",
|
| 172 |
+
"Noto Sans Symbols 2",
|
| 173 |
"Noto Sans Syriac",
|
| 174 |
+
"Noto Sans Syriac Eastern",
|
| 175 |
+
"Noto Sans Syriac Western",
|
| 176 |
"Noto Sans Tagalog",
|
| 177 |
"Noto Sans Tagbanwa",
|
| 178 |
"Noto Sans Tai Le",
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3311
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:229efc1d49e061de5d19e6e496114be212e29dd2150b027ea46959c2a5a56c0b
|
| 3 |
size 3311
|