Training in progress, epoch 0
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +117 -220
- training_args.bin +1 -1
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db24cf62c687c65bd405f2992ce91cea20e4854776905f300db496ba68e1636b
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2168a2007ac7107210994cc6a9857a8a19fff0e0a052b4048f43e60307b3c2fa
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b45d19532fe893a0abe2ccec22bb79c13284dca1c92f2a6c4d74b2b4b45fbd4
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:512b5d0932cc6a7a0a6f1faaed400fac2b620942fc6b1b207a76a8c974128b25
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -1,220 +1,117 @@
|
|
| 1 |
-
{"current_steps": 1, "total_steps":
|
| 2 |
-
{"current_steps": 2, "total_steps":
|
| 3 |
-
{"current_steps": 3, "total_steps":
|
| 4 |
-
{"current_steps": 4, "total_steps":
|
| 5 |
-
{"current_steps": 5, "total_steps":
|
| 6 |
-
{"current_steps": 6, "total_steps":
|
| 7 |
-
{"current_steps": 7, "total_steps":
|
| 8 |
-
{"current_steps": 8, "total_steps":
|
| 9 |
-
{"current_steps": 9, "total_steps":
|
| 10 |
-
{"current_steps": 10, "total_steps":
|
| 11 |
-
{"current_steps": 11, "total_steps":
|
| 12 |
-
{"current_steps": 12, "total_steps":
|
| 13 |
-
{"current_steps": 13, "total_steps":
|
| 14 |
-
{"current_steps": 14, "total_steps":
|
| 15 |
-
{"current_steps": 15, "total_steps":
|
| 16 |
-
{"current_steps": 16, "total_steps":
|
| 17 |
-
{"current_steps": 17, "total_steps":
|
| 18 |
-
{"current_steps": 18, "total_steps":
|
| 19 |
-
{"current_steps": 19, "total_steps":
|
| 20 |
-
{"current_steps": 20, "total_steps":
|
| 21 |
-
{"current_steps": 21, "total_steps":
|
| 22 |
-
{"current_steps": 22, "total_steps":
|
| 23 |
-
{"current_steps": 23, "total_steps":
|
| 24 |
-
{"current_steps": 24, "total_steps":
|
| 25 |
-
{"current_steps": 25, "total_steps":
|
| 26 |
-
{"current_steps": 26, "total_steps":
|
| 27 |
-
{"current_steps": 27, "total_steps":
|
| 28 |
-
{"current_steps": 28, "total_steps":
|
| 29 |
-
{"current_steps": 29, "total_steps":
|
| 30 |
-
{"current_steps": 30, "total_steps":
|
| 31 |
-
{"current_steps": 31, "total_steps":
|
| 32 |
-
{"current_steps": 32, "total_steps":
|
| 33 |
-
{"current_steps": 33, "total_steps":
|
| 34 |
-
{"current_steps": 34, "total_steps":
|
| 35 |
-
{"current_steps": 35, "total_steps":
|
| 36 |
-
{"current_steps": 36, "total_steps":
|
| 37 |
-
{"current_steps": 37, "total_steps":
|
| 38 |
-
{"current_steps": 38, "total_steps":
|
| 39 |
-
{"current_steps": 39, "total_steps":
|
| 40 |
-
{"current_steps": 40, "total_steps":
|
| 41 |
-
{"current_steps": 41, "total_steps":
|
| 42 |
-
{"current_steps": 42, "total_steps":
|
| 43 |
-
{"current_steps": 43, "total_steps":
|
| 44 |
-
{"current_steps": 44, "total_steps":
|
| 45 |
-
{"current_steps": 45, "total_steps":
|
| 46 |
-
{"current_steps": 46, "total_steps":
|
| 47 |
-
{"current_steps": 47, "total_steps":
|
| 48 |
-
{"current_steps": 48, "total_steps":
|
| 49 |
-
{"current_steps": 49, "total_steps":
|
| 50 |
-
{"current_steps": 50, "total_steps":
|
| 51 |
-
{"current_steps": 51, "total_steps":
|
| 52 |
-
{"current_steps": 52, "total_steps":
|
| 53 |
-
{"current_steps": 53, "total_steps":
|
| 54 |
-
{"current_steps": 54, "total_steps":
|
| 55 |
-
{"current_steps": 55, "total_steps":
|
| 56 |
-
{"current_steps": 56, "total_steps":
|
| 57 |
-
{"current_steps": 57, "total_steps":
|
| 58 |
-
{"current_steps": 58, "total_steps":
|
| 59 |
-
{"current_steps": 59, "total_steps":
|
| 60 |
-
{"current_steps": 60, "total_steps":
|
| 61 |
-
{"current_steps": 61, "total_steps":
|
| 62 |
-
{"current_steps": 62, "total_steps":
|
| 63 |
-
{"current_steps": 63, "total_steps":
|
| 64 |
-
{"current_steps": 64, "total_steps":
|
| 65 |
-
{"current_steps": 65, "total_steps":
|
| 66 |
-
{"current_steps": 66, "total_steps":
|
| 67 |
-
{"current_steps": 67, "total_steps":
|
| 68 |
-
{"current_steps": 68, "total_steps":
|
| 69 |
-
{"current_steps": 69, "total_steps":
|
| 70 |
-
{"current_steps": 70, "total_steps":
|
| 71 |
-
{"current_steps": 71, "total_steps":
|
| 72 |
-
{"current_steps": 72, "total_steps":
|
| 73 |
-
{"current_steps": 73, "total_steps":
|
| 74 |
-
{"current_steps": 74, "total_steps":
|
| 75 |
-
{"current_steps": 75, "total_steps":
|
| 76 |
-
{"current_steps": 76, "total_steps":
|
| 77 |
-
{"current_steps": 77, "total_steps":
|
| 78 |
-
{"current_steps": 78, "total_steps":
|
| 79 |
-
{"current_steps": 79, "total_steps":
|
| 80 |
-
{"current_steps": 80, "total_steps":
|
| 81 |
-
{"current_steps": 81, "total_steps":
|
| 82 |
-
{"current_steps": 82, "total_steps":
|
| 83 |
-
{"current_steps": 83, "total_steps":
|
| 84 |
-
{"current_steps": 84, "total_steps":
|
| 85 |
-
{"current_steps": 85, "total_steps":
|
| 86 |
-
{"current_steps": 86, "total_steps":
|
| 87 |
-
{"current_steps": 87, "total_steps":
|
| 88 |
-
{"current_steps": 88, "total_steps":
|
| 89 |
-
{"current_steps": 89, "total_steps":
|
| 90 |
-
{"current_steps": 90, "total_steps":
|
| 91 |
-
{"current_steps": 91, "total_steps":
|
| 92 |
-
{"current_steps": 92, "total_steps":
|
| 93 |
-
{"current_steps": 93, "total_steps":
|
| 94 |
-
{"current_steps": 94, "total_steps":
|
| 95 |
-
{"current_steps": 95, "total_steps":
|
| 96 |
-
{"current_steps": 96, "total_steps":
|
| 97 |
-
{"current_steps": 97, "total_steps":
|
| 98 |
-
{"current_steps": 98, "total_steps":
|
| 99 |
-
{"current_steps": 99, "total_steps":
|
| 100 |
-
{"current_steps": 100, "total_steps":
|
| 101 |
-
{"current_steps": 101, "total_steps":
|
| 102 |
-
{"current_steps": 102, "total_steps":
|
| 103 |
-
{"current_steps": 103, "total_steps":
|
| 104 |
-
{"current_steps": 104, "total_steps":
|
| 105 |
-
{"current_steps": 105, "total_steps":
|
| 106 |
-
{"current_steps": 106, "total_steps":
|
| 107 |
-
{"current_steps": 107, "total_steps":
|
| 108 |
-
{"current_steps": 108, "total_steps":
|
| 109 |
-
{"current_steps": 109, "total_steps":
|
| 110 |
-
{"current_steps": 110, "total_steps":
|
| 111 |
-
{"current_steps": 111, "total_steps":
|
| 112 |
-
{"current_steps": 112, "total_steps":
|
| 113 |
-
{"current_steps": 113, "total_steps":
|
| 114 |
-
{"current_steps": 114, "total_steps":
|
| 115 |
-
{"current_steps": 115, "total_steps":
|
| 116 |
-
{"current_steps": 116, "total_steps":
|
| 117 |
-
{"current_steps": 117, "total_steps":
|
| 118 |
-
{"current_steps": 118, "total_steps": 219, "loss": 0.2315, "lr": 5.199286832792553e-06, "epoch": 1.6164383561643836, "percentage": 53.88, "elapsed_time": "0:03:40", "remaining_time": "0:03:09"}
|
| 119 |
-
{"current_steps": 119, "total_steps": 219, "loss": 0.295, "lr": 5.119592375289015e-06, "epoch": 1.6301369863013697, "percentage": 54.34, "elapsed_time": "0:03:43", "remaining_time": "0:03:07"}
|
| 120 |
-
{"current_steps": 120, "total_steps": 219, "loss": 0.2276, "lr": 5.039867504623084e-06, "epoch": 1.643835616438356, "percentage": 54.79, "elapsed_time": "0:03:44", "remaining_time": "0:03:05"}
|
| 121 |
-
{"current_steps": 121, "total_steps": 219, "loss": 0.276, "lr": 4.960132495376919e-06, "epoch": 1.6575342465753424, "percentage": 55.25, "elapsed_time": "0:03:46", "remaining_time": "0:03:03"}
|
| 122 |
-
{"current_steps": 122, "total_steps": 219, "loss": 0.2886, "lr": 4.880407624710986e-06, "epoch": 1.6712328767123288, "percentage": 55.71, "elapsed_time": "0:03:47", "remaining_time": "0:03:00"}
|
| 123 |
-
{"current_steps": 123, "total_steps": 219, "loss": 0.2911, "lr": 4.800713167207449e-06, "epoch": 1.6849315068493151, "percentage": 56.16, "elapsed_time": "0:03:49", "remaining_time": "0:02:58"}
|
| 124 |
-
{"current_steps": 124, "total_steps": 219, "loss": 0.2931, "lr": 4.721069389714188e-06, "epoch": 1.6986301369863015, "percentage": 56.62, "elapsed_time": "0:03:50", "remaining_time": "0:02:56"}
|
| 125 |
-
{"current_steps": 125, "total_steps": 219, "loss": 0.2429, "lr": 4.641496546190813e-06, "epoch": 1.7123287671232876, "percentage": 57.08, "elapsed_time": "0:03:51", "remaining_time": "0:02:54"}
|
| 126 |
-
{"current_steps": 126, "total_steps": 219, "loss": 0.2898, "lr": 4.562014872557936e-06, "epoch": 1.726027397260274, "percentage": 57.53, "elapsed_time": "0:03:53", "remaining_time": "0:02:51"}
|
| 127 |
-
{"current_steps": 127, "total_steps": 219, "loss": 0.2853, "lr": 4.48264458155104e-06, "epoch": 1.7397260273972601, "percentage": 57.99, "elapsed_time": "0:03:54", "remaining_time": "0:02:49"}
|
| 128 |
-
{"current_steps": 128, "total_steps": 219, "loss": 0.2457, "lr": 4.403405857580243e-06, "epoch": 1.7534246575342465, "percentage": 58.45, "elapsed_time": "0:03:55", "remaining_time": "0:02:47"}
|
| 129 |
-
{"current_steps": 129, "total_steps": 219, "loss": 0.282, "lr": 4.3243188515972575e-06, "epoch": 1.7671232876712328, "percentage": 58.9, "elapsed_time": "0:03:57", "remaining_time": "0:02:45"}
|
| 130 |
-
{"current_steps": 130, "total_steps": 219, "loss": 0.2653, "lr": 4.245403675970877e-06, "epoch": 1.7808219178082192, "percentage": 59.36, "elapsed_time": "0:03:58", "remaining_time": "0:02:43"}
|
| 131 |
-
{"current_steps": 131, "total_steps": 219, "loss": 0.2535, "lr": 4.166680399372248e-06, "epoch": 1.7945205479452055, "percentage": 59.82, "elapsed_time": "0:04:00", "remaining_time": "0:02:41"}
|
| 132 |
-
{"current_steps": 132, "total_steps": 219, "loss": 0.2786, "lr": 4.08816904167128e-06, "epoch": 1.808219178082192, "percentage": 60.27, "elapsed_time": "0:04:01", "remaining_time": "0:02:39"}
|
| 133 |
-
{"current_steps": 133, "total_steps": 219, "loss": 0.2588, "lr": 4.009889568845453e-06, "epoch": 1.821917808219178, "percentage": 60.73, "elapsed_time": "0:04:02", "remaining_time": "0:02:36"}
|
| 134 |
-
{"current_steps": 134, "total_steps": 219, "loss": 0.276, "lr": 3.9318618879023255e-06, "epoch": 1.8356164383561644, "percentage": 61.19, "elapsed_time": "0:04:04", "remaining_time": "0:02:34"}
|
| 135 |
-
{"current_steps": 135, "total_steps": 219, "loss": 0.2486, "lr": 3.854105841817056e-06, "epoch": 1.8493150684931505, "percentage": 61.64, "elapsed_time": "0:04:05", "remaining_time": "0:02:32"}
|
| 136 |
-
{"current_steps": 136, "total_steps": 219, "loss": 0.3044, "lr": 3.776641204486191e-06, "epoch": 1.8630136986301369, "percentage": 62.1, "elapsed_time": "0:04:06", "remaining_time": "0:02:30"}
|
| 137 |
-
{"current_steps": 137, "total_steps": 219, "loss": 0.2668, "lr": 3.699487675699027e-06, "epoch": 1.8767123287671232, "percentage": 62.56, "elapsed_time": "0:04:08", "remaining_time": "0:02:28"}
|
| 138 |
-
{"current_steps": 138, "total_steps": 219, "loss": 0.263, "lr": 3.6226648761278238e-06, "epoch": 1.8904109589041096, "percentage": 63.01, "elapsed_time": "0:04:09", "remaining_time": "0:02:26"}
|
| 139 |
-
{"current_steps": 139, "total_steps": 219, "loss": 0.2641, "lr": 3.5461923423381313e-06, "epoch": 1.904109589041096, "percentage": 63.47, "elapsed_time": "0:04:10", "remaining_time": "0:02:24"}
|
| 140 |
-
{"current_steps": 140, "total_steps": 219, "loss": 0.2841, "lr": 3.4700895218205026e-06, "epoch": 1.9178082191780823, "percentage": 63.93, "elapsed_time": "0:04:12", "remaining_time": "0:02:22"}
|
| 141 |
-
{"current_steps": 141, "total_steps": 219, "loss": 0.2793, "lr": 3.3943757680448697e-06, "epoch": 1.9315068493150684, "percentage": 64.38, "elapsed_time": "0:04:13", "remaining_time": "0:02:20"}
|
| 142 |
-
{"current_steps": 142, "total_steps": 219, "loss": 0.2646, "lr": 3.3190703355388165e-06, "epoch": 1.9452054794520548, "percentage": 64.84, "elapsed_time": "0:04:14", "remaining_time": "0:02:18"}
|
| 143 |
-
{"current_steps": 143, "total_steps": 219, "loss": 0.2544, "lr": 3.244192374991027e-06, "epoch": 1.958904109589041, "percentage": 65.3, "elapsed_time": "0:04:16", "remaining_time": "0:02:16"}
|
| 144 |
-
{"current_steps": 144, "total_steps": 219, "loss": 0.2838, "lr": 3.169760928381127e-06, "epoch": 1.9726027397260273, "percentage": 65.75, "elapsed_time": "0:04:17", "remaining_time": "0:02:14"}
|
| 145 |
-
{"current_steps": 145, "total_steps": 219, "loss": 0.2582, "lr": 3.0957949241371845e-06, "epoch": 1.9863013698630136, "percentage": 66.21, "elapsed_time": "0:04:18", "remaining_time": "0:02:12"}
|
| 146 |
-
{"current_steps": 146, "total_steps": 219, "loss": 0.2092, "lr": 3.0223131723220756e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:04:20", "remaining_time": "0:02:10"}
|
| 147 |
-
{"current_steps": 147, "total_steps": 219, "loss": 0.2165, "lr": 2.949334359849957e-06, "epoch": 2.0136986301369864, "percentage": 67.12, "elapsed_time": "0:05:19", "remaining_time": "0:02:36"}
|
| 148 |
-
{"current_steps": 148, "total_steps": 219, "loss": 0.2247, "lr": 2.876877045734058e-06, "epoch": 2.0273972602739727, "percentage": 67.58, "elapsed_time": "0:05:20", "remaining_time": "0:02:33"}
|
| 149 |
-
{"current_steps": 149, "total_steps": 219, "loss": 0.1997, "lr": 2.8049596563669936e-06, "epoch": 2.041095890410959, "percentage": 68.04, "elapsed_time": "0:05:22", "remaining_time": "0:02:31"}
|
| 150 |
-
{"current_steps": 150, "total_steps": 219, "loss": 0.2302, "lr": 2.7336004808348094e-06, "epoch": 2.0547945205479454, "percentage": 68.49, "elapsed_time": "0:05:23", "remaining_time": "0:02:28"}
|
| 151 |
-
{"current_steps": 151, "total_steps": 219, "loss": 0.2337, "lr": 2.662817666265932e-06, "epoch": 2.0684931506849313, "percentage": 68.95, "elapsed_time": "0:05:24", "remaining_time": "0:02:26"}
|
| 152 |
-
{"current_steps": 152, "total_steps": 219, "loss": 0.2303, "lr": 2.5926292132162432e-06, "epoch": 2.0821917808219177, "percentage": 69.41, "elapsed_time": "0:05:26", "remaining_time": "0:02:23"}
|
| 153 |
-
{"current_steps": 153, "total_steps": 219, "loss": 0.2373, "lr": 2.5230529710914074e-06, "epoch": 2.095890410958904, "percentage": 69.86, "elapsed_time": "0:05:27", "remaining_time": "0:02:21"}
|
| 154 |
-
{"current_steps": 154, "total_steps": 219, "loss": 0.1983, "lr": 2.4541066336076434e-06, "epoch": 2.1095890410958904, "percentage": 70.32, "elapsed_time": "0:05:28", "remaining_time": "0:02:18"}
|
| 155 |
-
{"current_steps": 155, "total_steps": 219, "loss": 0.3069, "lr": 2.385807734292097e-06, "epoch": 2.1232876712328768, "percentage": 70.78, "elapsed_time": "0:05:30", "remaining_time": "0:02:16"}
|
| 156 |
-
{"current_steps": 156, "total_steps": 219, "loss": 0.2487, "lr": 2.318173642023939e-06, "epoch": 2.136986301369863, "percentage": 71.23, "elapsed_time": "0:05:31", "remaining_time": "0:02:13"}
|
| 157 |
-
{"current_steps": 157, "total_steps": 219, "loss": 0.2513, "lr": 2.251221556617344e-06, "epoch": 2.1506849315068495, "percentage": 71.69, "elapsed_time": "0:05:33", "remaining_time": "0:02:11"}
|
| 158 |
-
{"current_steps": 158, "total_steps": 219, "loss": 0.2337, "lr": 2.184968504447453e-06, "epoch": 2.1643835616438354, "percentage": 72.15, "elapsed_time": "0:05:34", "remaining_time": "0:02:09"}
|
| 159 |
-
{"current_steps": 159, "total_steps": 219, "loss": 0.1819, "lr": 2.11943133412046e-06, "epoch": 2.1780821917808217, "percentage": 72.6, "elapsed_time": "0:05:36", "remaining_time": "0:02:06"}
|
| 160 |
-
{"current_steps": 160, "total_steps": 219, "loss": 0.2157, "lr": 2.0546267121888863e-06, "epoch": 2.191780821917808, "percentage": 73.06, "elapsed_time": "0:05:38", "remaining_time": "0:02:04"}
|
| 161 |
-
{"current_steps": 161, "total_steps": 219, "loss": 0.2337, "lr": 1.990571118913166e-06, "epoch": 2.2054794520547945, "percentage": 73.52, "elapsed_time": "0:05:40", "remaining_time": "0:02:02"}
|
| 162 |
-
{"current_steps": 162, "total_steps": 219, "loss": 0.2319, "lr": 1.9272808440706024e-06, "epoch": 2.219178082191781, "percentage": 73.97, "elapsed_time": "0:05:41", "remaining_time": "0:02:00"}
|
| 163 |
-
{"current_steps": 163, "total_steps": 219, "loss": 0.2067, "lr": 1.864771982812763e-06, "epoch": 2.232876712328767, "percentage": 74.43, "elapsed_time": "0:05:42", "remaining_time": "0:01:57"}
|
| 164 |
-
{"current_steps": 164, "total_steps": 219, "loss": 0.1983, "lr": 1.8030604315723765e-06, "epoch": 2.2465753424657535, "percentage": 74.89, "elapsed_time": "0:05:44", "remaining_time": "0:01:55"}
|
| 165 |
-
{"current_steps": 165, "total_steps": 219, "loss": 0.2062, "lr": 1.7421618840207576e-06, "epoch": 2.26027397260274, "percentage": 75.34, "elapsed_time": "0:05:45", "remaining_time": "0:01:53"}
|
| 166 |
-
{"current_steps": 166, "total_steps": 219, "loss": 0.2391, "lr": 1.682091827076796e-06, "epoch": 2.2739726027397262, "percentage": 75.8, "elapsed_time": "0:05:46", "remaining_time": "0:01:50"}
|
| 167 |
-
{"current_steps": 167, "total_steps": 219, "loss": 0.2615, "lr": 1.6228655369685342e-06, "epoch": 2.287671232876712, "percentage": 76.26, "elapsed_time": "0:05:48", "remaining_time": "0:01:48"}
|
| 168 |
-
{"current_steps": 168, "total_steps": 219, "loss": 0.2346, "lr": 1.5644980753483109e-06, "epoch": 2.3013698630136985, "percentage": 76.71, "elapsed_time": "0:05:49", "remaining_time": "0:01:46"}
|
| 169 |
-
{"current_steps": 169, "total_steps": 219, "loss": 0.2281, "lr": 1.5070042854624833e-06, "epoch": 2.315068493150685, "percentage": 77.17, "elapsed_time": "0:05:50", "remaining_time": "0:01:43"}
|
| 170 |
-
{"current_steps": 170, "total_steps": 219, "loss": 0.2411, "lr": 1.4503987883766857e-06, "epoch": 2.328767123287671, "percentage": 77.63, "elapsed_time": "0:05:52", "remaining_time": "0:01:41"}
|
| 171 |
-
{"current_steps": 171, "total_steps": 219, "loss": 0.214, "lr": 1.3946959792575915e-06, "epoch": 2.3424657534246576, "percentage": 78.08, "elapsed_time": "0:05:53", "remaining_time": "0:01:39"}
|
| 172 |
-
{"current_steps": 172, "total_steps": 219, "loss": 0.1733, "lr": 1.3399100237121266e-06, "epoch": 2.356164383561644, "percentage": 78.54, "elapsed_time": "0:05:54", "remaining_time": "0:01:36"}
|
| 173 |
-
{"current_steps": 173, "total_steps": 219, "loss": 0.191, "lr": 1.2860548541850542e-06, "epoch": 2.3698630136986303, "percentage": 79.0, "elapsed_time": "0:05:56", "remaining_time": "0:01:34"}
|
| 174 |
-
{"current_steps": 174, "total_steps": 219, "loss": 0.2372, "lr": 1.233144166415861e-06, "epoch": 2.383561643835616, "percentage": 79.45, "elapsed_time": "0:05:57", "remaining_time": "0:01:32"}
|
| 175 |
-
{"current_steps": 175, "total_steps": 219, "loss": 0.187, "lr": 1.1811914159558374e-06, "epoch": 2.3972602739726026, "percentage": 79.91, "elapsed_time": "0:05:58", "remaining_time": "0:01:30"}
|
| 176 |
-
{"current_steps": 176, "total_steps": 219, "loss": 0.2357, "lr": 1.1302098147462348e-06, "epoch": 2.410958904109589, "percentage": 80.37, "elapsed_time": "0:06:00", "remaining_time": "0:01:27"}
|
| 177 |
-
{"current_steps": 177, "total_steps": 219, "loss": 0.2322, "lr": 1.080212327758382e-06, "epoch": 2.4246575342465753, "percentage": 80.82, "elapsed_time": "0:06:01", "remaining_time": "0:01:25"}
|
| 178 |
-
{"current_steps": 178, "total_steps": 219, "loss": 0.1893, "lr": 1.0312116696966012e-06, "epoch": 2.4383561643835616, "percentage": 81.28, "elapsed_time": "0:06:02", "remaining_time": "0:01:23"}
|
| 179 |
-
{"current_steps": 179, "total_steps": 219, "loss": 0.2097, "lr": 9.832203017647746e-07, "epoch": 2.452054794520548, "percentage": 81.74, "elapsed_time": "0:06:04", "remaining_time": "0:01:21"}
|
| 180 |
-
{"current_steps": 180, "total_steps": 219, "loss": 0.187, "lr": 9.362504284973683e-07, "epoch": 2.4657534246575343, "percentage": 82.19, "elapsed_time": "0:06:05", "remaining_time": "0:01:19"}
|
| 181 |
-
{"current_steps": 181, "total_steps": 219, "loss": 0.2157, "lr": 8.903139946557437e-07, "epoch": 2.4794520547945207, "percentage": 82.65, "elapsed_time": "0:06:06", "remaining_time": "0:01:16"}
|
| 182 |
-
{"current_steps": 182, "total_steps": 219, "loss": 0.2315, "lr": 8.454226821905171e-07, "epoch": 2.493150684931507, "percentage": 83.11, "elapsed_time": "0:06:07", "remaining_time": "0:01:14"}
|
| 183 |
-
{"current_steps": 183, "total_steps": 219, "loss": 0.2128, "lr": 8.015879072707611e-07, "epoch": 2.506849315068493, "percentage": 83.56, "elapsed_time": "0:06:09", "remaining_time": "0:01:12"}
|
| 184 |
-
{"current_steps": 184, "total_steps": 219, "loss": 0.21, "lr": 7.588208173807943e-07, "epoch": 2.5205479452054793, "percentage": 84.02, "elapsed_time": "0:06:10", "remaining_time": "0:01:10"}
|
| 185 |
-
{"current_steps": 185, "total_steps": 219, "loss": 0.227, "lr": 7.171322884852988e-07, "epoch": 2.5342465753424657, "percentage": 84.47, "elapsed_time": "0:06:11", "remaining_time": "0:01:08"}
|
| 186 |
-
{"current_steps": 186, "total_steps": 219, "loss": 0.2004, "lr": 6.765329222634892e-07, "epoch": 2.547945205479452, "percentage": 84.93, "elapsed_time": "0:06:13", "remaining_time": "0:01:06"}
|
| 187 |
-
{"current_steps": 187, "total_steps": 219, "loss": 0.2319, "lr": 6.370330434130317e-07, "epoch": 2.5616438356164384, "percentage": 85.39, "elapsed_time": "0:06:14", "remaining_time": "0:01:04"}
|
| 188 |
-
{"current_steps": 188, "total_steps": 219, "loss": 0.242, "lr": 5.986426970244009e-07, "epoch": 2.5753424657534247, "percentage": 85.84, "elapsed_time": "0:06:15", "remaining_time": "0:01:01"}
|
| 189 |
-
{"current_steps": 189, "total_steps": 219, "loss": 0.1823, "lr": 5.613716460263485e-07, "epoch": 2.589041095890411, "percentage": 86.3, "elapsed_time": "0:06:17", "remaining_time": "0:00:59"}
|
| 190 |
-
{"current_steps": 190, "total_steps": 219, "loss": 0.2112, "lr": 5.252293687031196e-07, "epoch": 2.602739726027397, "percentage": 86.76, "elapsed_time": "0:06:18", "remaining_time": "0:00:57"}
|
| 191 |
-
{"current_steps": 191, "total_steps": 219, "loss": 0.2016, "lr": 4.902250562840622e-07, "epoch": 2.616438356164384, "percentage": 87.21, "elapsed_time": "0:06:20", "remaining_time": "0:00:55"}
|
| 192 |
-
{"current_steps": 192, "total_steps": 219, "loss": 0.2507, "lr": 4.5636761060623314e-07, "epoch": 2.6301369863013697, "percentage": 87.67, "elapsed_time": "0:06:21", "remaining_time": "0:00:53"}
|
| 193 |
-
{"current_steps": 193, "total_steps": 219, "loss": 0.2042, "lr": 4.2366564185060134e-07, "epoch": 2.643835616438356, "percentage": 88.13, "elapsed_time": "0:06:22", "remaining_time": "0:00:51"}
|
| 194 |
-
{"current_steps": 194, "total_steps": 219, "loss": 0.2087, "lr": 3.921274663524183e-07, "epoch": 2.6575342465753424, "percentage": 88.58, "elapsed_time": "0:06:24", "remaining_time": "0:00:49"}
|
| 195 |
-
{"current_steps": 195, "total_steps": 219, "loss": 0.2578, "lr": 3.61761104486314e-07, "epoch": 2.671232876712329, "percentage": 89.04, "elapsed_time": "0:06:25", "remaining_time": "0:00:47"}
|
| 196 |
-
{"current_steps": 196, "total_steps": 219, "loss": 0.2471, "lr": 3.3257427862666894e-07, "epoch": 2.684931506849315, "percentage": 89.5, "elapsed_time": "0:06:26", "remaining_time": "0:00:45"}
|
| 197 |
-
{"current_steps": 197, "total_steps": 219, "loss": 0.2304, "lr": 3.045744111837529e-07, "epoch": 2.6986301369863015, "percentage": 89.95, "elapsed_time": "0:06:28", "remaining_time": "0:00:43"}
|
| 198 |
-
{"current_steps": 198, "total_steps": 219, "loss": 0.1633, "lr": 2.777686227161591e-07, "epoch": 2.712328767123288, "percentage": 90.41, "elapsed_time": "0:06:29", "remaining_time": "0:00:41"}
|
| 199 |
-
{"current_steps": 199, "total_steps": 219, "loss": 0.2266, "lr": 2.5216373011999697e-07, "epoch": 2.7260273972602738, "percentage": 90.87, "elapsed_time": "0:06:30", "remaining_time": "0:00:39"}
|
| 200 |
-
{"current_steps": 200, "total_steps": 219, "loss": 0.234, "lr": 2.2776624489530664e-07, "epoch": 2.73972602739726, "percentage": 91.32, "elapsed_time": "0:06:31", "remaining_time": "0:00:37"}
|
| 201 |
-
{"current_steps": 201, "total_steps": 219, "loss": 0.2286, "lr": 2.0458237149014347e-07, "epoch": 2.7534246575342465, "percentage": 91.78, "elapsed_time": "0:06:33", "remaining_time": "0:00:35"}
|
| 202 |
-
{"current_steps": 202, "total_steps": 219, "loss": 0.2296, "lr": 1.8261800572274001e-07, "epoch": 2.767123287671233, "percentage": 92.24, "elapsed_time": "0:06:34", "remaining_time": "0:00:33"}
|
| 203 |
-
{"current_steps": 203, "total_steps": 219, "loss": 0.2116, "lr": 1.6187873328216142e-07, "epoch": 2.780821917808219, "percentage": 92.69, "elapsed_time": "0:06:35", "remaining_time": "0:00:31"}
|
| 204 |
-
{"current_steps": 204, "total_steps": 219, "loss": 0.2032, "lr": 1.4236982830782676e-07, "epoch": 2.7945205479452055, "percentage": 93.15, "elapsed_time": "0:06:37", "remaining_time": "0:00:29"}
|
| 205 |
-
{"current_steps": 205, "total_steps": 219, "loss": 0.2345, "lr": 1.2409625204825802e-07, "epoch": 2.808219178082192, "percentage": 93.61, "elapsed_time": "0:06:38", "remaining_time": "0:00:27"}
|
| 206 |
-
{"current_steps": 206, "total_steps": 219, "loss": 0.19, "lr": 1.0706265159939944e-07, "epoch": 2.821917808219178, "percentage": 94.06, "elapsed_time": "0:06:39", "remaining_time": "0:00:25"}
|
| 207 |
-
{"current_steps": 207, "total_steps": 219, "loss": 0.1803, "lr": 9.12733587228326e-08, "epoch": 2.8356164383561646, "percentage": 94.52, "elapsed_time": "0:06:41", "remaining_time": "0:00:23"}
|
| 208 |
-
{"current_steps": 208, "total_steps": 219, "loss": 0.1956, "lr": 7.673238874417676e-08, "epoch": 2.8493150684931505, "percentage": 94.98, "elapsed_time": "0:06:42", "remaining_time": "0:00:21"}
|
| 209 |
-
{"current_steps": 209, "total_steps": 219, "loss": 0.2221, "lr": 6.344343953196386e-08, "epoch": 2.863013698630137, "percentage": 95.43, "elapsed_time": "0:06:43", "remaining_time": "0:00:19"}
|
| 210 |
-
{"current_steps": 210, "total_steps": 219, "loss": 0.2437, "lr": 5.1409890557246876e-08, "epoch": 2.8767123287671232, "percentage": 95.89, "elapsed_time": "0:06:45", "remaining_time": "0:00:17"}
|
| 211 |
-
{"current_steps": 211, "total_steps": 219, "loss": 0.2314, "lr": 4.063480203417625e-08, "epoch": 2.8904109589041096, "percentage": 96.35, "elapsed_time": "0:06:46", "remaining_time": "0:00:15"}
|
| 212 |
-
{"current_steps": 212, "total_steps": 219, "loss": 0.249, "lr": 3.1120914141766214e-08, "epoch": 2.904109589041096, "percentage": 96.8, "elapsed_time": "0:06:47", "remaining_time": "0:00:13"}
|
| 213 |
-
{"current_steps": 213, "total_steps": 219, "loss": 0.2131, "lr": 2.287064632705005e-08, "epoch": 2.9178082191780823, "percentage": 97.26, "elapsed_time": "0:06:49", "remaining_time": "0:00:11"}
|
| 214 |
-
{"current_steps": 214, "total_steps": 219, "loss": 0.2178, "lr": 1.588609668979446e-08, "epoch": 2.9315068493150687, "percentage": 97.72, "elapsed_time": "0:06:50", "remaining_time": "0:00:09"}
|
| 215 |
-
{"current_steps": 215, "total_steps": 219, "loss": 0.2207, "lr": 1.016904144894304e-08, "epoch": 2.9452054794520546, "percentage": 98.17, "elapsed_time": "0:06:52", "remaining_time": "0:00:07"}
|
| 216 |
-
{"current_steps": 216, "total_steps": 219, "loss": 0.2142, "lr": 5.720934490907604e-09, "epoch": 2.958904109589041, "percentage": 98.63, "elapsed_time": "0:06:53", "remaining_time": "0:00:05"}
|
| 217 |
-
{"current_steps": 217, "total_steps": 219, "loss": 0.2298, "lr": 2.542906999836725e-09, "epoch": 2.9726027397260273, "percentage": 99.09, "elapsed_time": "0:06:54", "remaining_time": "0:00:03"}
|
| 218 |
-
{"current_steps": 218, "total_steps": 219, "loss": 0.2056, "lr": 6.357671699486201e-10, "epoch": 2.9863013698630136, "percentage": 99.54, "elapsed_time": "0:06:56", "remaining_time": "0:00:01"}
|
| 219 |
-
{"current_steps": 219, "total_steps": 219, "loss": 0.1987, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:06:57", "remaining_time": "0:00:00"}
|
| 220 |
-
{"current_steps": 219, "total_steps": 219, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:09:06", "remaining_time": "0:00:00"}
|
|
|
|
| 1 |
+
{"current_steps": 1, "total_steps": 216, "loss": 0.4904, "lr": 4.5454545454545457e-07, "epoch": 0.013824884792626729, "percentage": 0.46, "elapsed_time": "0:00:06", "remaining_time": "0:23:47"}
|
| 2 |
+
{"current_steps": 2, "total_steps": 216, "loss": 0.4586, "lr": 9.090909090909091e-07, "epoch": 0.027649769585253458, "percentage": 0.93, "elapsed_time": "0:00:10", "remaining_time": "0:18:01"}
|
| 3 |
+
{"current_steps": 3, "total_steps": 216, "loss": 0.4491, "lr": 1.3636363636363636e-06, "epoch": 0.041474654377880185, "percentage": 1.39, "elapsed_time": "0:00:13", "remaining_time": "0:15:57"}
|
| 4 |
+
{"current_steps": 4, "total_steps": 216, "loss": 0.495, "lr": 1.8181818181818183e-06, "epoch": 0.055299539170506916, "percentage": 1.85, "elapsed_time": "0:00:16", "remaining_time": "0:14:59"}
|
| 5 |
+
{"current_steps": 5, "total_steps": 216, "loss": 0.4518, "lr": 2.2727272727272728e-06, "epoch": 0.06912442396313365, "percentage": 2.31, "elapsed_time": "0:00:20", "remaining_time": "0:14:22"}
|
| 6 |
+
{"current_steps": 6, "total_steps": 216, "loss": 0.4245, "lr": 2.7272727272727272e-06, "epoch": 0.08294930875576037, "percentage": 2.78, "elapsed_time": "0:00:23", "remaining_time": "0:13:56"}
|
| 7 |
+
{"current_steps": 7, "total_steps": 216, "loss": 0.4485, "lr": 3.181818181818182e-06, "epoch": 0.0967741935483871, "percentage": 3.24, "elapsed_time": "0:00:27", "remaining_time": "0:13:36"}
|
| 8 |
+
{"current_steps": 8, "total_steps": 216, "loss": 0.4126, "lr": 3.6363636363636366e-06, "epoch": 0.11059907834101383, "percentage": 3.7, "elapsed_time": "0:00:30", "remaining_time": "0:13:18"}
|
| 9 |
+
{"current_steps": 9, "total_steps": 216, "loss": 0.3782, "lr": 4.0909090909090915e-06, "epoch": 0.12442396313364056, "percentage": 4.17, "elapsed_time": "0:00:34", "remaining_time": "0:13:05"}
|
| 10 |
+
{"current_steps": 10, "total_steps": 216, "loss": 0.4114, "lr": 4.5454545454545455e-06, "epoch": 0.1382488479262673, "percentage": 4.63, "elapsed_time": "0:00:37", "remaining_time": "0:12:53"}
|
| 11 |
+
{"current_steps": 11, "total_steps": 216, "loss": 0.4018, "lr": 5e-06, "epoch": 0.15207373271889402, "percentage": 5.09, "elapsed_time": "0:00:40", "remaining_time": "0:12:42"}
|
| 12 |
+
{"current_steps": 12, "total_steps": 216, "loss": 0.3739, "lr": 5.4545454545454545e-06, "epoch": 0.16589861751152074, "percentage": 5.56, "elapsed_time": "0:00:44", "remaining_time": "0:12:33"}
|
| 13 |
+
{"current_steps": 13, "total_steps": 216, "loss": 0.3516, "lr": 5.90909090909091e-06, "epoch": 0.17972350230414746, "percentage": 6.02, "elapsed_time": "0:00:47", "remaining_time": "0:12:25"}
|
| 14 |
+
{"current_steps": 14, "total_steps": 216, "loss": 0.3873, "lr": 6.363636363636364e-06, "epoch": 0.1935483870967742, "percentage": 6.48, "elapsed_time": "0:00:51", "remaining_time": "0:12:18"}
|
| 15 |
+
{"current_steps": 15, "total_steps": 216, "loss": 0.3635, "lr": 6.818181818181818e-06, "epoch": 0.2073732718894009, "percentage": 6.94, "elapsed_time": "0:00:54", "remaining_time": "0:12:10"}
|
| 16 |
+
{"current_steps": 16, "total_steps": 216, "loss": 0.3538, "lr": 7.272727272727273e-06, "epoch": 0.22119815668202766, "percentage": 7.41, "elapsed_time": "0:00:57", "remaining_time": "0:12:04"}
|
| 17 |
+
{"current_steps": 17, "total_steps": 216, "loss": 0.3322, "lr": 7.727272727272727e-06, "epoch": 0.2350230414746544, "percentage": 7.87, "elapsed_time": "0:01:01", "remaining_time": "0:11:58"}
|
| 18 |
+
{"current_steps": 18, "total_steps": 216, "loss": 0.3175, "lr": 8.181818181818183e-06, "epoch": 0.2488479262672811, "percentage": 8.33, "elapsed_time": "0:01:04", "remaining_time": "0:11:52"}
|
| 19 |
+
{"current_steps": 19, "total_steps": 216, "loss": 0.2943, "lr": 8.636363636363637e-06, "epoch": 0.2626728110599078, "percentage": 8.8, "elapsed_time": "0:01:08", "remaining_time": "0:11:46"}
|
| 20 |
+
{"current_steps": 20, "total_steps": 216, "loss": 0.3269, "lr": 9.090909090909091e-06, "epoch": 0.2764976958525346, "percentage": 9.26, "elapsed_time": "0:01:11", "remaining_time": "0:11:40"}
|
| 21 |
+
{"current_steps": 21, "total_steps": 216, "loss": 0.3665, "lr": 9.545454545454547e-06, "epoch": 0.2903225806451613, "percentage": 9.72, "elapsed_time": "0:01:14", "remaining_time": "0:11:35"}
|
| 22 |
+
{"current_steps": 22, "total_steps": 216, "loss": 0.3081, "lr": 1e-05, "epoch": 0.30414746543778803, "percentage": 10.19, "elapsed_time": "0:01:18", "remaining_time": "0:11:30"}
|
| 23 |
+
{"current_steps": 23, "total_steps": 216, "loss": 0.3216, "lr": 9.999344418328161e-06, "epoch": 0.31797235023041476, "percentage": 10.65, "elapsed_time": "0:01:21", "remaining_time": "0:11:25"}
|
| 24 |
+
{"current_steps": 24, "total_steps": 216, "loss": 0.322, "lr": 9.997377845227577e-06, "epoch": 0.3317972350230415, "percentage": 11.11, "elapsed_time": "0:01:25", "remaining_time": "0:11:21"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 216, "loss": 0.3406, "lr": 9.994100796397954e-06, "epoch": 0.3456221198156682, "percentage": 11.57, "elapsed_time": "0:01:28", "remaining_time": "0:11:16"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 216, "loss": 0.342, "lr": 9.98951413118856e-06, "epoch": 0.35944700460829493, "percentage": 12.04, "elapsed_time": "0:01:32", "remaining_time": "0:11:12"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 216, "loss": 0.3228, "lr": 9.983619052372847e-06, "epoch": 0.37327188940092165, "percentage": 12.5, "elapsed_time": "0:01:35", "remaining_time": "0:11:07"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 216, "loss": 0.34, "lr": 9.97641710583307e-06, "epoch": 0.3870967741935484, "percentage": 12.96, "elapsed_time": "0:01:38", "remaining_time": "0:11:02"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 216, "loss": 0.3624, "lr": 9.96791018015489e-06, "epoch": 0.4009216589861751, "percentage": 13.43, "elapsed_time": "0:01:42", "remaining_time": "0:10:58"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 216, "loss": 0.3362, "lr": 9.958100506132127e-06, "epoch": 0.4147465437788018, "percentage": 13.89, "elapsed_time": "0:01:45", "remaining_time": "0:10:54"}
|
| 31 |
+
{"current_steps": 31, "total_steps": 216, "loss": 0.3306, "lr": 9.946990656181782e-06, "epoch": 0.42857142857142855, "percentage": 14.35, "elapsed_time": "0:01:48", "remaining_time": "0:10:49"}
|
| 32 |
+
{"current_steps": 32, "total_steps": 216, "loss": 0.333, "lr": 9.934583543669454e-06, "epoch": 0.4423963133640553, "percentage": 14.81, "elapsed_time": "0:01:52", "remaining_time": "0:10:45"}
|
| 33 |
+
{"current_steps": 33, "total_steps": 216, "loss": 0.3297, "lr": 9.920882422145372e-06, "epoch": 0.45622119815668205, "percentage": 15.28, "elapsed_time": "0:01:55", "remaining_time": "0:10:41"}
|
| 34 |
+
{"current_steps": 34, "total_steps": 216, "loss": 0.3474, "lr": 9.905890884491196e-06, "epoch": 0.4700460829493088, "percentage": 15.74, "elapsed_time": "0:01:59", "remaining_time": "0:10:37"}
|
| 35 |
+
{"current_steps": 35, "total_steps": 216, "loss": 0.3366, "lr": 9.889612861977855e-06, "epoch": 0.4838709677419355, "percentage": 16.2, "elapsed_time": "0:02:02", "remaining_time": "0:10:33"}
|
| 36 |
+
{"current_steps": 36, "total_steps": 216, "loss": 0.3247, "lr": 9.872052623234632e-06, "epoch": 0.4976958525345622, "percentage": 16.67, "elapsed_time": "0:02:05", "remaining_time": "0:10:28"}
|
| 37 |
+
{"current_steps": 37, "total_steps": 216, "loss": 0.3035, "lr": 9.853214773129796e-06, "epoch": 0.511520737327189, "percentage": 17.13, "elapsed_time": "0:02:09", "remaining_time": "0:10:25"}
|
| 38 |
+
{"current_steps": 38, "total_steps": 216, "loss": 0.3222, "lr": 9.833104251563058e-06, "epoch": 0.5253456221198156, "percentage": 17.59, "elapsed_time": "0:02:12", "remaining_time": "0:10:20"}
|
| 39 |
+
{"current_steps": 39, "total_steps": 216, "loss": 0.3557, "lr": 9.811726332170153e-06, "epoch": 0.5391705069124424, "percentage": 18.06, "elapsed_time": "0:02:15", "remaining_time": "0:10:17"}
|
| 40 |
+
{"current_steps": 40, "total_steps": 216, "loss": 0.3392, "lr": 9.789086620939936e-06, "epoch": 0.5529953917050692, "percentage": 18.52, "elapsed_time": "0:02:19", "remaining_time": "0:10:12"}
|
| 41 |
+
{"current_steps": 41, "total_steps": 216, "loss": 0.3305, "lr": 9.765191054744305e-06, "epoch": 0.5668202764976958, "percentage": 18.98, "elapsed_time": "0:02:22", "remaining_time": "0:10:08"}
|
| 42 |
+
{"current_steps": 42, "total_steps": 216, "loss": 0.3387, "lr": 9.740045899781353e-06, "epoch": 0.5806451612903226, "percentage": 19.44, "elapsed_time": "0:02:26", "remaining_time": "0:10:05"}
|
| 43 |
+
{"current_steps": 43, "total_steps": 216, "loss": 0.378, "lr": 9.713657749932172e-06, "epoch": 0.5944700460829493, "percentage": 19.91, "elapsed_time": "0:02:29", "remaining_time": "0:10:01"}
|
| 44 |
+
{"current_steps": 44, "total_steps": 216, "loss": 0.3808, "lr": 9.68603352503172e-06, "epoch": 0.6082949308755761, "percentage": 20.37, "elapsed_time": "0:02:32", "remaining_time": "0:09:57"}
|
| 45 |
+
{"current_steps": 45, "total_steps": 216, "loss": 0.3561, "lr": 9.657180469054213e-06, "epoch": 0.6221198156682027, "percentage": 20.83, "elapsed_time": "0:02:36", "remaining_time": "0:09:53"}
|
| 46 |
+
{"current_steps": 46, "total_steps": 216, "loss": 0.3224, "lr": 9.627106148213521e-06, "epoch": 0.6359447004608295, "percentage": 21.3, "elapsed_time": "0:02:39", "remaining_time": "0:09:49"}
|
| 47 |
+
{"current_steps": 47, "total_steps": 216, "loss": 0.3502, "lr": 9.595818448979061e-06, "epoch": 0.6497695852534562, "percentage": 21.76, "elapsed_time": "0:02:43", "remaining_time": "0:09:46"}
|
| 48 |
+
{"current_steps": 48, "total_steps": 216, "loss": 0.3172, "lr": 9.563325576007702e-06, "epoch": 0.663594470046083, "percentage": 22.22, "elapsed_time": "0:02:46", "remaining_time": "0:09:42"}
|
| 49 |
+
{"current_steps": 49, "total_steps": 216, "loss": 0.3078, "lr": 9.529636049992235e-06, "epoch": 0.6774193548387096, "percentage": 22.69, "elapsed_time": "0:02:49", "remaining_time": "0:09:38"}
|
| 50 |
+
{"current_steps": 50, "total_steps": 216, "loss": 0.3378, "lr": 9.494758705426978e-06, "epoch": 0.6912442396313364, "percentage": 23.15, "elapsed_time": "0:02:53", "remaining_time": "0:09:34"}
|
| 51 |
+
{"current_steps": 51, "total_steps": 216, "loss": 0.3749, "lr": 9.458702688291072e-06, "epoch": 0.7050691244239631, "percentage": 23.61, "elapsed_time": "0:02:56", "remaining_time": "0:09:31"}
|
| 52 |
+
{"current_steps": 52, "total_steps": 216, "loss": 0.3646, "lr": 9.421477453650118e-06, "epoch": 0.7188940092165899, "percentage": 24.07, "elapsed_time": "0:02:59", "remaining_time": "0:09:27"}
|
| 53 |
+
{"current_steps": 53, "total_steps": 216, "loss": 0.2952, "lr": 9.38309276317674e-06, "epoch": 0.7327188940092166, "percentage": 24.54, "elapsed_time": "0:03:03", "remaining_time": "0:09:23"}
|
| 54 |
+
{"current_steps": 54, "total_steps": 216, "loss": 0.3402, "lr": 9.343558682590757e-06, "epoch": 0.7465437788018433, "percentage": 25.0, "elapsed_time": "0:03:06", "remaining_time": "0:09:20"}
|
| 55 |
+
{"current_steps": 55, "total_steps": 216, "loss": 0.3157, "lr": 9.302885579019626e-06, "epoch": 0.7603686635944701, "percentage": 25.46, "elapsed_time": "0:03:10", "remaining_time": "0:09:16"}
|
| 56 |
+
{"current_steps": 56, "total_steps": 216, "loss": 0.3724, "lr": 9.261084118279846e-06, "epoch": 0.7741935483870968, "percentage": 25.93, "elapsed_time": "0:03:13", "remaining_time": "0:09:12"}
|
| 57 |
+
{"current_steps": 57, "total_steps": 216, "loss": 0.2915, "lr": 9.218165262080024e-06, "epoch": 0.7880184331797235, "percentage": 26.39, "elapsed_time": "0:03:16", "remaining_time": "0:09:09"}
|
| 58 |
+
{"current_steps": 58, "total_steps": 216, "loss": 0.3374, "lr": 9.174140265146356e-06, "epoch": 0.8018433179723502, "percentage": 26.85, "elapsed_time": "0:03:20", "remaining_time": "0:09:05"}
|
| 59 |
+
{"current_steps": 59, "total_steps": 216, "loss": 0.3119, "lr": 9.129020672271283e-06, "epoch": 0.815668202764977, "percentage": 27.31, "elapsed_time": "0:03:23", "remaining_time": "0:09:02"}
|
| 60 |
+
{"current_steps": 60, "total_steps": 216, "loss": 0.3139, "lr": 9.082818315286054e-06, "epoch": 0.8294930875576036, "percentage": 27.78, "elapsed_time": "0:03:27", "remaining_time": "0:08:58"}
|
| 61 |
+
{"current_steps": 61, "total_steps": 216, "loss": 0.3391, "lr": 9.035545309958048e-06, "epoch": 0.8433179723502304, "percentage": 28.24, "elapsed_time": "0:03:30", "remaining_time": "0:08:54"}
|
| 62 |
+
{"current_steps": 62, "total_steps": 216, "loss": 0.3385, "lr": 8.987214052813605e-06, "epoch": 0.8571428571428571, "percentage": 28.7, "elapsed_time": "0:03:33", "remaining_time": "0:08:51"}
|
| 63 |
+
{"current_steps": 63, "total_steps": 216, "loss": 0.3216, "lr": 8.937837217887273e-06, "epoch": 0.8709677419354839, "percentage": 29.17, "elapsed_time": "0:03:37", "remaining_time": "0:08:47"}
|
| 64 |
+
{"current_steps": 64, "total_steps": 216, "loss": 0.2931, "lr": 8.887427753398249e-06, "epoch": 0.8847926267281107, "percentage": 29.63, "elapsed_time": "0:03:40", "remaining_time": "0:08:44"}
|
| 65 |
+
{"current_steps": 65, "total_steps": 216, "loss": 0.3172, "lr": 8.83599887835493e-06, "epoch": 0.8986175115207373, "percentage": 30.09, "elapsed_time": "0:03:44", "remaining_time": "0:08:40"}
|
| 66 |
+
{"current_steps": 66, "total_steps": 216, "loss": 0.3882, "lr": 8.783564079088478e-06, "epoch": 0.9124423963133641, "percentage": 30.56, "elapsed_time": "0:03:47", "remaining_time": "0:08:37"}
|
| 67 |
+
{"current_steps": 67, "total_steps": 216, "loss": 0.2963, "lr": 8.730137105716231e-06, "epoch": 0.9262672811059908, "percentage": 31.02, "elapsed_time": "0:03:50", "remaining_time": "0:08:33"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 216, "loss": 0.2824, "lr": 8.675731968536004e-06, "epoch": 0.9400921658986175, "percentage": 31.48, "elapsed_time": "0:03:54", "remaining_time": "0:08:30"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 216, "loss": 0.3439, "lr": 8.620362934352109e-06, "epoch": 0.9539170506912442, "percentage": 31.94, "elapsed_time": "0:03:57", "remaining_time": "0:08:26"}
|
| 70 |
+
{"current_steps": 70, "total_steps": 216, "loss": 0.345, "lr": 8.564044522734147e-06, "epoch": 0.967741935483871, "percentage": 32.41, "elapsed_time": "0:04:01", "remaining_time": "0:08:23"}
|
| 71 |
+
{"current_steps": 71, "total_steps": 216, "loss": 0.3383, "lr": 8.506791502209497e-06, "epoch": 0.9815668202764977, "percentage": 32.87, "elapsed_time": "0:04:04", "remaining_time": "0:08:19"}
|
| 72 |
+
{"current_steps": 72, "total_steps": 216, "loss": 0.31, "lr": 8.448618886390523e-06, "epoch": 0.9953917050691244, "percentage": 33.33, "elapsed_time": "0:04:08", "remaining_time": "0:08:16"}
|
| 73 |
+
{"current_steps": 73, "total_steps": 216, "loss": 0.4918, "lr": 8.389541930037516e-06, "epoch": 1.0092165898617511, "percentage": 33.8, "elapsed_time": "0:05:10", "remaining_time": "0:10:08"}
|
| 74 |
+
{"current_steps": 74, "total_steps": 216, "loss": 0.284, "lr": 8.329576125058406e-06, "epoch": 1.023041474654378, "percentage": 34.26, "elapsed_time": "0:05:14", "remaining_time": "0:10:03"}
|
| 75 |
+
{"current_steps": 75, "total_steps": 216, "loss": 0.2914, "lr": 8.268737196446264e-06, "epoch": 1.0368663594470047, "percentage": 34.72, "elapsed_time": "0:05:17", "remaining_time": "0:09:57"}
|
| 76 |
+
{"current_steps": 76, "total_steps": 216, "loss": 0.2723, "lr": 8.207041098155701e-06, "epoch": 1.0506912442396312, "percentage": 35.19, "elapsed_time": "0:05:21", "remaining_time": "0:09:51"}
|
| 77 |
+
{"current_steps": 77, "total_steps": 216, "loss": 0.3119, "lr": 8.144504008919224e-06, "epoch": 1.064516129032258, "percentage": 35.65, "elapsed_time": "0:05:24", "remaining_time": "0:09:45"}
|
| 78 |
+
{"current_steps": 78, "total_steps": 216, "loss": 0.2598, "lr": 8.081142328004638e-06, "epoch": 1.0783410138248848, "percentage": 36.11, "elapsed_time": "0:05:28", "remaining_time": "0:09:40"}
|
| 79 |
+
{"current_steps": 79, "total_steps": 216, "loss": 0.322, "lr": 8.016972670914624e-06, "epoch": 1.0921658986175116, "percentage": 36.57, "elapsed_time": "0:05:31", "remaining_time": "0:09:34"}
|
| 80 |
+
{"current_steps": 80, "total_steps": 216, "loss": 0.2509, "lr": 7.952011865029614e-06, "epoch": 1.1059907834101383, "percentage": 37.04, "elapsed_time": "0:05:34", "remaining_time": "0:09:29"}
|
| 81 |
+
{"current_steps": 81, "total_steps": 216, "loss": 0.2206, "lr": 7.886276945195098e-06, "epoch": 1.119815668202765, "percentage": 37.5, "elapsed_time": "0:05:38", "remaining_time": "0:09:24"}
|
| 82 |
+
{"current_steps": 82, "total_steps": 216, "loss": 0.2954, "lr": 7.819785149254534e-06, "epoch": 1.1336405529953917, "percentage": 37.96, "elapsed_time": "0:05:41", "remaining_time": "0:09:18"}
|
| 83 |
+
{"current_steps": 83, "total_steps": 216, "loss": 0.2628, "lr": 7.752553913529019e-06, "epoch": 1.1474654377880185, "percentage": 38.43, "elapsed_time": "0:05:45", "remaining_time": "0:09:13"}
|
| 84 |
+
{"current_steps": 84, "total_steps": 216, "loss": 0.3206, "lr": 7.68460086824492e-06, "epoch": 1.1612903225806452, "percentage": 38.89, "elapsed_time": "0:05:48", "remaining_time": "0:09:08"}
|
| 85 |
+
{"current_steps": 85, "total_steps": 216, "loss": 0.2363, "lr": 7.61594383291065e-06, "epoch": 1.1751152073732718, "percentage": 39.35, "elapsed_time": "0:05:52", "remaining_time": "0:09:03"}
|
| 86 |
+
{"current_steps": 86, "total_steps": 216, "loss": 0.3353, "lr": 7.546600811643816e-06, "epoch": 1.1889400921658986, "percentage": 39.81, "elapsed_time": "0:05:55", "remaining_time": "0:08:57"}
|
| 87 |
+
{"current_steps": 87, "total_steps": 216, "loss": 0.2618, "lr": 7.476589988449939e-06, "epoch": 1.2027649769585254, "percentage": 40.28, "elapsed_time": "0:05:59", "remaining_time": "0:08:52"}
|
| 88 |
+
{"current_steps": 88, "total_steps": 216, "loss": 0.2639, "lr": 7.405929722454026e-06, "epoch": 1.2165898617511521, "percentage": 40.74, "elapsed_time": "0:06:02", "remaining_time": "0:08:47"}
|
| 89 |
+
{"current_steps": 89, "total_steps": 216, "loss": 0.2477, "lr": 7.334638543086203e-06, "epoch": 1.230414746543779, "percentage": 41.2, "elapsed_time": "0:06:06", "remaining_time": "0:08:42"}
|
| 90 |
+
{"current_steps": 90, "total_steps": 216, "loss": 0.2437, "lr": 7.262735145222696e-06, "epoch": 1.2442396313364055, "percentage": 41.67, "elapsed_time": "0:06:09", "remaining_time": "0:08:37"}
|
| 91 |
+
{"current_steps": 91, "total_steps": 216, "loss": 0.2625, "lr": 7.190238384283413e-06, "epoch": 1.2580645161290323, "percentage": 42.13, "elapsed_time": "0:06:13", "remaining_time": "0:08:32"}
|
| 92 |
+
{"current_steps": 92, "total_steps": 216, "loss": 0.2838, "lr": 7.117167271287453e-06, "epoch": 1.271889400921659, "percentage": 42.59, "elapsed_time": "0:06:16", "remaining_time": "0:08:27"}
|
| 93 |
+
{"current_steps": 93, "total_steps": 216, "loss": 0.2596, "lr": 7.043540967867782e-06, "epoch": 1.2857142857142856, "percentage": 43.06, "elapsed_time": "0:06:20", "remaining_time": "0:08:22"}
|
| 94 |
+
{"current_steps": 94, "total_steps": 216, "loss": 0.295, "lr": 6.969378781246436e-06, "epoch": 1.2995391705069124, "percentage": 43.52, "elapsed_time": "0:06:23", "remaining_time": "0:08:17"}
|
| 95 |
+
{"current_steps": 95, "total_steps": 216, "loss": 0.2478, "lr": 6.894700159171535e-06, "epoch": 1.3133640552995391, "percentage": 43.98, "elapsed_time": "0:06:27", "remaining_time": "0:08:13"}
|
| 96 |
+
{"current_steps": 96, "total_steps": 216, "loss": 0.2375, "lr": 6.819524684817439e-06, "epoch": 1.327188940092166, "percentage": 44.44, "elapsed_time": "0:06:30", "remaining_time": "0:08:08"}
|
| 97 |
+
{"current_steps": 97, "total_steps": 216, "loss": 0.293, "lr": 6.743872071649411e-06, "epoch": 1.3410138248847927, "percentage": 44.91, "elapsed_time": "0:06:34", "remaining_time": "0:08:03"}
|
| 98 |
+
{"current_steps": 98, "total_steps": 216, "loss": 0.2759, "lr": 6.667762158254104e-06, "epoch": 1.3548387096774195, "percentage": 45.37, "elapsed_time": "0:06:37", "remaining_time": "0:07:58"}
|
| 99 |
+
{"current_steps": 99, "total_steps": 216, "loss": 0.2919, "lr": 6.591214903137221e-06, "epoch": 1.368663594470046, "percentage": 45.83, "elapsed_time": "0:06:41", "remaining_time": "0:07:54"}
|
| 100 |
+
{"current_steps": 100, "total_steps": 216, "loss": 0.3236, "lr": 6.514250379489754e-06, "epoch": 1.3824884792626728, "percentage": 46.3, "elapsed_time": "0:06:44", "remaining_time": "0:07:49"}
|
| 101 |
+
{"current_steps": 101, "total_steps": 216, "loss": 0.2599, "lr": 6.436888769924142e-06, "epoch": 1.3963133640552996, "percentage": 46.76, "elapsed_time": "0:06:47", "remaining_time": "0:07:44"}
|
| 102 |
+
{"current_steps": 102, "total_steps": 216, "loss": 0.2881, "lr": 6.3591503611817155e-06, "epoch": 1.4101382488479262, "percentage": 47.22, "elapsed_time": "0:06:51", "remaining_time": "0:07:39"}
|
| 103 |
+
{"current_steps": 103, "total_steps": 216, "loss": 0.2528, "lr": 6.281055538812861e-06, "epoch": 1.423963133640553, "percentage": 47.69, "elapsed_time": "0:06:54", "remaining_time": "0:07:35"}
|
| 104 |
+
{"current_steps": 104, "total_steps": 216, "loss": 0.2586, "lr": 6.202624781831269e-06, "epoch": 1.4377880184331797, "percentage": 48.15, "elapsed_time": "0:06:58", "remaining_time": "0:07:30"}
|
| 105 |
+
{"current_steps": 105, "total_steps": 216, "loss": 0.2933, "lr": 6.123878657343648e-06, "epoch": 1.4516129032258065, "percentage": 48.61, "elapsed_time": "0:07:01", "remaining_time": "0:07:25"}
|
| 106 |
+
{"current_steps": 106, "total_steps": 216, "loss": 0.2682, "lr": 6.044837815156377e-06, "epoch": 1.4654377880184333, "percentage": 49.07, "elapsed_time": "0:07:05", "remaining_time": "0:07:21"}
|
| 107 |
+
{"current_steps": 107, "total_steps": 216, "loss": 0.2574, "lr": 5.965522982360441e-06, "epoch": 1.4792626728110598, "percentage": 49.54, "elapsed_time": "0:07:08", "remaining_time": "0:07:16"}
|
| 108 |
+
{"current_steps": 108, "total_steps": 216, "loss": 0.256, "lr": 5.885954957896115e-06, "epoch": 1.4930875576036866, "percentage": 50.0, "elapsed_time": "0:07:12", "remaining_time": "0:07:12"}
|
| 109 |
+
{"current_steps": 109, "total_steps": 216, "loss": 0.3367, "lr": 5.806154607098799e-06, "epoch": 1.5069124423963134, "percentage": 50.46, "elapsed_time": "0:07:15", "remaining_time": "0:07:07"}
|
| 110 |
+
{"current_steps": 110, "total_steps": 216, "loss": 0.2801, "lr": 5.726142856227453e-06, "epoch": 1.52073732718894, "percentage": 50.93, "elapsed_time": "0:07:19", "remaining_time": "0:07:03"}
|
| 111 |
+
{"current_steps": 111, "total_steps": 216, "loss": 0.2512, "lr": 5.645940686977033e-06, "epoch": 1.5345622119815667, "percentage": 51.39, "elapsed_time": "0:07:22", "remaining_time": "0:06:58"}
|
| 112 |
+
{"current_steps": 112, "total_steps": 216, "loss": 0.2938, "lr": 5.5655691309764225e-06, "epoch": 1.5483870967741935, "percentage": 51.85, "elapsed_time": "0:07:26", "remaining_time": "0:06:54"}
|
| 113 |
+
{"current_steps": 113, "total_steps": 216, "loss": 0.2598, "lr": 5.485049264273241e-06, "epoch": 1.5622119815668203, "percentage": 52.31, "elapsed_time": "0:07:29", "remaining_time": "0:06:49"}
|
| 114 |
+
{"current_steps": 114, "total_steps": 216, "loss": 0.2587, "lr": 5.404402201807022e-06, "epoch": 1.576036866359447, "percentage": 52.78, "elapsed_time": "0:07:32", "remaining_time": "0:06:45"}
|
| 115 |
+
{"current_steps": 115, "total_steps": 216, "loss": 0.2917, "lr": 5.323649091872179e-06, "epoch": 1.5898617511520738, "percentage": 53.24, "elapsed_time": "0:07:36", "remaining_time": "0:06:40"}
|
| 116 |
+
{"current_steps": 116, "total_steps": 216, "loss": 0.2357, "lr": 5.242811110572243e-06, "epoch": 1.6036866359447006, "percentage": 53.7, "elapsed_time": "0:07:39", "remaining_time": "0:06:36"}
|
| 117 |
+
{"current_steps": 117, "total_steps": 216, "loss": 0.2259, "lr": 5.161909456266781e-06, "epoch": 1.6175115207373272, "percentage": 54.17, "elapsed_time": "0:07:43", "remaining_time": "0:06:31"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7288
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a91811e6e07dfcc842e6192d8eeb61b5cea677543130cfcef6e39900b918e368
|
| 3 |
size 7288
|