furmaniak commited on
Commit
cdea671
·
verified ·
1 Parent(s): b21cb9b

Training in progress, step 160

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/home/ubuntu/austrailia-east-1/qwen2.5-32b-openalex-with-references",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
@@ -22,7 +22,7 @@
22
  "sliding_window": null,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
- "transformers_version": "4.48.2",
26
  "use_cache": false,
27
  "use_sliding_window": false,
28
  "vocab_size": 152064
 
1
  {
2
+ "_name_or_path": "saves/qwen2.5-32b/works_with_references/full/pretrain",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
 
22
  "sliding_window": null,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.48.1",
26
  "use_cache": false,
27
  "use_sliding_window": false,
28
  "vocab_size": 152064
model-00001-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:677b60ad699bcd4de5e10af829b798dc4f6d3098495a16d38f73585290d41ee6
3
  size 4891730992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:877072f5a264e787dc8592082e2fce6ea6e6e1c143552f92c6bf8c151ee5b013
3
  size 4891730992
model-00002-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22e633198fe910e369a88046da9f1c1661a958ff6dfb74eb14c39153b55723ac
3
  size 4876059352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25f283172b327b0a445dc1693bc479bd5dd1aed7060b51ad4c07f064ea5df135
3
  size 4876059352
model-00003-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e89177175035278987ad312e2f668cd7316869d75e5e9c399c96db80a38045bd
3
  size 4876059384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41b29a951313e48eeb0f47b665e70ee8bedabefa26753a9c56ed2fce99e8e5ba
3
  size 4876059384
model-00004-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87da12886695642c3a00b304f25c9d91f176d3918162aefcb32b698fbfea5e5a
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:064cad34d8e82023deab3e79bce08571d3a247e67d5786591f50b8bd620e4732
3
  size 4876059416
model-00005-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00cd4b9c25fc65176f186d3ba59835d1718a0ef22fdcbf8743a21ba35f184d66
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd24bd8575aec64aff272b25f913b3cc3157fa3bc01abd843f734cd5f1eb6bdc
3
  size 4876059416
model-00006-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1524d4a6b2f065a13ecf912181eff9f71945b47c90fa0dca363db593a8ba206e
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e16e4dc393145410b1ee9931c16ec7447ee7604982909717e0a9afecf706ec9
3
  size 4876059416
model-00007-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cfbfd85e71437246a483f75f127346fcfde37b968fa5e36b9e84bbf99e9981ca
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d640e57b3eeabe4c58699e7447cdf19bc209735a28eacbcc847d5b4ecc41051f
3
  size 4876059416
model-00008-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3f083df175876257ef065fb0a9f0886e9866b0d82640846c2d71a9b294fc147
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f89c9deb39bd117fb2f3d34a131c13c3125f85c6ddebeb10bc44e49c908afa37
3
  size 4876059416
model-00009-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e4da683440b5235f2c5891d0e6b935a9fd3a28d7ec2aa71904eae597edb5f88
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b550de694aaad02d9c9dc4fb59c626460e4c727178485e39159b9c4556e90e8f
3
  size 4876059416
model-00010-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1674954265076e1d9ebc019499666bafbb20b69cf250b90d21cae7f4bfd992aa
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8d2189bba0cbb2c8e7d74d1c68dd59feab7efc046f87fa8d6bedd01a7485bb3
3
  size 4876059416
model-00011-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d295dbd0850c131a6adb316337f927ff01278cd88dfb062676604dc60d124c4
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ceb92299df4228cd515535bb1d235ecf9b7a3eed049276e9360eff7ac2cfb73
3
  size 4876059416
model-00012-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35813b1bd5145a0e89ae74f8faff6ebc387d94904a1c42f6872e232f728575ea
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:673bc76909801acd9a009e46f999baa8bde4a93a9dc3f9e9d4d8a4dcfaef500a
3
  size 4876059416
model-00013-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9eec08c79bae1c755dcaeb79c045632ea08ac252e4390a45d4837c1d347e2a3
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7f6f5e398a5787483d79921c4aa5c06695feb6e86ab64feac0dc3d3d3218e53
3
  size 4876059416
model-00014-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9771d8e8a90577d769769b15a6356b36fb889612a275ee79b6319c7a66dcd01
3
  size 2123397800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59bae169e109e7ef444903026f9bc3b6b47542d3fe11bdaad3afc5cc13e92bc6
3
  size 2123397800
trainer_log.jsonl CHANGED
@@ -1,323 +1,161 @@
1
- {"current_steps": 1, "total_steps": 322, "loss": 1.0755, "lr": 9.090909090909091e-07, "epoch": 0.006177606177606178, "percentage": 0.31, "elapsed_time": "0:03:56", "remaining_time": "21:03:17"}
2
- {"current_steps": 2, "total_steps": 322, "loss": 1.0857, "lr": 1.8181818181818183e-06, "epoch": 0.012355212355212355, "percentage": 0.62, "elapsed_time": "0:07:36", "remaining_time": "20:16:03"}
3
- {"current_steps": 3, "total_steps": 322, "loss": 1.1084, "lr": 2.7272727272727272e-06, "epoch": 0.018532818532818532, "percentage": 0.93, "elapsed_time": "0:11:07", "remaining_time": "19:43:40"}
4
- {"current_steps": 4, "total_steps": 322, "loss": 1.1061, "lr": 3.6363636363636366e-06, "epoch": 0.02471042471042471, "percentage": 1.24, "elapsed_time": "0:14:38", "remaining_time": "19:23:49"}
5
- {"current_steps": 5, "total_steps": 322, "loss": 1.0937, "lr": 4.5454545454545455e-06, "epoch": 0.03088803088803089, "percentage": 1.55, "elapsed_time": "0:18:03", "remaining_time": "19:05:12"}
6
- {"current_steps": 6, "total_steps": 322, "loss": 1.0966, "lr": 5.4545454545454545e-06, "epoch": 0.037065637065637064, "percentage": 1.86, "elapsed_time": "0:21:33", "remaining_time": "18:55:29"}
7
- {"current_steps": 7, "total_steps": 322, "loss": 1.0934, "lr": 6.363636363636364e-06, "epoch": 0.043243243243243246, "percentage": 2.17, "elapsed_time": "0:25:00", "remaining_time": "18:45:42"}
8
- {"current_steps": 8, "total_steps": 322, "loss": 1.0964, "lr": 7.272727272727273e-06, "epoch": 0.04942084942084942, "percentage": 2.48, "elapsed_time": "0:28:26", "remaining_time": "18:36:39"}
9
- {"current_steps": 9, "total_steps": 322, "loss": 1.0973, "lr": 8.181818181818181e-06, "epoch": 0.055598455598455596, "percentage": 2.8, "elapsed_time": "0:31:54", "remaining_time": "18:29:44"}
10
- {"current_steps": 10, "total_steps": 322, "loss": 1.1073, "lr": 9.090909090909091e-06, "epoch": 0.06177606177606178, "percentage": 3.11, "elapsed_time": "0:35:25", "remaining_time": "18:25:01"}
11
- {"current_steps": 11, "total_steps": 322, "loss": 1.0966, "lr": 9.999999999999999e-06, "epoch": 0.06795366795366796, "percentage": 3.42, "elapsed_time": "0:38:52", "remaining_time": "18:19:00"}
12
- {"current_steps": 12, "total_steps": 322, "loss": 1.1103, "lr": 1.0909090909090909e-05, "epoch": 0.07413127413127413, "percentage": 3.73, "elapsed_time": "0:42:18", "remaining_time": "18:12:59"}
13
- {"current_steps": 13, "total_steps": 322, "loss": 1.1097, "lr": 1.1818181818181819e-05, "epoch": 0.08030888030888031, "percentage": 4.04, "elapsed_time": "0:45:43", "remaining_time": "18:06:55"}
14
- {"current_steps": 14, "total_steps": 322, "loss": 1.0925, "lr": 1.2727272727272728e-05, "epoch": 0.08648648648648649, "percentage": 4.35, "elapsed_time": "0:49:11", "remaining_time": "18:02:08"}
15
- {"current_steps": 15, "total_steps": 322, "loss": 1.1059, "lr": 1.3636363636363637e-05, "epoch": 0.09266409266409266, "percentage": 4.66, "elapsed_time": "0:52:36", "remaining_time": "17:56:47"}
16
- {"current_steps": 16, "total_steps": 322, "loss": 1.1083, "lr": 1.4545454545454546e-05, "epoch": 0.09884169884169884, "percentage": 4.97, "elapsed_time": "0:56:04", "remaining_time": "17:52:29"}
17
- {"current_steps": 17, "total_steps": 322, "loss": 1.1083, "lr": 1.5454545454545454e-05, "epoch": 0.10501930501930502, "percentage": 5.28, "elapsed_time": "0:59:30", "remaining_time": "17:47:39"}
18
- {"current_steps": 18, "total_steps": 322, "loss": 1.1248, "lr": 1.6363636363636363e-05, "epoch": 0.11119691119691119, "percentage": 5.59, "elapsed_time": "1:02:59", "remaining_time": "17:43:57"}
19
- {"current_steps": 19, "total_steps": 322, "loss": 1.0965, "lr": 1.7272727272727274e-05, "epoch": 0.11737451737451737, "percentage": 5.9, "elapsed_time": "1:06:30", "remaining_time": "17:40:45"}
20
- {"current_steps": 20, "total_steps": 322, "loss": 1.0973, "lr": 1.8181818181818182e-05, "epoch": 0.12355212355212356, "percentage": 6.21, "elapsed_time": "1:09:56", "remaining_time": "17:36:13"}
21
- {"current_steps": 21, "total_steps": 322, "loss": 1.0804, "lr": 1.909090909090909e-05, "epoch": 0.12972972972972974, "percentage": 6.52, "elapsed_time": "1:13:24", "remaining_time": "17:32:15"}
22
- {"current_steps": 22, "total_steps": 322, "loss": 1.0753, "lr": 1.9999999999999998e-05, "epoch": 0.13590733590733592, "percentage": 6.83, "elapsed_time": "1:16:53", "remaining_time": "17:28:37"}
23
- {"current_steps": 23, "total_steps": 322, "loss": 1.0767, "lr": 2.090909090909091e-05, "epoch": 0.14208494208494207, "percentage": 7.14, "elapsed_time": "1:20:22", "remaining_time": "17:24:49"}
24
- {"current_steps": 24, "total_steps": 322, "loss": 1.0918, "lr": 2.1818181818181818e-05, "epoch": 0.14826254826254825, "percentage": 7.45, "elapsed_time": "1:23:51", "remaining_time": "17:21:14"}
25
- {"current_steps": 25, "total_steps": 322, "loss": 1.1037, "lr": 2.272727272727273e-05, "epoch": 0.15444015444015444, "percentage": 7.76, "elapsed_time": "1:27:21", "remaining_time": "17:17:44"}
26
- {"current_steps": 26, "total_steps": 322, "loss": 1.0654, "lr": 2.3636363636363637e-05, "epoch": 0.16061776061776062, "percentage": 8.07, "elapsed_time": "1:30:50", "remaining_time": "17:14:12"}
27
- {"current_steps": 27, "total_steps": 322, "loss": 1.0809, "lr": 2.454545454545455e-05, "epoch": 0.1667953667953668, "percentage": 8.39, "elapsed_time": "1:34:18", "remaining_time": "17:10:23"}
28
- {"current_steps": 28, "total_steps": 322, "loss": 1.083, "lr": 2.5454545454545457e-05, "epoch": 0.17297297297297298, "percentage": 8.7, "elapsed_time": "1:37:46", "remaining_time": "17:06:37"}
29
- {"current_steps": 29, "total_steps": 322, "loss": 1.0775, "lr": 2.6363636363636365e-05, "epoch": 0.17915057915057914, "percentage": 9.01, "elapsed_time": "1:41:14", "remaining_time": "17:02:52"}
30
- {"current_steps": 30, "total_steps": 322, "loss": 1.0792, "lr": 2.7272727272727273e-05, "epoch": 0.18532818532818532, "percentage": 9.32, "elapsed_time": "1:44:43", "remaining_time": "16:59:22"}
31
- {"current_steps": 31, "total_steps": 322, "loss": 1.0849, "lr": 2.8181818181818185e-05, "epoch": 0.1915057915057915, "percentage": 9.63, "elapsed_time": "1:48:13", "remaining_time": "16:55:53"}
32
- {"current_steps": 32, "total_steps": 322, "loss": 1.0772, "lr": 2.9090909090909093e-05, "epoch": 0.19768339768339768, "percentage": 9.94, "elapsed_time": "1:51:45", "remaining_time": "16:52:44"}
33
- {"current_steps": 33, "total_steps": 322, "loss": 1.0653, "lr": 3e-05, "epoch": 0.20386100386100386, "percentage": 10.25, "elapsed_time": "1:55:12", "remaining_time": "16:48:57"}
34
- {"current_steps": 34, "total_steps": 322, "loss": 1.0933, "lr": 2.999911374020804e-05, "epoch": 0.21003861003861005, "percentage": 10.56, "elapsed_time": "1:58:43", "remaining_time": "16:45:43"}
35
- {"current_steps": 35, "total_steps": 322, "loss": 1.0891, "lr": 2.9996455065559676e-05, "epoch": 0.21621621621621623, "percentage": 10.87, "elapsed_time": "2:02:12", "remaining_time": "16:42:10"}
36
- {"current_steps": 36, "total_steps": 322, "loss": 1.0557, "lr": 2.9992024290225105e-05, "epoch": 0.22239382239382238, "percentage": 11.18, "elapsed_time": "2:05:41", "remaining_time": "16:38:29"}
37
- {"current_steps": 37, "total_steps": 322, "loss": 1.0762, "lr": 2.9985821937780067e-05, "epoch": 0.22857142857142856, "percentage": 11.49, "elapsed_time": "2:09:10", "remaining_time": "16:34:56"}
38
- {"current_steps": 38, "total_steps": 322, "loss": 1.0742, "lr": 2.997784874114397e-05, "epoch": 0.23474903474903475, "percentage": 11.8, "elapsed_time": "2:12:39", "remaining_time": "16:31:27"}
39
- {"current_steps": 39, "total_steps": 322, "loss": 1.0968, "lr": 2.9968105642493287e-05, "epoch": 0.24092664092664093, "percentage": 12.11, "elapsed_time": "2:16:11", "remaining_time": "16:28:13"}
40
- {"current_steps": 40, "total_steps": 322, "loss": 1.081, "lr": 2.9956593793150235e-05, "epoch": 0.2471042471042471, "percentage": 12.42, "elapsed_time": "2:19:38", "remaining_time": "16:24:31"}
41
- {"current_steps": 41, "total_steps": 322, "loss": 1.0727, "lr": 2.994331455344671e-05, "epoch": 0.25328185328185326, "percentage": 12.73, "elapsed_time": "2:23:06", "remaining_time": "16:20:48"}
42
- {"current_steps": 42, "total_steps": 322, "loss": 1.0614, "lr": 2.992826949256354e-05, "epoch": 0.2594594594594595, "percentage": 13.04, "elapsed_time": "2:26:37", "remaining_time": "16:17:28"}
43
- {"current_steps": 43, "total_steps": 322, "loss": 1.0631, "lr": 2.9911460388345057e-05, "epoch": 0.26563706563706563, "percentage": 13.35, "elapsed_time": "2:30:06", "remaining_time": "16:13:59"}
44
- {"current_steps": 44, "total_steps": 322, "loss": 1.0662, "lr": 2.9892889227089025e-05, "epoch": 0.27181467181467184, "percentage": 13.66, "elapsed_time": "2:33:36", "remaining_time": "16:10:31"}
45
- {"current_steps": 45, "total_steps": 322, "loss": 1.0725, "lr": 2.9872558203311913e-05, "epoch": 0.277992277992278, "percentage": 13.98, "elapsed_time": "2:37:02", "remaining_time": "16:06:40"}
46
- {"current_steps": 46, "total_steps": 322, "loss": 1.085, "lr": 2.9850469719489576e-05, "epoch": 0.28416988416988415, "percentage": 14.29, "elapsed_time": "2:40:30", "remaining_time": "16:03:02"}
47
- {"current_steps": 47, "total_steps": 322, "loss": 1.0585, "lr": 2.9826626385773358e-05, "epoch": 0.29034749034749036, "percentage": 14.6, "elapsed_time": "2:43:58", "remaining_time": "15:59:27"}
48
- {"current_steps": 48, "total_steps": 322, "loss": 1.0599, "lr": 2.980103101968165e-05, "epoch": 0.2965250965250965, "percentage": 14.91, "elapsed_time": "2:47:25", "remaining_time": "15:55:42"}
49
- {"current_steps": 49, "total_steps": 322, "loss": 1.0696, "lr": 2.9773686645766963e-05, "epoch": 0.3027027027027027, "percentage": 15.22, "elapsed_time": "2:50:53", "remaining_time": "15:52:07"}
50
- {"current_steps": 50, "total_steps": 322, "loss": 1.0967, "lr": 2.974459649525853e-05, "epoch": 0.3088803088803089, "percentage": 15.53, "elapsed_time": "2:54:23", "remaining_time": "15:48:40"}
51
- {"current_steps": 51, "total_steps": 322, "loss": 1.0644, "lr": 2.9713764005680428e-05, "epoch": 0.3150579150579151, "percentage": 15.84, "elapsed_time": "2:57:52", "remaining_time": "15:45:08"}
52
- {"current_steps": 52, "total_steps": 322, "loss": 1.0761, "lr": 2.9681192820445445e-05, "epoch": 0.32123552123552124, "percentage": 16.15, "elapsed_time": "3:01:21", "remaining_time": "15:41:39"}
53
- {"current_steps": 53, "total_steps": 322, "loss": 1.0553, "lr": 2.964688678842449e-05, "epoch": 0.3274131274131274, "percentage": 16.46, "elapsed_time": "3:04:53", "remaining_time": "15:38:25"}
54
- {"current_steps": 54, "total_steps": 322, "loss": 1.0567, "lr": 2.96108499634918e-05, "epoch": 0.3335907335907336, "percentage": 16.77, "elapsed_time": "3:08:22", "remaining_time": "15:34:54"}
55
- {"current_steps": 55, "total_steps": 322, "loss": 1.0698, "lr": 2.9573086604045908e-05, "epoch": 0.33976833976833976, "percentage": 17.08, "elapsed_time": "3:11:48", "remaining_time": "15:31:08"}
56
- {"current_steps": 56, "total_steps": 322, "loss": 1.0617, "lr": 2.953360117250643e-05, "epoch": 0.34594594594594597, "percentage": 17.39, "elapsed_time": "3:15:15", "remaining_time": "15:27:30"}
57
- {"current_steps": 57, "total_steps": 322, "loss": 1.0529, "lr": 2.9492398334786734e-05, "epoch": 0.3521235521235521, "percentage": 17.7, "elapsed_time": "3:18:48", "remaining_time": "15:24:17"}
58
- {"current_steps": 58, "total_steps": 322, "loss": 1.0608, "lr": 2.944948295974261e-05, "epoch": 0.3583011583011583, "percentage": 18.01, "elapsed_time": "3:22:13", "remaining_time": "15:20:29"}
59
- {"current_steps": 59, "total_steps": 322, "loss": 1.0676, "lr": 2.9404860118596906e-05, "epoch": 0.3644787644787645, "percentage": 18.32, "elapsed_time": "3:25:44", "remaining_time": "15:17:05"}
60
- {"current_steps": 60, "total_steps": 322, "loss": 1.0632, "lr": 2.935853508434028e-05, "epoch": 0.37065637065637064, "percentage": 18.63, "elapsed_time": "3:29:09", "remaining_time": "15:13:20"}
61
- {"current_steps": 61, "total_steps": 322, "loss": 1.0612, "lr": 2.931051333110809e-05, "epoch": 0.37683397683397685, "percentage": 18.94, "elapsed_time": "3:32:34", "remaining_time": "15:09:31"}
62
- {"current_steps": 62, "total_steps": 322, "loss": 1.0384, "lr": 2.9260800533533537e-05, "epoch": 0.383011583011583, "percentage": 19.25, "elapsed_time": "3:35:58", "remaining_time": "15:05:43"}
63
- {"current_steps": 63, "total_steps": 322, "loss": 1.0472, "lr": 2.9209402566077113e-05, "epoch": 0.3891891891891892, "percentage": 19.57, "elapsed_time": "3:39:24", "remaining_time": "15:01:59"}
64
- {"current_steps": 64, "total_steps": 322, "loss": 1.0409, "lr": 2.9156325502332414e-05, "epoch": 0.39536679536679536, "percentage": 19.88, "elapsed_time": "3:42:54", "remaining_time": "14:58:37"}
65
- {"current_steps": 65, "total_steps": 322, "loss": 1.053, "lr": 2.9101575614308423e-05, "epoch": 0.4015444015444015, "percentage": 20.19, "elapsed_time": "3:46:22", "remaining_time": "14:55:03"}
66
- {"current_steps": 66, "total_steps": 322, "loss": 1.0589, "lr": 2.9045159371688403e-05, "epoch": 0.40772200772200773, "percentage": 20.5, "elapsed_time": "3:49:50", "remaining_time": "14:51:30"}
67
- {"current_steps": 67, "total_steps": 322, "loss": 1.0538, "lr": 2.8987083441065335e-05, "epoch": 0.4138996138996139, "percentage": 20.81, "elapsed_time": "3:53:16", "remaining_time": "14:47:50"}
68
- {"current_steps": 68, "total_steps": 322, "loss": 1.0505, "lr": 2.8927354685154188e-05, "epoch": 0.4200772200772201, "percentage": 21.12, "elapsed_time": "3:56:43", "remaining_time": "14:44:14"}
69
- {"current_steps": 69, "total_steps": 322, "loss": 1.0306, "lr": 2.8865980161980933e-05, "epoch": 0.42625482625482625, "percentage": 21.43, "elapsed_time": "4:00:13", "remaining_time": "14:40:50"}
70
- {"current_steps": 70, "total_steps": 322, "loss": 1.0506, "lr": 2.8802967124048512e-05, "epoch": 0.43243243243243246, "percentage": 21.74, "elapsed_time": "4:03:41", "remaining_time": "14:37:18"}
71
- {"current_steps": 71, "total_steps": 322, "loss": 1.0482, "lr": 2.873832301747985e-05, "epoch": 0.4386100386100386, "percentage": 22.05, "elapsed_time": "4:07:09", "remaining_time": "14:33:45"}
72
- {"current_steps": 72, "total_steps": 322, "loss": 1.0415, "lr": 2.867205548113794e-05, "epoch": 0.44478764478764476, "percentage": 22.36, "elapsed_time": "4:10:36", "remaining_time": "14:30:10"}
73
- {"current_steps": 73, "total_steps": 322, "loss": 1.0508, "lr": 2.860417234572318e-05, "epoch": 0.450965250965251, "percentage": 22.67, "elapsed_time": "4:14:07", "remaining_time": "14:26:48"}
74
- {"current_steps": 74, "total_steps": 322, "loss": 1.0512, "lr": 2.8534681632848027e-05, "epoch": 0.45714285714285713, "percentage": 22.98, "elapsed_time": "4:17:33", "remaining_time": "14:23:09"}
75
- {"current_steps": 75, "total_steps": 322, "loss": 1.0583, "lr": 2.8463591554089115e-05, "epoch": 0.46332046332046334, "percentage": 23.29, "elapsed_time": "4:20:58", "remaining_time": "14:19:27"}
76
- {"current_steps": 76, "total_steps": 322, "loss": 1.0306, "lr": 2.8390910510016898e-05, "epoch": 0.4694980694980695, "percentage": 23.6, "elapsed_time": "4:24:26", "remaining_time": "14:15:58"}
77
- {"current_steps": 77, "total_steps": 322, "loss": 1.0478, "lr": 2.831664708920298e-05, "epoch": 0.4756756756756757, "percentage": 23.91, "elapsed_time": "4:27:55", "remaining_time": "14:12:29"}
78
- {"current_steps": 78, "total_steps": 322, "loss": 1.0305, "lr": 2.8240810067205207e-05, "epoch": 0.48185328185328186, "percentage": 24.22, "elapsed_time": "4:31:24", "remaining_time": "14:09:00"}
79
- {"current_steps": 79, "total_steps": 322, "loss": 1.0542, "lr": 2.8163408405530692e-05, "epoch": 0.488030888030888, "percentage": 24.53, "elapsed_time": "4:34:54", "remaining_time": "14:05:34"}
80
- {"current_steps": 80, "total_steps": 322, "loss": 1.0293, "lr": 2.8084451250576847e-05, "epoch": 0.4942084942084942, "percentage": 24.84, "elapsed_time": "4:38:22", "remaining_time": "14:02:06"}
81
- {"current_steps": 81, "total_steps": 322, "loss": 1.0445, "lr": 2.8003947932550566e-05, "epoch": 0.5003861003861004, "percentage": 25.16, "elapsed_time": "4:41:48", "remaining_time": "13:58:28"}
82
- {"current_steps": 82, "total_steps": 322, "loss": 1.0491, "lr": 2.7921907964365703e-05, "epoch": 0.5065637065637065, "percentage": 25.47, "elapsed_time": "4:45:16", "remaining_time": "13:54:56"}
83
- {"current_steps": 83, "total_steps": 322, "loss": 1.048, "lr": 2.783834104051894e-05, "epoch": 0.5127413127413127, "percentage": 25.78, "elapsed_time": "4:48:45", "remaining_time": "13:51:29"}
84
- {"current_steps": 84, "total_steps": 322, "loss": 1.0354, "lr": 2.7753257035944216e-05, "epoch": 0.518918918918919, "percentage": 26.09, "elapsed_time": "4:52:17", "remaining_time": "13:48:08"}
85
- {"current_steps": 85, "total_steps": 322, "loss": 1.032, "lr": 2.7666666004845826e-05, "epoch": 0.525096525096525, "percentage": 26.4, "elapsed_time": "4:55:47", "remaining_time": "13:44:44"}
86
- {"current_steps": 86, "total_steps": 322, "loss": 1.0264, "lr": 2.7578578179510324e-05, "epoch": 0.5312741312741313, "percentage": 26.71, "elapsed_time": "4:59:13", "remaining_time": "13:41:09"}
87
- {"current_steps": 87, "total_steps": 322, "loss": 1.0319, "lr": 2.748900396909742e-05, "epoch": 0.5374517374517375, "percentage": 27.02, "elapsed_time": "5:02:42", "remaining_time": "13:37:40"}
88
- {"current_steps": 88, "total_steps": 322, "loss": 1.0396, "lr": 2.7397953958409925e-05, "epoch": 0.5436293436293437, "percentage": 27.33, "elapsed_time": "5:06:12", "remaining_time": "13:34:14"}
89
- {"current_steps": 89, "total_steps": 322, "loss": 1.0298, "lr": 2.730543890664297e-05, "epoch": 0.5498069498069498, "percentage": 27.64, "elapsed_time": "5:09:43", "remaining_time": "13:30:51"}
90
- {"current_steps": 90, "total_steps": 322, "loss": 1.0362, "lr": 2.7211469746112628e-05, "epoch": 0.555984555984556, "percentage": 27.95, "elapsed_time": "5:13:09", "remaining_time": "13:27:15"}
91
- {"current_steps": 91, "total_steps": 322, "loss": 1.0236, "lr": 2.711605758096406e-05, "epoch": 0.5621621621621622, "percentage": 28.26, "elapsed_time": "5:16:36", "remaining_time": "13:23:41"}
92
- {"current_steps": 92, "total_steps": 322, "loss": 1.0242, "lr": 2.7019213685859345e-05, "epoch": 0.5683397683397683, "percentage": 28.57, "elapsed_time": "5:20:02", "remaining_time": "13:20:06"}
93
- {"current_steps": 93, "total_steps": 322, "loss": 1.0205, "lr": 2.692094950464519e-05, "epoch": 0.5745173745173745, "percentage": 28.88, "elapsed_time": "5:23:31", "remaining_time": "13:16:38"}
94
- {"current_steps": 94, "total_steps": 322, "loss": 1.0311, "lr": 2.6821276649000643e-05, "epoch": 0.5806949806949807, "percentage": 29.19, "elapsed_time": "5:26:58", "remaining_time": "13:13:05"}
95
- {"current_steps": 95, "total_steps": 322, "loss": 1.0479, "lr": 2.6720206897064936e-05, "epoch": 0.5868725868725869, "percentage": 29.5, "elapsed_time": "5:30:24", "remaining_time": "13:09:29"}
96
- {"current_steps": 96, "total_steps": 322, "loss": 1.0384, "lr": 2.6617752192045723e-05, "epoch": 0.593050193050193, "percentage": 29.81, "elapsed_time": "5:33:52", "remaining_time": "13:06:00"}
97
- {"current_steps": 97, "total_steps": 322, "loss": 1.0388, "lr": 2.651392464080774e-05, "epoch": 0.5992277992277992, "percentage": 30.12, "elapsed_time": "5:37:18", "remaining_time": "13:02:23"}
98
- {"current_steps": 98, "total_steps": 322, "loss": 1.039, "lr": 2.640873651244218e-05, "epoch": 0.6054054054054054, "percentage": 30.43, "elapsed_time": "5:40:45", "remaining_time": "12:58:52"}
99
- {"current_steps": 99, "total_steps": 322, "loss": 1.0073, "lr": 2.6302200236816877e-05, "epoch": 0.6115830115830115, "percentage": 30.75, "elapsed_time": "5:44:17", "remaining_time": "12:55:32"}
100
- {"current_steps": 100, "total_steps": 322, "loss": 1.0123, "lr": 2.6194328403107493e-05, "epoch": 0.6177606177606177, "percentage": 31.06, "elapsed_time": "5:47:47", "remaining_time": "12:52:05"}
101
- {"current_steps": 101, "total_steps": 322, "loss": 1.0198, "lr": 2.6085133758309887e-05, "epoch": 0.623938223938224, "percentage": 31.37, "elapsed_time": "5:57:44", "remaining_time": "13:02:46"}
102
- {"current_steps": 102, "total_steps": 322, "loss": 1.0277, "lr": 2.5974629205733813e-05, "epoch": 0.6301158301158302, "percentage": 31.68, "elapsed_time": "6:01:13", "remaining_time": "12:59:07"}
103
- {"current_steps": 103, "total_steps": 322, "loss": 1.0194, "lr": 2.586282780347818e-05, "epoch": 0.6362934362934363, "percentage": 31.99, "elapsed_time": "6:04:40", "remaining_time": "12:55:21"}
104
- {"current_steps": 104, "total_steps": 322, "loss": 1.0079, "lr": 2.574974276288798e-05, "epoch": 0.6424710424710425, "percentage": 32.3, "elapsed_time": "6:08:08", "remaining_time": "12:51:40"}
105
- {"current_steps": 105, "total_steps": 322, "loss": 1.0161, "lr": 2.5635387446993157e-05, "epoch": 0.6486486486486487, "percentage": 32.61, "elapsed_time": "6:11:36", "remaining_time": "12:48:00"}
106
- {"current_steps": 106, "total_steps": 322, "loss": 1.008, "lr": 2.551977536892951e-05, "epoch": 0.6548262548262548, "percentage": 32.92, "elapsed_time": "6:15:02", "remaining_time": "12:44:14"}
107
- {"current_steps": 107, "total_steps": 322, "loss": 1.0102, "lr": 2.5402920190341864e-05, "epoch": 0.661003861003861, "percentage": 33.23, "elapsed_time": "6:18:33", "remaining_time": "12:40:39"}
108
- {"current_steps": 108, "total_steps": 322, "loss": 0.9876, "lr": 2.5284835719769735e-05, "epoch": 0.6671814671814672, "percentage": 33.54, "elapsed_time": "6:22:03", "remaining_time": "12:37:01"}
109
- {"current_steps": 109, "total_steps": 322, "loss": 1.0081, "lr": 2.516553591101555e-05, "epoch": 0.6733590733590734, "percentage": 33.85, "elapsed_time": "6:25:29", "remaining_time": "12:33:17"}
110
- {"current_steps": 110, "total_steps": 322, "loss": 1.0087, "lr": 2.5045034861495816e-05, "epoch": 0.6795366795366795, "percentage": 34.16, "elapsed_time": "6:28:54", "remaining_time": "12:29:32"}
111
- {"current_steps": 111, "total_steps": 322, "loss": 1.0135, "lr": 2.4923346810575197e-05, "epoch": 0.6857142857142857, "percentage": 34.47, "elapsed_time": "6:32:22", "remaining_time": "12:25:51"}
112
- {"current_steps": 112, "total_steps": 322, "loss": 1.018, "lr": 2.480048613788393e-05, "epoch": 0.6918918918918919, "percentage": 34.78, "elapsed_time": "6:35:50", "remaining_time": "12:22:12"}
113
- {"current_steps": 113, "total_steps": 322, "loss": 1.0104, "lr": 2.4676467361618565e-05, "epoch": 0.698069498069498, "percentage": 35.09, "elapsed_time": "6:39:21", "remaining_time": "12:18:38"}
114
- {"current_steps": 114, "total_steps": 322, "loss": 1.0211, "lr": 2.4551305136826426e-05, "epoch": 0.7042471042471042, "percentage": 35.4, "elapsed_time": "6:42:50", "remaining_time": "12:15:01"}
115
- {"current_steps": 115, "total_steps": 322, "loss": 1.0235, "lr": 2.4425014253673824e-05, "epoch": 0.7104247104247104, "percentage": 35.71, "elapsed_time": "6:46:19", "remaining_time": "12:11:23"}
116
- {"current_steps": 116, "total_steps": 322, "loss": 1.0089, "lr": 2.4297609635698322e-05, "epoch": 0.7166023166023165, "percentage": 36.02, "elapsed_time": "6:49:49", "remaining_time": "12:07:47"}
117
- {"current_steps": 117, "total_steps": 322, "loss": 1.0079, "lr": 2.416910633804529e-05, "epoch": 0.7227799227799228, "percentage": 36.34, "elapsed_time": "6:53:18", "remaining_time": "12:04:11"}
118
- {"current_steps": 118, "total_steps": 322, "loss": 1.0211, "lr": 2.4039519545688848e-05, "epoch": 0.728957528957529, "percentage": 36.65, "elapsed_time": "6:56:47", "remaining_time": "12:00:33"}
119
- {"current_steps": 119, "total_steps": 322, "loss": 1.0216, "lr": 2.3908864571637466e-05, "epoch": 0.7351351351351352, "percentage": 36.96, "elapsed_time": "7:00:16", "remaining_time": "11:56:57"}
120
- {"current_steps": 120, "total_steps": 322, "loss": 1.0082, "lr": 2.377715685512451e-05, "epoch": 0.7413127413127413, "percentage": 37.27, "elapsed_time": "7:03:46", "remaining_time": "11:53:20"}
121
- {"current_steps": 121, "total_steps": 322, "loss": 1.0163, "lr": 2.3644411959783753e-05, "epoch": 0.7474903474903475, "percentage": 37.58, "elapsed_time": "7:07:13", "remaining_time": "11:49:41"}
122
- {"current_steps": 122, "total_steps": 322, "loss": 1.0021, "lr": 2.3510645571810318e-05, "epoch": 0.7536679536679537, "percentage": 37.89, "elapsed_time": "7:10:39", "remaining_time": "11:45:59"}
123
- {"current_steps": 123, "total_steps": 322, "loss": 0.9861, "lr": 2.337587349810703e-05, "epoch": 0.7598455598455598, "percentage": 38.2, "elapsed_time": "7:14:06", "remaining_time": "11:42:19"}
124
- {"current_steps": 124, "total_steps": 322, "loss": 1.0104, "lr": 2.3240111664416545e-05, "epoch": 0.766023166023166, "percentage": 38.51, "elapsed_time": "7:17:35", "remaining_time": "11:38:43"}
125
- {"current_steps": 125, "total_steps": 322, "loss": 1.0108, "lr": 2.3103376113439474e-05, "epoch": 0.7722007722007722, "percentage": 38.82, "elapsed_time": "7:21:01", "remaining_time": "11:35:02"}
126
- {"current_steps": 126, "total_steps": 322, "loss": 1.0136, "lr": 2.29656830029386e-05, "epoch": 0.7783783783783784, "percentage": 39.13, "elapsed_time": "7:24:31", "remaining_time": "11:31:28"}
127
- {"current_steps": 127, "total_steps": 322, "loss": 1.0037, "lr": 2.28270486038296e-05, "epoch": 0.7845559845559845, "percentage": 39.44, "elapsed_time": "7:27:58", "remaining_time": "11:27:49"}
128
- {"current_steps": 128, "total_steps": 322, "loss": 0.9893, "lr": 2.2687489298258284e-05, "epoch": 0.7907335907335907, "percentage": 39.75, "elapsed_time": "7:31:26", "remaining_time": "11:24:12"}
129
- {"current_steps": 129, "total_steps": 322, "loss": 0.993, "lr": 2.254702157766482e-05, "epoch": 0.7969111969111969, "percentage": 40.06, "elapsed_time": "7:34:52", "remaining_time": "11:20:32"}
130
- {"current_steps": 130, "total_steps": 322, "loss": 0.9973, "lr": 2.2405662040834897e-05, "epoch": 0.803088803088803, "percentage": 40.37, "elapsed_time": "7:38:20", "remaining_time": "11:16:56"}
131
- {"current_steps": 131, "total_steps": 322, "loss": 0.9992, "lr": 2.2263427391938362e-05, "epoch": 0.8092664092664092, "percentage": 40.68, "elapsed_time": "7:41:48", "remaining_time": "11:13:19"}
132
- {"current_steps": 132, "total_steps": 322, "loss": 0.9943, "lr": 2.212033443855525e-05, "epoch": 0.8154440154440155, "percentage": 40.99, "elapsed_time": "7:45:19", "remaining_time": "11:09:47"}
133
- {"current_steps": 133, "total_steps": 322, "loss": 1.009, "lr": 2.1976400089689712e-05, "epoch": 0.8216216216216217, "percentage": 41.3, "elapsed_time": "7:48:47", "remaining_time": "11:06:10"}
134
- {"current_steps": 134, "total_steps": 322, "loss": 1.0021, "lr": 2.1831641353771887e-05, "epoch": 0.8277992277992278, "percentage": 41.61, "elapsed_time": "7:52:14", "remaining_time": "11:02:33"}
135
- {"current_steps": 135, "total_steps": 322, "loss": 1.026, "lr": 2.1686075336648075e-05, "epoch": 0.833976833976834, "percentage": 41.93, "elapsed_time": "7:55:43", "remaining_time": "10:58:58"}
136
- {"current_steps": 136, "total_steps": 322, "loss": 1.0069, "lr": 2.153971923955934e-05, "epoch": 0.8401544401544402, "percentage": 42.24, "elapsed_time": "7:59:11", "remaining_time": "10:55:21"}
137
- {"current_steps": 137, "total_steps": 322, "loss": 0.9936, "lr": 2.1392590357108906e-05, "epoch": 0.8463320463320463, "percentage": 42.55, "elapsed_time": "8:02:38", "remaining_time": "10:51:44"}
138
- {"current_steps": 138, "total_steps": 322, "loss": 0.9969, "lr": 2.1244706075218474e-05, "epoch": 0.8525096525096525, "percentage": 42.86, "elapsed_time": "8:06:08", "remaining_time": "10:48:11"}
139
- {"current_steps": 139, "total_steps": 322, "loss": 0.9924, "lr": 2.1096083869073767e-05, "epoch": 0.8586872586872587, "percentage": 43.17, "elapsed_time": "8:09:37", "remaining_time": "10:44:36"}
140
- {"current_steps": 140, "total_steps": 322, "loss": 1.0021, "lr": 2.0946741301059517e-05, "epoch": 0.8648648648648649, "percentage": 43.48, "elapsed_time": "8:13:08", "remaining_time": "10:41:04"}
141
- {"current_steps": 141, "total_steps": 322, "loss": 0.9928, "lr": 2.0796696018684154e-05, "epoch": 0.871042471042471, "percentage": 43.79, "elapsed_time": "8:16:33", "remaining_time": "10:37:26"}
142
- {"current_steps": 142, "total_steps": 322, "loss": 1.0013, "lr": 2.0645965752494447e-05, "epoch": 0.8772200772200772, "percentage": 44.1, "elapsed_time": "8:20:00", "remaining_time": "10:33:48"}
143
- {"current_steps": 143, "total_steps": 322, "loss": 1.0047, "lr": 2.049456831398031e-05, "epoch": 0.8833976833976834, "percentage": 44.41, "elapsed_time": "8:23:27", "remaining_time": "10:30:12"}
144
- {"current_steps": 144, "total_steps": 322, "loss": 0.995, "lr": 2.0342521593470055e-05, "epoch": 0.8895752895752895, "percentage": 44.72, "elapsed_time": "8:26:57", "remaining_time": "10:26:38"}
145
- {"current_steps": 145, "total_steps": 322, "loss": 0.9908, "lr": 2.018984355801634e-05, "epoch": 0.8957528957528957, "percentage": 45.03, "elapsed_time": "8:30:29", "remaining_time": "10:23:09"}
146
- {"current_steps": 146, "total_steps": 322, "loss": 0.9874, "lr": 2.0036552249273017e-05, "epoch": 0.901930501930502, "percentage": 45.34, "elapsed_time": "8:33:58", "remaining_time": "10:19:35"}
147
- {"current_steps": 147, "total_steps": 322, "loss": 0.9996, "lr": 1.988266578136321e-05, "epoch": 0.9081081081081082, "percentage": 45.65, "elapsed_time": "8:37:24", "remaining_time": "10:15:57"}
148
- {"current_steps": 148, "total_steps": 322, "loss": 0.9861, "lr": 1.9728202338738786e-05, "epoch": 0.9142857142857143, "percentage": 45.96, "elapsed_time": "8:40:52", "remaining_time": "10:12:23"}
149
- {"current_steps": 149, "total_steps": 322, "loss": 0.9723, "lr": 1.9573180174031558e-05, "epoch": 0.9204633204633205, "percentage": 46.27, "elapsed_time": "8:44:19", "remaining_time": "10:08:47"}
150
- {"current_steps": 150, "total_steps": 322, "loss": 0.9837, "lr": 1.941761760589637e-05, "epoch": 0.9266409266409267, "percentage": 46.58, "elapsed_time": "8:47:50", "remaining_time": "10:05:14"}
151
- {"current_steps": 151, "total_steps": 322, "loss": 0.9941, "lr": 1.926153301684647e-05, "epoch": 0.9328185328185328, "percentage": 46.89, "elapsed_time": "8:51:14", "remaining_time": "10:01:36"}
152
- {"current_steps": 152, "total_steps": 322, "loss": 0.9776, "lr": 1.9104944851081247e-05, "epoch": 0.938996138996139, "percentage": 47.2, "elapsed_time": "8:54:39", "remaining_time": "9:57:58"}
153
- {"current_steps": 153, "total_steps": 322, "loss": 0.9997, "lr": 1.8947871612306724e-05, "epoch": 0.9451737451737452, "percentage": 47.52, "elapsed_time": "8:58:11", "remaining_time": "9:54:28"}
154
- {"current_steps": 154, "total_steps": 322, "loss": 0.9867, "lr": 1.8790331861549025e-05, "epoch": 0.9513513513513514, "percentage": 47.83, "elapsed_time": "9:01:38", "remaining_time": "9:50:52"}
155
- {"current_steps": 155, "total_steps": 322, "loss": 0.967, "lr": 1.863234421496105e-05, "epoch": 0.9575289575289575, "percentage": 48.14, "elapsed_time": "9:05:04", "remaining_time": "9:47:16"}
156
- {"current_steps": 156, "total_steps": 322, "loss": 0.977, "lr": 1.8473927341622628e-05, "epoch": 0.9637065637065637, "percentage": 48.45, "elapsed_time": "9:08:32", "remaining_time": "9:43:42"}
157
- {"current_steps": 157, "total_steps": 322, "loss": 0.9771, "lr": 1.831509996133447e-05, "epoch": 0.9698841698841699, "percentage": 48.76, "elapsed_time": "9:11:58", "remaining_time": "9:40:06"}
158
- {"current_steps": 158, "total_steps": 322, "loss": 0.9936, "lr": 1.8155880842406042e-05, "epoch": 0.976061776061776, "percentage": 49.07, "elapsed_time": "9:15:24", "remaining_time": "9:36:29"}
159
- {"current_steps": 159, "total_steps": 322, "loss": 0.9914, "lr": 1.7996288799437762e-05, "epoch": 0.9822393822393822, "percentage": 49.38, "elapsed_time": "9:18:50", "remaining_time": "9:32:54"}
160
- {"current_steps": 160, "total_steps": 322, "loss": 0.9961, "lr": 1.7836342691097745e-05, "epoch": 0.9884169884169884, "percentage": 49.69, "elapsed_time": "9:22:19", "remaining_time": "9:29:20"}
161
- {"current_steps": 161, "total_steps": 322, "loss": 0.9809, "lr": 1.7676061417893278e-05, "epoch": 0.9945945945945946, "percentage": 50.0, "elapsed_time": "9:25:46", "remaining_time": "9:25:46"}
162
- {"current_steps": 162, "total_steps": 322, "loss": 1.9052, "lr": 1.7515463919937416e-05, "epoch": 1.0061776061776062, "percentage": 50.31, "elapsed_time": "9:29:38", "remaining_time": "9:22:36"}
163
- {"current_steps": 163, "total_steps": 322, "loss": 0.8504, "lr": 1.735456917471084e-05, "epoch": 1.0123552123552124, "percentage": 50.62, "elapsed_time": "9:33:08", "remaining_time": "9:19:04"}
164
- {"current_steps": 164, "total_steps": 322, "loss": 0.8583, "lr": 1.7193396194819332e-05, "epoch": 1.0185328185328186, "percentage": 50.93, "elapsed_time": "9:36:35", "remaining_time": "9:15:30"}
165
- {"current_steps": 165, "total_steps": 322, "loss": 0.8515, "lr": 1.703196402574712e-05, "epoch": 1.0247104247104246, "percentage": 51.24, "elapsed_time": "9:40:06", "remaining_time": "9:11:59"}
166
- {"current_steps": 166, "total_steps": 322, "loss": 0.8551, "lr": 1.6870291743606273e-05, "epoch": 1.0308880308880308, "percentage": 51.55, "elapsed_time": "9:43:36", "remaining_time": "9:08:26"}
167
- {"current_steps": 167, "total_steps": 322, "loss": 0.8667, "lr": 1.6708398452882552e-05, "epoch": 1.037065637065637, "percentage": 51.86, "elapsed_time": "9:47:02", "remaining_time": "9:04:51"}
168
- {"current_steps": 168, "total_steps": 322, "loss": 0.8531, "lr": 1.654630328417784e-05, "epoch": 1.0432432432432432, "percentage": 52.17, "elapsed_time": "9:50:27", "remaining_time": "9:01:14"}
169
- {"current_steps": 169, "total_steps": 322, "loss": 0.8642, "lr": 1.638402539194953e-05, "epoch": 1.0494208494208495, "percentage": 52.48, "elapsed_time": "9:53:52", "remaining_time": "8:57:38"}
170
- {"current_steps": 170, "total_steps": 322, "loss": 0.8718, "lr": 1.6221583952247098e-05, "epoch": 1.0555984555984557, "percentage": 52.8, "elapsed_time": "9:57:17", "remaining_time": "8:54:02"}
171
- {"current_steps": 171, "total_steps": 322, "loss": 0.8623, "lr": 1.605899816044608e-05, "epoch": 1.0617760617760619, "percentage": 53.11, "elapsed_time": "10:00:41", "remaining_time": "8:50:26"}
172
- {"current_steps": 172, "total_steps": 322, "loss": 0.8547, "lr": 1.589628722897982e-05, "epoch": 1.0679536679536679, "percentage": 53.42, "elapsed_time": "10:04:07", "remaining_time": "8:46:51"}
173
- {"current_steps": 173, "total_steps": 322, "loss": 0.8752, "lr": 1.5733470385069142e-05, "epoch": 1.074131274131274, "percentage": 53.73, "elapsed_time": "10:07:36", "remaining_time": "8:43:18"}
174
- {"current_steps": 174, "total_steps": 322, "loss": 0.8529, "lr": 1.5570566868450345e-05, "epoch": 1.0803088803088803, "percentage": 54.04, "elapsed_time": "10:11:04", "remaining_time": "8:39:45"}
175
- {"current_steps": 175, "total_steps": 322, "loss": 0.8453, "lr": 1.540759592910167e-05, "epoch": 1.0864864864864865, "percentage": 54.35, "elapsed_time": "10:14:35", "remaining_time": "8:36:15"}
176
- {"current_steps": 176, "total_steps": 322, "loss": 0.8521, "lr": 1.5244576824968541e-05, "epoch": 1.0926640926640927, "percentage": 54.66, "elapsed_time": "10:18:03", "remaining_time": "8:32:42"}
177
- {"current_steps": 177, "total_steps": 322, "loss": 0.8573, "lr": 1.5081528819687952e-05, "epoch": 1.098841698841699, "percentage": 54.97, "elapsed_time": "10:21:29", "remaining_time": "8:29:08"}
178
- {"current_steps": 178, "total_steps": 322, "loss": 0.8694, "lr": 1.4918471180312052e-05, "epoch": 1.1050193050193051, "percentage": 55.28, "elapsed_time": "10:24:54", "remaining_time": "8:25:32"}
179
- {"current_steps": 179, "total_steps": 322, "loss": 0.8429, "lr": 1.4755423175031461e-05, "epoch": 1.111196911196911, "percentage": 55.59, "elapsed_time": "10:28:20", "remaining_time": "8:21:58"}
180
- {"current_steps": 180, "total_steps": 322, "loss": 0.8474, "lr": 1.4592404070898337e-05, "epoch": 1.1173745173745173, "percentage": 55.9, "elapsed_time": "10:31:48", "remaining_time": "8:18:25"}
181
- {"current_steps": 181, "total_steps": 322, "loss": 0.8643, "lr": 1.4429433131549661e-05, "epoch": 1.1235521235521235, "percentage": 56.21, "elapsed_time": "10:35:17", "remaining_time": "8:14:53"}
182
- {"current_steps": 182, "total_steps": 322, "loss": 0.847, "lr": 1.4266529614930862e-05, "epoch": 1.1297297297297297, "percentage": 56.52, "elapsed_time": "10:38:46", "remaining_time": "8:11:22"}
183
- {"current_steps": 183, "total_steps": 322, "loss": 0.8416, "lr": 1.4103712771020188e-05, "epoch": 1.135907335907336, "percentage": 56.83, "elapsed_time": "10:42:14", "remaining_time": "8:07:49"}
184
- {"current_steps": 184, "total_steps": 322, "loss": 0.8808, "lr": 1.3941001839553921e-05, "epoch": 1.1420849420849422, "percentage": 57.14, "elapsed_time": "10:45:40", "remaining_time": "8:04:15"}
185
- {"current_steps": 185, "total_steps": 322, "loss": 0.8422, "lr": 1.3778416047752906e-05, "epoch": 1.1482625482625481, "percentage": 57.45, "elapsed_time": "10:49:05", "remaining_time": "8:00:40"}
186
- {"current_steps": 186, "total_steps": 322, "loss": 0.8537, "lr": 1.3615974608050472e-05, "epoch": 1.1544401544401544, "percentage": 57.76, "elapsed_time": "10:52:32", "remaining_time": "7:57:07"}
187
- {"current_steps": 187, "total_steps": 322, "loss": 0.853, "lr": 1.3453696715822165e-05, "epoch": 1.1606177606177606, "percentage": 58.07, "elapsed_time": "10:55:57", "remaining_time": "7:53:33"}
188
- {"current_steps": 188, "total_steps": 322, "loss": 0.8552, "lr": 1.329160154711745e-05, "epoch": 1.1667953667953668, "percentage": 58.39, "elapsed_time": "10:59:28", "remaining_time": "7:50:02"}
189
- {"current_steps": 189, "total_steps": 322, "loss": 0.8346, "lr": 1.3129708256393725e-05, "epoch": 1.172972972972973, "percentage": 58.7, "elapsed_time": "11:02:57", "remaining_time": "7:46:31"}
190
- {"current_steps": 190, "total_steps": 322, "loss": 0.8561, "lr": 1.2968035974252882e-05, "epoch": 1.1791505791505792, "percentage": 59.01, "elapsed_time": "11:06:25", "remaining_time": "7:42:59"}
191
- {"current_steps": 191, "total_steps": 322, "loss": 0.8518, "lr": 1.2806603805180668e-05, "epoch": 1.1853281853281854, "percentage": 59.32, "elapsed_time": "11:09:51", "remaining_time": "7:39:26"}
192
- {"current_steps": 192, "total_steps": 322, "loss": 0.8588, "lr": 1.2645430825289166e-05, "epoch": 1.1915057915057914, "percentage": 59.63, "elapsed_time": "11:13:20", "remaining_time": "7:35:54"}
193
- {"current_steps": 193, "total_steps": 322, "loss": 0.839, "lr": 1.2484536080062583e-05, "epoch": 1.1976833976833976, "percentage": 59.94, "elapsed_time": "11:16:51", "remaining_time": "7:32:24"}
194
- {"current_steps": 194, "total_steps": 322, "loss": 0.8534, "lr": 1.2323938582106725e-05, "epoch": 1.2038610038610038, "percentage": 60.25, "elapsed_time": "11:20:17", "remaining_time": "7:28:50"}
195
- {"current_steps": 195, "total_steps": 322, "loss": 0.8586, "lr": 1.2163657308902256e-05, "epoch": 1.21003861003861, "percentage": 60.56, "elapsed_time": "11:23:41", "remaining_time": "7:25:16"}
196
- {"current_steps": 196, "total_steps": 322, "loss": 0.8394, "lr": 1.2003711200562243e-05, "epoch": 1.2162162162162162, "percentage": 60.87, "elapsed_time": "11:27:06", "remaining_time": "7:21:42"}
197
- {"current_steps": 197, "total_steps": 322, "loss": 0.8434, "lr": 1.1844119157593962e-05, "epoch": 1.2223938223938224, "percentage": 61.18, "elapsed_time": "11:30:31", "remaining_time": "7:18:09"}
198
- {"current_steps": 198, "total_steps": 322, "loss": 0.8568, "lr": 1.1684900038665532e-05, "epoch": 1.2285714285714286, "percentage": 61.49, "elapsed_time": "11:34:00", "remaining_time": "7:14:37"}
199
- {"current_steps": 199, "total_steps": 322, "loss": 0.8499, "lr": 1.1526072658377371e-05, "epoch": 1.2347490347490346, "percentage": 61.8, "elapsed_time": "11:37:29", "remaining_time": "7:11:06"}
200
- {"current_steps": 200, "total_steps": 322, "loss": 0.8376, "lr": 1.1367655785038958e-05, "epoch": 1.2409266409266408, "percentage": 62.11, "elapsed_time": "11:41:00", "remaining_time": "7:07:36"}
201
- {"current_steps": 201, "total_steps": 322, "loss": 0.8401, "lr": 1.120966813845098e-05, "epoch": 1.247104247104247, "percentage": 62.42, "elapsed_time": "11:51:53", "remaining_time": "7:08:33"}
202
- {"current_steps": 202, "total_steps": 322, "loss": 0.8486, "lr": 1.1052128387693282e-05, "epoch": 1.2532818532818533, "percentage": 62.73, "elapsed_time": "11:55:22", "remaining_time": "7:04:58"}
203
- {"current_steps": 203, "total_steps": 322, "loss": 0.8427, "lr": 1.0895055148918758e-05, "epoch": 1.2594594594594595, "percentage": 63.04, "elapsed_time": "11:58:50", "remaining_time": "7:01:23"}
204
- {"current_steps": 204, "total_steps": 322, "loss": 0.84, "lr": 1.0738466983153535e-05, "epoch": 1.2656370656370657, "percentage": 63.35, "elapsed_time": "12:02:16", "remaining_time": "6:57:47"}
205
- {"current_steps": 205, "total_steps": 322, "loss": 0.8361, "lr": 1.0582382394103629e-05, "epoch": 1.271814671814672, "percentage": 63.66, "elapsed_time": "12:05:42", "remaining_time": "6:54:10"}
206
- {"current_steps": 206, "total_steps": 322, "loss": 0.851, "lr": 1.042681982596845e-05, "epoch": 1.2779922779922779, "percentage": 63.98, "elapsed_time": "12:09:07", "remaining_time": "6:50:34"}
207
- {"current_steps": 207, "total_steps": 322, "loss": 0.8335, "lr": 1.0271797661261216e-05, "epoch": 1.284169884169884, "percentage": 64.29, "elapsed_time": "12:12:33", "remaining_time": "6:46:58"}
208
- {"current_steps": 208, "total_steps": 322, "loss": 0.8413, "lr": 1.0117334218636795e-05, "epoch": 1.2903474903474903, "percentage": 64.6, "elapsed_time": "12:15:59", "remaining_time": "6:43:22"}
209
- {"current_steps": 209, "total_steps": 322, "loss": 0.8418, "lr": 9.963447750726985e-06, "epoch": 1.2965250965250965, "percentage": 64.91, "elapsed_time": "12:19:25", "remaining_time": "6:39:47"}
210
- {"current_steps": 210, "total_steps": 322, "loss": 0.8436, "lr": 9.810156441983667e-06, "epoch": 1.3027027027027027, "percentage": 65.22, "elapsed_time": "12:22:50", "remaining_time": "6:36:11"}
211
- {"current_steps": 211, "total_steps": 322, "loss": 0.8382, "lr": 9.657478406529946e-06, "epoch": 1.308880308880309, "percentage": 65.53, "elapsed_time": "12:26:19", "remaining_time": "6:32:37"}
212
- {"current_steps": 212, "total_steps": 322, "loss": 0.8519, "lr": 9.505431686019694e-06, "epoch": 1.3150579150579151, "percentage": 65.84, "elapsed_time": "12:29:47", "remaining_time": "6:29:02"}
213
- {"current_steps": 213, "total_steps": 322, "loss": 0.8502, "lr": 9.354034247505557e-06, "epoch": 1.3212355212355211, "percentage": 66.15, "elapsed_time": "12:33:17", "remaining_time": "6:25:29"}
214
- {"current_steps": 214, "total_steps": 322, "loss": 0.8172, "lr": 9.203303981315849e-06, "epoch": 1.3274131274131273, "percentage": 66.46, "elapsed_time": "12:36:46", "remaining_time": "6:21:55"}
215
- {"current_steps": 215, "total_steps": 322, "loss": 0.8285, "lr": 9.053258698940485e-06, "epoch": 1.3335907335907335, "percentage": 66.77, "elapsed_time": "12:40:13", "remaining_time": "6:18:20"}
216
- {"current_steps": 216, "total_steps": 322, "loss": 0.8411, "lr": 8.903916130926232e-06, "epoch": 1.3397683397683398, "percentage": 67.08, "elapsed_time": "12:43:42", "remaining_time": "6:14:47"}
217
- {"current_steps": 217, "total_steps": 322, "loss": 0.8405, "lr": 8.755293924781524e-06, "epoch": 1.345945945945946, "percentage": 67.39, "elapsed_time": "12:47:14", "remaining_time": "6:11:14"}
218
- {"current_steps": 218, "total_steps": 322, "loss": 0.8398, "lr": 8.607409642891091e-06, "epoch": 1.3521235521235522, "percentage": 67.7, "elapsed_time": "12:50:40", "remaining_time": "6:07:39"}
219
- {"current_steps": 219, "total_steps": 322, "loss": 0.8214, "lr": 8.460280760440664e-06, "epoch": 1.3583011583011584, "percentage": 68.01, "elapsed_time": "12:54:09", "remaining_time": "6:04:06"}
220
- {"current_steps": 220, "total_steps": 322, "loss": 0.8489, "lr": 8.313924663351927e-06, "epoch": 1.3644787644787644, "percentage": 68.32, "elapsed_time": "12:57:34", "remaining_time": "6:00:30"}
221
- {"current_steps": 221, "total_steps": 322, "loss": 0.8297, "lr": 8.168358646228115e-06, "epoch": 1.3706563706563706, "percentage": 68.63, "elapsed_time": "13:01:00", "remaining_time": "5:56:55"}
222
- {"current_steps": 222, "total_steps": 322, "loss": 0.8128, "lr": 8.023599910310287e-06, "epoch": 1.3768339768339768, "percentage": 68.94, "elapsed_time": "13:04:24", "remaining_time": "5:53:20"}
223
- {"current_steps": 223, "total_steps": 322, "loss": 0.832, "lr": 7.879665561444752e-06, "epoch": 1.383011583011583, "percentage": 69.25, "elapsed_time": "13:07:52", "remaining_time": "5:49:46"}
224
- {"current_steps": 224, "total_steps": 322, "loss": 0.8262, "lr": 7.73657260806164e-06, "epoch": 1.3891891891891892, "percentage": 69.57, "elapsed_time": "13:11:20", "remaining_time": "5:46:12"}
225
- {"current_steps": 225, "total_steps": 322, "loss": 0.8375, "lr": 7.594337959165108e-06, "epoch": 1.3953667953667954, "percentage": 69.88, "elapsed_time": "13:14:45", "remaining_time": "5:42:37"}
226
- {"current_steps": 226, "total_steps": 322, "loss": 0.8464, "lr": 7.452978422335191e-06, "epoch": 1.4015444015444016, "percentage": 70.19, "elapsed_time": "13:18:12", "remaining_time": "5:39:03"}
227
- {"current_steps": 227, "total_steps": 322, "loss": 0.8301, "lr": 7.312510701741718e-06, "epoch": 1.4077220077220076, "percentage": 70.5, "elapsed_time": "13:21:36", "remaining_time": "5:35:28"}
228
- {"current_steps": 228, "total_steps": 322, "loss": 0.8282, "lr": 7.172951396170404e-06, "epoch": 1.4138996138996138, "percentage": 70.81, "elapsed_time": "13:25:01", "remaining_time": "5:31:53"}
229
- {"current_steps": 229, "total_steps": 322, "loss": 0.8406, "lr": 7.0343169970614e-06, "epoch": 1.42007722007722, "percentage": 71.12, "elapsed_time": "13:28:28", "remaining_time": "5:28:20"}
230
- {"current_steps": 230, "total_steps": 322, "loss": 0.8262, "lr": 6.896623886560529e-06, "epoch": 1.4262548262548262, "percentage": 71.43, "elapsed_time": "13:31:55", "remaining_time": "5:24:46"}
231
- {"current_steps": 231, "total_steps": 322, "loss": 0.8454, "lr": 6.759888335583458e-06, "epoch": 1.4324324324324325, "percentage": 71.74, "elapsed_time": "13:35:21", "remaining_time": "5:21:11"}
232
- {"current_steps": 232, "total_steps": 322, "loss": 0.8284, "lr": 6.624126501892971e-06, "epoch": 1.4386100386100387, "percentage": 72.05, "elapsed_time": "13:38:45", "remaining_time": "5:17:37"}
233
- {"current_steps": 233, "total_steps": 322, "loss": 0.8314, "lr": 6.489354428189684e-06, "epoch": 1.4447876447876449, "percentage": 72.36, "elapsed_time": "13:42:13", "remaining_time": "5:14:04"}
234
- {"current_steps": 234, "total_steps": 322, "loss": 0.8281, "lr": 6.355588040216249e-06, "epoch": 1.4509652509652509, "percentage": 72.67, "elapsed_time": "13:45:39", "remaining_time": "5:10:30"}
235
- {"current_steps": 235, "total_steps": 322, "loss": 0.8294, "lr": 6.222843144875494e-06, "epoch": 1.457142857142857, "percentage": 72.98, "elapsed_time": "13:49:04", "remaining_time": "5:06:56"}
236
- {"current_steps": 236, "total_steps": 322, "loss": 0.8207, "lr": 6.091135428362536e-06, "epoch": 1.4633204633204633, "percentage": 73.29, "elapsed_time": "13:52:29", "remaining_time": "5:03:22"}
237
- {"current_steps": 237, "total_steps": 322, "loss": 0.8243, "lr": 5.960480454311155e-06, "epoch": 1.4694980694980695, "percentage": 73.6, "elapsed_time": "13:55:57", "remaining_time": "4:59:49"}
238
- {"current_steps": 238, "total_steps": 322, "loss": 0.817, "lr": 5.830893661954708e-06, "epoch": 1.4756756756756757, "percentage": 73.91, "elapsed_time": "13:59:22", "remaining_time": "4:56:15"}
239
- {"current_steps": 239, "total_steps": 322, "loss": 0.8307, "lr": 5.702390364301677e-06, "epoch": 1.481853281853282, "percentage": 74.22, "elapsed_time": "14:02:47", "remaining_time": "4:52:41"}
240
- {"current_steps": 240, "total_steps": 322, "loss": 0.8327, "lr": 5.574985746326181e-06, "epoch": 1.4880308880308881, "percentage": 74.53, "elapsed_time": "14:06:12", "remaining_time": "4:49:07"}
241
- {"current_steps": 241, "total_steps": 322, "loss": 0.828, "lr": 5.448694863173572e-06, "epoch": 1.494208494208494, "percentage": 74.84, "elapsed_time": "14:09:40", "remaining_time": "4:45:34"}
242
- {"current_steps": 242, "total_steps": 322, "loss": 0.8289, "lr": 5.3235326383814324e-06, "epoch": 1.5003861003861005, "percentage": 75.16, "elapsed_time": "14:13:08", "remaining_time": "4:42:01"}
243
- {"current_steps": 243, "total_steps": 322, "loss": 0.8271, "lr": 5.19951386211607e-06, "epoch": 1.5065637065637065, "percentage": 75.47, "elapsed_time": "14:16:33", "remaining_time": "4:38:28"}
244
- {"current_steps": 244, "total_steps": 322, "loss": 0.8246, "lr": 5.076653189424804e-06, "epoch": 1.5127413127413127, "percentage": 75.78, "elapsed_time": "14:19:57", "remaining_time": "4:34:54"}
245
- {"current_steps": 245, "total_steps": 322, "loss": 0.8338, "lr": 4.954965138504187e-06, "epoch": 1.518918918918919, "percentage": 76.09, "elapsed_time": "14:23:25", "remaining_time": "4:31:21"}
246
- {"current_steps": 246, "total_steps": 322, "loss": 0.8344, "lr": 4.834464088984452e-06, "epoch": 1.525096525096525, "percentage": 76.4, "elapsed_time": "14:26:52", "remaining_time": "4:27:49"}
247
- {"current_steps": 247, "total_steps": 322, "loss": 0.8219, "lr": 4.7151642802302695e-06, "epoch": 1.5312741312741314, "percentage": 76.71, "elapsed_time": "14:30:19", "remaining_time": "4:24:16"}
248
- {"current_steps": 248, "total_steps": 322, "loss": 0.8073, "lr": 4.597079809658136e-06, "epoch": 1.5374517374517374, "percentage": 77.02, "elapsed_time": "14:33:44", "remaining_time": "4:20:42"}
249
- {"current_steps": 249, "total_steps": 322, "loss": 0.8256, "lr": 4.480224631070493e-06, "epoch": 1.5436293436293438, "percentage": 77.33, "elapsed_time": "14:37:09", "remaining_time": "4:17:09"}
250
- {"current_steps": 250, "total_steps": 322, "loss": 0.8119, "lr": 4.364612553006847e-06, "epoch": 1.5498069498069498, "percentage": 77.64, "elapsed_time": "14:40:35", "remaining_time": "4:13:36"}
251
- {"current_steps": 251, "total_steps": 322, "loss": 0.8455, "lr": 4.250257237112023e-06, "epoch": 1.555984555984556, "percentage": 77.95, "elapsed_time": "14:44:03", "remaining_time": "4:10:04"}
252
- {"current_steps": 252, "total_steps": 322, "loss": 0.8231, "lr": 4.137172196521823e-06, "epoch": 1.5621621621621622, "percentage": 78.26, "elapsed_time": "14:47:31", "remaining_time": "4:06:31"}
253
- {"current_steps": 253, "total_steps": 322, "loss": 0.8271, "lr": 4.0253707942661845e-06, "epoch": 1.5683397683397682, "percentage": 78.57, "elapsed_time": "14:51:01", "remaining_time": "4:03:00"}
254
- {"current_steps": 254, "total_steps": 322, "loss": 0.8276, "lr": 3.914866241690115e-06, "epoch": 1.5745173745173746, "percentage": 78.88, "elapsed_time": "14:54:28", "remaining_time": "3:59:28"}
255
- {"current_steps": 255, "total_steps": 322, "loss": 0.8394, "lr": 3.8056715968925094e-06, "epoch": 1.5806949806949806, "percentage": 79.19, "elapsed_time": "14:57:55", "remaining_time": "3:55:55"}
256
- {"current_steps": 256, "total_steps": 322, "loss": 0.8383, "lr": 3.697799763183127e-06, "epoch": 1.586872586872587, "percentage": 79.5, "elapsed_time": "15:01:22", "remaining_time": "3:52:23"}
257
- {"current_steps": 257, "total_steps": 322, "loss": 0.8372, "lr": 3.5912634875578267e-06, "epoch": 1.593050193050193, "percentage": 79.81, "elapsed_time": "15:04:52", "remaining_time": "3:48:51"}
258
- {"current_steps": 258, "total_steps": 322, "loss": 0.8194, "lr": 3.4860753591922604e-06, "epoch": 1.5992277992277992, "percentage": 80.12, "elapsed_time": "15:08:17", "remaining_time": "3:45:18"}
259
- {"current_steps": 259, "total_steps": 322, "loss": 0.8526, "lr": 3.3822478079542774e-06, "epoch": 1.6054054054054054, "percentage": 80.43, "elapsed_time": "15:11:42", "remaining_time": "3:41:46"}
260
- {"current_steps": 260, "total_steps": 322, "loss": 0.8137, "lr": 3.2797931029350614e-06, "epoch": 1.6115830115830114, "percentage": 80.75, "elapsed_time": "15:15:09", "remaining_time": "3:38:13"}
261
- {"current_steps": 261, "total_steps": 322, "loss": 0.8174, "lr": 3.178723350999362e-06, "epoch": 1.6177606177606179, "percentage": 81.06, "elapsed_time": "15:18:40", "remaining_time": "3:34:42"}
262
- {"current_steps": 262, "total_steps": 322, "loss": 0.8307, "lr": 3.0790504953548115e-06, "epoch": 1.6239382239382238, "percentage": 81.37, "elapsed_time": "15:22:07", "remaining_time": "3:31:10"}
263
- {"current_steps": 263, "total_steps": 322, "loss": 0.8281, "lr": 2.980786314140658e-06, "epoch": 1.6301158301158303, "percentage": 81.68, "elapsed_time": "15:25:32", "remaining_time": "3:27:37"}
264
- {"current_steps": 264, "total_steps": 322, "loss": 0.8431, "lr": 2.8839424190359386e-06, "epoch": 1.6362934362934363, "percentage": 81.99, "elapsed_time": "15:28:59", "remaining_time": "3:24:05"}
265
- {"current_steps": 265, "total_steps": 322, "loss": 0.8268, "lr": 2.788530253887371e-06, "epoch": 1.6424710424710425, "percentage": 82.3, "elapsed_time": "15:32:24", "remaining_time": "3:20:33"}
266
- {"current_steps": 266, "total_steps": 322, "loss": 0.8086, "lr": 2.6945610933570297e-06, "epoch": 1.6486486486486487, "percentage": 82.61, "elapsed_time": "15:35:55", "remaining_time": "3:17:02"}
267
- {"current_steps": 267, "total_steps": 322, "loss": 0.8345, "lr": 2.6020460415900786e-06, "epoch": 1.6548262548262547, "percentage": 82.92, "elapsed_time": "15:39:19", "remaining_time": "3:13:29"}
268
- {"current_steps": 268, "total_steps": 322, "loss": 0.829, "lr": 2.510996030902581e-06, "epoch": 1.661003861003861, "percentage": 83.23, "elapsed_time": "15:42:47", "remaining_time": "3:09:57"}
269
- {"current_steps": 269, "total_steps": 322, "loss": 0.8322, "lr": 2.4214218204896776e-06, "epoch": 1.667181467181467, "percentage": 83.54, "elapsed_time": "15:46:14", "remaining_time": "3:06:26"}
270
- {"current_steps": 270, "total_steps": 322, "loss": 0.8307, "lr": 2.333333995154178e-06, "epoch": 1.6733590733590735, "percentage": 83.85, "elapsed_time": "15:49:39", "remaining_time": "3:02:53"}
271
- {"current_steps": 271, "total_steps": 322, "loss": 0.8241, "lr": 2.2467429640557903e-06, "epoch": 1.6795366795366795, "percentage": 84.16, "elapsed_time": "15:53:04", "remaining_time": "2:59:21"}
272
- {"current_steps": 272, "total_steps": 322, "loss": 0.8308, "lr": 2.161658959481065e-06, "epoch": 1.6857142857142857, "percentage": 84.47, "elapsed_time": "15:56:31", "remaining_time": "2:55:49"}
273
- {"current_steps": 273, "total_steps": 322, "loss": 0.8202, "lr": 2.0780920356343015e-06, "epoch": 1.691891891891892, "percentage": 84.78, "elapsed_time": "15:59:56", "remaining_time": "2:52:17"}
274
- {"current_steps": 274, "total_steps": 322, "loss": 0.8226, "lr": 1.9960520674494354e-06, "epoch": 1.698069498069498, "percentage": 85.09, "elapsed_time": "16:03:24", "remaining_time": "2:48:46"}
275
- {"current_steps": 275, "total_steps": 322, "loss": 0.8259, "lr": 1.915548749423157e-06, "epoch": 1.7042471042471043, "percentage": 85.4, "elapsed_time": "16:06:49", "remaining_time": "2:45:14"}
276
- {"current_steps": 276, "total_steps": 322, "loss": 0.842, "lr": 1.8365915944693102e-06, "epoch": 1.7104247104247103, "percentage": 85.71, "elapsed_time": "16:10:16", "remaining_time": "2:41:42"}
277
- {"current_steps": 277, "total_steps": 322, "loss": 0.8068, "lr": 1.759189932794798e-06, "epoch": 1.7166023166023165, "percentage": 86.02, "elapsed_time": "16:13:42", "remaining_time": "2:38:11"}
278
- {"current_steps": 278, "total_steps": 322, "loss": 0.8414, "lr": 1.6833529107970236e-06, "epoch": 1.7227799227799228, "percentage": 86.34, "elapsed_time": "16:17:08", "remaining_time": "2:34:39"}
279
- {"current_steps": 279, "total_steps": 322, "loss": 0.8305, "lr": 1.6090894899831017e-06, "epoch": 1.728957528957529, "percentage": 86.65, "elapsed_time": "16:20:39", "remaining_time": "2:31:08"}
280
- {"current_steps": 280, "total_steps": 322, "loss": 0.8345, "lr": 1.5364084459108874e-06, "epoch": 1.7351351351351352, "percentage": 86.96, "elapsed_time": "16:24:06", "remaining_time": "2:27:36"}
281
- {"current_steps": 281, "total_steps": 322, "loss": 0.813, "lr": 1.4653183671519749e-06, "epoch": 1.7413127413127412, "percentage": 87.27, "elapsed_time": "16:27:34", "remaining_time": "2:24:05"}
282
- {"current_steps": 282, "total_steps": 322, "loss": 0.8154, "lr": 1.395827654276825e-06, "epoch": 1.7474903474903476, "percentage": 87.58, "elapsed_time": "16:31:01", "remaining_time": "2:20:34"}
283
- {"current_steps": 283, "total_steps": 322, "loss": 0.8256, "lr": 1.3279445188620614e-06, "epoch": 1.7536679536679536, "percentage": 87.89, "elapsed_time": "16:34:27", "remaining_time": "2:17:02"}
284
- {"current_steps": 284, "total_steps": 322, "loss": 0.8265, "lr": 1.26167698252015e-06, "epoch": 1.7598455598455598, "percentage": 88.2, "elapsed_time": "16:37:56", "remaining_time": "2:13:31"}
285
- {"current_steps": 285, "total_steps": 322, "loss": 0.834, "lr": 1.1970328759514893e-06, "epoch": 1.766023166023166, "percentage": 88.51, "elapsed_time": "16:41:25", "remaining_time": "2:10:00"}
286
- {"current_steps": 286, "total_steps": 322, "loss": 0.8226, "lr": 1.1340198380190725e-06, "epoch": 1.7722007722007722, "percentage": 88.82, "elapsed_time": "16:44:55", "remaining_time": "2:06:29"}
287
- {"current_steps": 287, "total_steps": 322, "loss": 0.8255, "lr": 1.0726453148458115e-06, "epoch": 1.7783783783783784, "percentage": 89.13, "elapsed_time": "16:48:21", "remaining_time": "2:02:58"}
288
- {"current_steps": 288, "total_steps": 322, "loss": 0.8183, "lr": 1.0129165589346644e-06, "epoch": 1.7845559845559844, "percentage": 89.44, "elapsed_time": "16:51:48", "remaining_time": "1:59:26"}
289
- {"current_steps": 289, "total_steps": 322, "loss": 0.8041, "lr": 9.548406283115969e-07, "epoch": 1.7907335907335908, "percentage": 89.75, "elapsed_time": "16:55:13", "remaining_time": "1:55:55"}
290
- {"current_steps": 290, "total_steps": 322, "loss": 0.8229, "lr": 8.984243856915763e-07, "epoch": 1.7969111969111968, "percentage": 90.06, "elapsed_time": "16:58:42", "remaining_time": "1:52:24"}
291
- {"current_steps": 291, "total_steps": 322, "loss": 0.8121, "lr": 8.436744976675875e-07, "epoch": 1.803088803088803, "percentage": 90.37, "elapsed_time": "17:02:10", "remaining_time": "1:48:53"}
292
- {"current_steps": 292, "total_steps": 322, "loss": 0.794, "lr": 7.905974339228861e-07, "epoch": 1.8092664092664092, "percentage": 90.68, "elapsed_time": "17:05:38", "remaining_time": "1:45:22"}
293
- {"current_steps": 293, "total_steps": 322, "loss": 0.8121, "lr": 7.391994664664625e-07, "epoch": 1.8154440154440155, "percentage": 90.99, "elapsed_time": "17:09:09", "remaining_time": "1:41:51"}
294
- {"current_steps": 294, "total_steps": 322, "loss": 0.8169, "lr": 6.894866688919133e-07, "epoch": 1.8216216216216217, "percentage": 91.3, "elapsed_time": "17:12:36", "remaining_time": "1:38:20"}
295
- {"current_steps": 295, "total_steps": 322, "loss": 0.8202, "lr": 6.41464915659723e-07, "epoch": 1.8277992277992277, "percentage": 91.61, "elapsed_time": "17:15:59", "remaining_time": "1:34:49"}
296
- {"current_steps": 296, "total_steps": 322, "loss": 0.809, "lr": 5.951398814030951e-07, "epoch": 1.833976833976834, "percentage": 91.93, "elapsed_time": "17:19:24", "remaining_time": "1:31:17"}
297
- {"current_steps": 297, "total_steps": 322, "loss": 0.829, "lr": 5.505170402573911e-07, "epoch": 1.84015444015444, "percentage": 92.24, "elapsed_time": "17:22:52", "remaining_time": "1:27:47"}
298
- {"current_steps": 298, "total_steps": 322, "loss": 0.8155, "lr": 5.076016652132703e-07, "epoch": 1.8463320463320463, "percentage": 92.55, "elapsed_time": "17:26:21", "remaining_time": "1:24:16"}
299
- {"current_steps": 299, "total_steps": 322, "loss": 0.8328, "lr": 4.6639882749357264e-07, "epoch": 1.8525096525096525, "percentage": 92.86, "elapsed_time": "17:29:49", "remaining_time": "1:20:45"}
300
- {"current_steps": 300, "total_steps": 322, "loss": 0.8211, "lr": 4.2691339595408995e-07, "epoch": 1.8586872586872587, "percentage": 93.17, "elapsed_time": "17:33:17", "remaining_time": "1:17:14"}
301
- {"current_steps": 301, "total_steps": 322, "loss": 0.8136, "lr": 3.891500365081996e-07, "epoch": 1.864864864864865, "percentage": 93.48, "elapsed_time": "17:44:10", "remaining_time": "1:14:14"}
302
- {"current_steps": 302, "total_steps": 322, "loss": 0.8128, "lr": 3.53113211575512e-07, "epoch": 1.871042471042471, "percentage": 93.79, "elapsed_time": "17:47:40", "remaining_time": "1:10:42"}
303
- {"current_steps": 303, "total_steps": 322, "loss": 0.8199, "lr": 3.188071795545561e-07, "epoch": 1.8772200772200773, "percentage": 94.1, "elapsed_time": "17:51:09", "remaining_time": "1:07:10"}
304
- {"current_steps": 304, "total_steps": 322, "loss": 0.8232, "lr": 2.8623599431957137e-07, "epoch": 1.8833976833976833, "percentage": 94.41, "elapsed_time": "17:54:36", "remaining_time": "1:03:37"}
305
- {"current_steps": 305, "total_steps": 322, "loss": 0.8266, "lr": 2.5540350474147324e-07, "epoch": 1.8895752895752895, "percentage": 94.72, "elapsed_time": "17:58:05", "remaining_time": "1:00:05"}
306
- {"current_steps": 306, "total_steps": 322, "loss": 0.8275, "lr": 2.2631335423303312e-07, "epoch": 1.8957528957528957, "percentage": 95.03, "elapsed_time": "18:01:36", "remaining_time": "0:56:33"}
307
- {"current_steps": 307, "total_steps": 322, "loss": 0.8141, "lr": 1.989689803183531e-07, "epoch": 1.901930501930502, "percentage": 95.34, "elapsed_time": "18:05:05", "remaining_time": "0:53:01"}
308
- {"current_steps": 308, "total_steps": 322, "loss": 0.839, "lr": 1.7337361422664567e-07, "epoch": 1.9081081081081082, "percentage": 95.65, "elapsed_time": "18:08:33", "remaining_time": "0:49:28"}
309
- {"current_steps": 309, "total_steps": 322, "loss": 0.8289, "lr": 1.4953028051042428e-07, "epoch": 1.9142857142857141, "percentage": 95.96, "elapsed_time": "18:12:00", "remaining_time": "0:45:56"}
310
- {"current_steps": 310, "total_steps": 322, "loss": 0.8209, "lr": 1.2744179668808588e-07, "epoch": 1.9204633204633206, "percentage": 96.27, "elapsed_time": "18:15:38", "remaining_time": "0:42:24"}
311
- {"current_steps": 311, "total_steps": 322, "loss": 0.8281, "lr": 1.0711077291097548e-07, "epoch": 1.9266409266409266, "percentage": 96.58, "elapsed_time": "18:19:04", "remaining_time": "0:38:52"}
312
- {"current_steps": 312, "total_steps": 322, "loss": 0.8144, "lr": 8.853961165494472e-08, "epoch": 1.9328185328185328, "percentage": 96.89, "elapsed_time": "18:22:35", "remaining_time": "0:35:20"}
313
- {"current_steps": 313, "total_steps": 322, "loss": 0.8205, "lr": 7.173050743646382e-08, "epoch": 1.938996138996139, "percentage": 97.2, "elapsed_time": "18:26:00", "remaining_time": "0:31:48"}
314
- {"current_steps": 314, "total_steps": 322, "loss": 0.8063, "lr": 5.668544655329067e-08, "epoch": 1.9451737451737452, "percentage": 97.52, "elapsed_time": "18:29:24", "remaining_time": "0:28:15"}
315
- {"current_steps": 315, "total_steps": 322, "loss": 0.8186, "lr": 4.3406206849763707e-08, "epoch": 1.9513513513513514, "percentage": 97.83, "elapsed_time": "18:32:50", "remaining_time": "0:24:43"}
316
- {"current_steps": 316, "total_steps": 322, "loss": 0.8371, "lr": 3.189435750671321e-08, "epoch": 1.9575289575289574, "percentage": 98.14, "elapsed_time": "18:36:16", "remaining_time": "0:21:11"}
317
- {"current_steps": 317, "total_steps": 322, "loss": 0.8223, "lr": 2.2151258856032974e-08, "epoch": 1.9637065637065638, "percentage": 98.45, "elapsed_time": "18:39:44", "remaining_time": "0:17:39"}
318
- {"current_steps": 318, "total_steps": 322, "loss": 0.8275, "lr": 1.417806221993223e-08, "epoch": 1.9698841698841698, "percentage": 98.76, "elapsed_time": "18:43:12", "remaining_time": "0:14:07"}
319
- {"current_steps": 319, "total_steps": 322, "loss": 0.8302, "lr": 7.975709774892815e-09, "epoch": 1.976061776061776, "percentage": 99.07, "elapsed_time": "18:46:43", "remaining_time": "0:10:35"}
320
- {"current_steps": 320, "total_steps": 322, "loss": 0.8215, "lr": 3.544934440323222e-09, "epoch": 1.9822393822393822, "percentage": 99.38, "elapsed_time": "18:50:10", "remaining_time": "0:07:03"}
321
- {"current_steps": 321, "total_steps": 322, "loss": 0.827, "lr": 8.862597919612192e-10, "epoch": 1.9884169884169884, "percentage": 99.69, "elapsed_time": "18:53:40", "remaining_time": "0:03:31"}
322
- {"current_steps": 322, "total_steps": 322, "loss": 0.8302, "lr": 0.0, "epoch": 1.9945945945945946, "percentage": 100.0, "elapsed_time": "18:57:08", "remaining_time": "0:00:00"}
323
- {"current_steps": 322, "total_steps": 322, "epoch": 1.9945945945945946, "percentage": 100.0, "elapsed_time": "19:04:26", "remaining_time": "0:00:00"}
 
1
+ {"current_steps": 1, "total_steps": 160, "loss": 1.097, "lr": 1.25e-06, "epoch": 0.01237432327919567, "percentage": 0.62, "elapsed_time": "0:07:00", "remaining_time": "18:33:53"}
2
+ {"current_steps": 2, "total_steps": 160, "loss": 1.0897, "lr": 2.5e-06, "epoch": 0.02474864655839134, "percentage": 1.25, "elapsed_time": "0:13:44", "remaining_time": "18:05:33"}
3
+ {"current_steps": 3, "total_steps": 160, "loss": 1.1065, "lr": 3.7500000000000005e-06, "epoch": 0.037122969837587005, "percentage": 1.88, "elapsed_time": "0:20:16", "remaining_time": "17:41:13"}
4
+ {"current_steps": 4, "total_steps": 160, "loss": 1.1059, "lr": 5e-06, "epoch": 0.04949729311678268, "percentage": 2.5, "elapsed_time": "0:26:50", "remaining_time": "17:26:38"}
5
+ {"current_steps": 5, "total_steps": 160, "loss": 1.1144, "lr": 6.25e-06, "epoch": 0.061871616395978345, "percentage": 3.12, "elapsed_time": "0:33:22", "remaining_time": "17:14:48"}
6
+ {"current_steps": 6, "total_steps": 160, "loss": 1.1001, "lr": 7.500000000000001e-06, "epoch": 0.07424593967517401, "percentage": 3.75, "elapsed_time": "0:39:57", "remaining_time": "17:05:24"}
7
+ {"current_steps": 7, "total_steps": 160, "loss": 1.0976, "lr": 8.750000000000001e-06, "epoch": 0.08662026295436968, "percentage": 4.38, "elapsed_time": "0:46:28", "remaining_time": "16:55:53"}
8
+ {"current_steps": 8, "total_steps": 160, "loss": 1.1055, "lr": 1e-05, "epoch": 0.09899458623356536, "percentage": 5.0, "elapsed_time": "0:53:02", "remaining_time": "16:47:41"}
9
+ {"current_steps": 9, "total_steps": 160, "loss": 1.1013, "lr": 1.125e-05, "epoch": 0.11136890951276102, "percentage": 5.62, "elapsed_time": "0:59:38", "remaining_time": "16:40:40"}
10
+ {"current_steps": 10, "total_steps": 160, "loss": 1.0971, "lr": 1.25e-05, "epoch": 0.12374323279195669, "percentage": 6.25, "elapsed_time": "1:06:12", "remaining_time": "16:33:08"}
11
+ {"current_steps": 11, "total_steps": 160, "loss": 1.0972, "lr": 1.375e-05, "epoch": 0.13611755607115236, "percentage": 6.88, "elapsed_time": "1:12:49", "remaining_time": "16:26:22"}
12
+ {"current_steps": 12, "total_steps": 160, "loss": 1.0934, "lr": 1.5000000000000002e-05, "epoch": 0.14849187935034802, "percentage": 7.5, "elapsed_time": "1:19:22", "remaining_time": "16:18:53"}
13
+ {"current_steps": 13, "total_steps": 160, "loss": 1.1053, "lr": 1.6250000000000002e-05, "epoch": 0.1608662026295437, "percentage": 8.12, "elapsed_time": "1:25:54", "remaining_time": "16:11:29"}
14
+ {"current_steps": 14, "total_steps": 160, "loss": 1.1018, "lr": 1.7500000000000002e-05, "epoch": 0.17324052590873937, "percentage": 8.75, "elapsed_time": "1:32:30", "remaining_time": "16:04:40"}
15
+ {"current_steps": 15, "total_steps": 160, "loss": 1.0898, "lr": 1.8750000000000002e-05, "epoch": 0.18561484918793503, "percentage": 9.38, "elapsed_time": "1:39:03", "remaining_time": "15:57:30"}
16
+ {"current_steps": 16, "total_steps": 160, "loss": 1.0954, "lr": 2e-05, "epoch": 0.19798917246713071, "percentage": 10.0, "elapsed_time": "1:45:34", "remaining_time": "15:50:11"}
17
+ {"current_steps": 17, "total_steps": 160, "loss": 1.0887, "lr": 1.999762027079909e-05, "epoch": 0.21036349574632637, "percentage": 10.62, "elapsed_time": "1:52:08", "remaining_time": "15:43:14"}
18
+ {"current_steps": 18, "total_steps": 160, "loss": 1.0951, "lr": 1.999048221581858e-05, "epoch": 0.22273781902552203, "percentage": 11.25, "elapsed_time": "1:58:38", "remaining_time": "15:35:55"}
19
+ {"current_steps": 19, "total_steps": 160, "loss": 1.0872, "lr": 1.9978589232386036e-05, "epoch": 0.23511214230471772, "percentage": 11.88, "elapsed_time": "2:05:08", "remaining_time": "15:28:41"}
20
+ {"current_steps": 20, "total_steps": 160, "loss": 1.0849, "lr": 1.9961946980917457e-05, "epoch": 0.24748646558391338, "percentage": 12.5, "elapsed_time": "2:11:43", "remaining_time": "15:22:04"}
21
+ {"current_steps": 21, "total_steps": 160, "loss": 1.091, "lr": 1.9940563382223196e-05, "epoch": 0.25986078886310904, "percentage": 13.12, "elapsed_time": "2:18:16", "remaining_time": "15:15:17"}
22
+ {"current_steps": 22, "total_steps": 160, "loss": 1.0975, "lr": 1.9914448613738107e-05, "epoch": 0.2722351121423047, "percentage": 13.75, "elapsed_time": "2:24:46", "remaining_time": "15:08:08"}
23
+ {"current_steps": 23, "total_steps": 160, "loss": 1.0882, "lr": 1.988361510467761e-05, "epoch": 0.2846094354215004, "percentage": 14.37, "elapsed_time": "2:31:19", "remaining_time": "15:01:24"}
24
+ {"current_steps": 24, "total_steps": 160, "loss": 1.0874, "lr": 1.9848077530122083e-05, "epoch": 0.29698375870069604, "percentage": 15.0, "elapsed_time": "2:37:55", "remaining_time": "14:54:54"}
25
+ {"current_steps": 25, "total_steps": 160, "loss": 1.0813, "lr": 1.9807852804032306e-05, "epoch": 0.30935808197989173, "percentage": 15.62, "elapsed_time": "2:44:31", "remaining_time": "14:48:26"}
26
+ {"current_steps": 26, "total_steps": 160, "loss": 1.0889, "lr": 1.9762960071199334e-05, "epoch": 0.3217324052590874, "percentage": 16.25, "elapsed_time": "2:51:05", "remaining_time": "14:41:48"}
27
+ {"current_steps": 27, "total_steps": 160, "loss": 1.0728, "lr": 1.9713420698132614e-05, "epoch": 0.33410672853828305, "percentage": 16.88, "elapsed_time": "2:57:37", "remaining_time": "14:34:56"}
28
+ {"current_steps": 28, "total_steps": 160, "loss": 1.0798, "lr": 1.9659258262890683e-05, "epoch": 0.34648105181747874, "percentage": 17.5, "elapsed_time": "3:04:09", "remaining_time": "14:28:11"}
29
+ {"current_steps": 29, "total_steps": 160, "loss": 1.0805, "lr": 1.960049854385929e-05, "epoch": 0.3588553750966744, "percentage": 18.12, "elapsed_time": "3:10:45", "remaining_time": "14:21:40"}
30
+ {"current_steps": 30, "total_steps": 160, "loss": 1.0761, "lr": 1.953716950748227e-05, "epoch": 0.37122969837587005, "percentage": 18.75, "elapsed_time": "3:17:21", "remaining_time": "14:15:12"}
31
+ {"current_steps": 31, "total_steps": 160, "loss": 1.0889, "lr": 1.946930129495106e-05, "epoch": 0.38360402165506574, "percentage": 19.38, "elapsed_time": "3:23:56", "remaining_time": "14:08:38"}
32
+ {"current_steps": 32, "total_steps": 160, "loss": 1.0831, "lr": 1.9396926207859085e-05, "epoch": 0.39597834493426143, "percentage": 20.0, "elapsed_time": "3:30:31", "remaining_time": "14:02:05"}
33
+ {"current_steps": 33, "total_steps": 160, "loss": 1.0624, "lr": 1.932007869282799e-05, "epoch": 0.40835266821345706, "percentage": 20.62, "elapsed_time": "3:37:06", "remaining_time": "13:55:33"}
34
+ {"current_steps": 34, "total_steps": 160, "loss": 1.0742, "lr": 1.9238795325112867e-05, "epoch": 0.42072699149265275, "percentage": 21.25, "elapsed_time": "3:43:37", "remaining_time": "13:48:43"}
35
+ {"current_steps": 35, "total_steps": 160, "loss": 1.0683, "lr": 1.9153114791194475e-05, "epoch": 0.43310131477184843, "percentage": 21.88, "elapsed_time": "3:50:11", "remaining_time": "13:42:08"}
36
+ {"current_steps": 36, "total_steps": 160, "loss": 1.0793, "lr": 1.9063077870366504e-05, "epoch": 0.44547563805104406, "percentage": 22.5, "elapsed_time": "3:56:45", "remaining_time": "13:35:28"}
37
+ {"current_steps": 37, "total_steps": 160, "loss": 1.0764, "lr": 1.8968727415326885e-05, "epoch": 0.45784996133023975, "percentage": 23.12, "elapsed_time": "4:03:14", "remaining_time": "13:28:36"}
38
+ {"current_steps": 38, "total_steps": 160, "loss": 1.0586, "lr": 1.887010833178222e-05, "epoch": 0.47022428460943544, "percentage": 23.75, "elapsed_time": "4:09:45", "remaining_time": "13:21:51"}
39
+ {"current_steps": 39, "total_steps": 160, "loss": 1.0676, "lr": 1.876726755707508e-05, "epoch": 0.48259860788863107, "percentage": 24.38, "elapsed_time": "4:16:16", "remaining_time": "13:15:06"}
40
+ {"current_steps": 40, "total_steps": 160, "loss": 1.0653, "lr": 1.866025403784439e-05, "epoch": 0.49497293116782676, "percentage": 25.0, "elapsed_time": "4:22:52", "remaining_time": "13:08:37"}
41
+ {"current_steps": 41, "total_steps": 160, "loss": 1.0617, "lr": 1.854911870672947e-05, "epoch": 0.5073472544470224, "percentage": 25.62, "elapsed_time": "4:29:23", "remaining_time": "13:01:53"}
42
+ {"current_steps": 42, "total_steps": 160, "loss": 1.0661, "lr": 1.843391445812886e-05, "epoch": 0.5197215777262181, "percentage": 26.25, "elapsed_time": "4:35:54", "remaining_time": "12:55:11"}
43
+ {"current_steps": 43, "total_steps": 160, "loss": 1.0652, "lr": 1.8314696123025456e-05, "epoch": 0.5320959010054138, "percentage": 26.88, "elapsed_time": "4:42:26", "remaining_time": "12:48:31"}
44
+ {"current_steps": 44, "total_steps": 160, "loss": 1.0713, "lr": 1.819152044288992e-05, "epoch": 0.5444702242846094, "percentage": 27.5, "elapsed_time": "4:48:58", "remaining_time": "12:41:50"}
45
+ {"current_steps": 45, "total_steps": 160, "loss": 1.0591, "lr": 1.806444604267483e-05, "epoch": 0.5568445475638051, "percentage": 28.12, "elapsed_time": "4:55:28", "remaining_time": "12:35:06"}
46
+ {"current_steps": 46, "total_steps": 160, "loss": 1.0472, "lr": 1.7933533402912354e-05, "epoch": 0.5692188708430008, "percentage": 28.75, "elapsed_time": "5:02:03", "remaining_time": "12:28:34"}
47
+ {"current_steps": 47, "total_steps": 160, "loss": 1.0621, "lr": 1.7798844830928818e-05, "epoch": 0.5815931941221965, "percentage": 29.38, "elapsed_time": "5:08:37", "remaining_time": "12:21:59"}
48
+ {"current_steps": 48, "total_steps": 160, "loss": 1.0467, "lr": 1.766044443118978e-05, "epoch": 0.5939675174013921, "percentage": 30.0, "elapsed_time": "5:15:10", "remaining_time": "12:15:24"}
49
+ {"current_steps": 49, "total_steps": 160, "loss": 1.0654, "lr": 1.7518398074789776e-05, "epoch": 0.6063418406805878, "percentage": 30.63, "elapsed_time": "5:21:46", "remaining_time": "12:08:55"}
50
+ {"current_steps": 50, "total_steps": 160, "loss": 1.0477, "lr": 1.737277336810124e-05, "epoch": 0.6187161639597835, "percentage": 31.25, "elapsed_time": "5:28:16", "remaining_time": "12:02:11"}
51
+ {"current_steps": 51, "total_steps": 160, "loss": 1.0619, "lr": 1.7223639620597556e-05, "epoch": 0.6310904872389791, "percentage": 31.87, "elapsed_time": "5:34:50", "remaining_time": "11:55:39"}
52
+ {"current_steps": 52, "total_steps": 160, "loss": 1.0471, "lr": 1.7071067811865477e-05, "epoch": 0.6434648105181748, "percentage": 32.5, "elapsed_time": "5:41:21", "remaining_time": "11:48:58"}
53
+ {"current_steps": 53, "total_steps": 160, "loss": 1.0534, "lr": 1.6915130557822698e-05, "epoch": 0.6558391337973705, "percentage": 33.12, "elapsed_time": "5:47:54", "remaining_time": "11:42:23"}
54
+ {"current_steps": 54, "total_steps": 160, "loss": 1.0618, "lr": 1.6755902076156606e-05, "epoch": 0.6682134570765661, "percentage": 33.75, "elapsed_time": "5:54:26", "remaining_time": "11:35:46"}
55
+ {"current_steps": 55, "total_steps": 160, "loss": 1.0612, "lr": 1.659345815100069e-05, "epoch": 0.6805877803557618, "percentage": 34.38, "elapsed_time": "6:01:00", "remaining_time": "11:29:12"}
56
+ {"current_steps": 56, "total_steps": 160, "loss": 1.0495, "lr": 1.6427876096865394e-05, "epoch": 0.6929621036349575, "percentage": 35.0, "elapsed_time": "6:07:34", "remaining_time": "11:22:38"}
57
+ {"current_steps": 57, "total_steps": 160, "loss": 1.0646, "lr": 1.6259234721840595e-05, "epoch": 0.7053364269141531, "percentage": 35.62, "elapsed_time": "6:14:10", "remaining_time": "11:16:09"}
58
+ {"current_steps": 58, "total_steps": 160, "loss": 1.0578, "lr": 1.608761429008721e-05, "epoch": 0.7177107501933488, "percentage": 36.25, "elapsed_time": "6:20:43", "remaining_time": "11:09:33"}
59
+ {"current_steps": 59, "total_steps": 160, "loss": 1.045, "lr": 1.5913096483635827e-05, "epoch": 0.7300850734725445, "percentage": 36.88, "elapsed_time": "6:27:14", "remaining_time": "11:02:55"}
60
+ {"current_steps": 60, "total_steps": 160, "loss": 1.051, "lr": 1.573576436351046e-05, "epoch": 0.7424593967517401, "percentage": 37.5, "elapsed_time": "6:33:46", "remaining_time": "10:56:17"}
61
+ {"current_steps": 61, "total_steps": 160, "loss": 1.0533, "lr": 1.5555702330196024e-05, "epoch": 0.7548337200309359, "percentage": 38.12, "elapsed_time": "6:40:20", "remaining_time": "10:49:44"}
62
+ {"current_steps": 62, "total_steps": 160, "loss": 1.0595, "lr": 1.5372996083468242e-05, "epoch": 0.7672080433101315, "percentage": 38.75, "elapsed_time": "6:46:50", "remaining_time": "10:43:04"}
63
+ {"current_steps": 63, "total_steps": 160, "loss": 1.0503, "lr": 1.5187732581605217e-05, "epoch": 0.7795823665893271, "percentage": 39.38, "elapsed_time": "6:53:24", "remaining_time": "10:36:31"}
64
+ {"current_steps": 64, "total_steps": 160, "loss": 1.0328, "lr": 1.5000000000000002e-05, "epoch": 0.7919566898685229, "percentage": 40.0, "elapsed_time": "6:59:59", "remaining_time": "10:29:59"}
65
+ {"current_steps": 65, "total_steps": 160, "loss": 1.0479, "lr": 1.4809887689193878e-05, "epoch": 0.8043310131477185, "percentage": 40.62, "elapsed_time": "7:06:33", "remaining_time": "10:23:25"}
66
+ {"current_steps": 66, "total_steps": 160, "loss": 1.0514, "lr": 1.4617486132350343e-05, "epoch": 0.8167053364269141, "percentage": 41.25, "elapsed_time": "7:13:07", "remaining_time": "10:16:52"}
67
+ {"current_steps": 67, "total_steps": 160, "loss": 1.0387, "lr": 1.4422886902190014e-05, "epoch": 0.8290796597061099, "percentage": 41.88, "elapsed_time": "7:19:39", "remaining_time": "10:10:16"}
68
+ {"current_steps": 68, "total_steps": 160, "loss": 1.0399, "lr": 1.4226182617406996e-05, "epoch": 0.8414539829853055, "percentage": 42.5, "elapsed_time": "7:26:12", "remaining_time": "10:03:42"}
69
+ {"current_steps": 69, "total_steps": 160, "loss": 1.0403, "lr": 1.4027466898587375e-05, "epoch": 0.8538283062645011, "percentage": 43.12, "elapsed_time": "7:32:45", "remaining_time": "9:57:06"}
70
+ {"current_steps": 70, "total_steps": 160, "loss": 1.0378, "lr": 1.3826834323650899e-05, "epoch": 0.8662026295436969, "percentage": 43.75, "elapsed_time": "7:39:15", "remaining_time": "9:50:28"}
71
+ {"current_steps": 71, "total_steps": 160, "loss": 1.045, "lr": 1.3624380382837017e-05, "epoch": 0.8785769528228925, "percentage": 44.38, "elapsed_time": "7:45:44", "remaining_time": "9:43:49"}
72
+ {"current_steps": 72, "total_steps": 160, "loss": 1.0344, "lr": 1.342020143325669e-05, "epoch": 0.8909512761020881, "percentage": 45.0, "elapsed_time": "7:52:12", "remaining_time": "9:37:08"}
73
+ {"current_steps": 73, "total_steps": 160, "loss": 1.0428, "lr": 1.3214394653031616e-05, "epoch": 0.9033255993812839, "percentage": 45.62, "elapsed_time": "7:58:43", "remaining_time": "9:30:32"}
74
+ {"current_steps": 74, "total_steps": 160, "loss": 1.043, "lr": 1.300705799504273e-05, "epoch": 0.9156999226604795, "percentage": 46.25, "elapsed_time": "8:05:12", "remaining_time": "9:23:53"}
75
+ {"current_steps": 75, "total_steps": 160, "loss": 1.0453, "lr": 1.2798290140309924e-05, "epoch": 0.9280742459396751, "percentage": 46.88, "elapsed_time": "8:11:45", "remaining_time": "9:17:19"}
76
+ {"current_steps": 76, "total_steps": 160, "loss": 1.0341, "lr": 1.2588190451025209e-05, "epoch": 0.9404485692188709, "percentage": 47.5, "elapsed_time": "8:18:15", "remaining_time": "9:10:42"}
77
+ {"current_steps": 77, "total_steps": 160, "loss": 1.0462, "lr": 1.2376858923261732e-05, "epoch": 0.9528228924980665, "percentage": 48.12, "elapsed_time": "8:24:46", "remaining_time": "9:04:06"}
78
+ {"current_steps": 78, "total_steps": 160, "loss": 1.0446, "lr": 1.2164396139381029e-05, "epoch": 0.9651972157772621, "percentage": 48.75, "elapsed_time": "8:31:15", "remaining_time": "8:57:28"}
79
+ {"current_steps": 79, "total_steps": 160, "loss": 1.045, "lr": 1.1950903220161286e-05, "epoch": 0.9775715390564579, "percentage": 49.38, "elapsed_time": "8:37:47", "remaining_time": "8:50:53"}
80
+ {"current_steps": 80, "total_steps": 160, "loss": 1.0377, "lr": 1.1736481776669307e-05, "epoch": 0.9899458623356535, "percentage": 50.0, "elapsed_time": "8:44:20", "remaining_time": "8:44:20"}
81
+ {"current_steps": 81, "total_steps": 160, "loss": 2.0242, "lr": 1.1521233861899168e-05, "epoch": 1.0123743232791957, "percentage": 50.62, "elapsed_time": "8:55:08", "remaining_time": "8:41:55"}
82
+ {"current_steps": 82, "total_steps": 160, "loss": 0.9894, "lr": 1.130526192220052e-05, "epoch": 1.0247486465583913, "percentage": 51.25, "elapsed_time": "9:01:38", "remaining_time": "8:35:13"}
83
+ {"current_steps": 83, "total_steps": 160, "loss": 0.9824, "lr": 1.1088668748519646e-05, "epoch": 1.037122969837587, "percentage": 51.88, "elapsed_time": "9:08:08", "remaining_time": "8:28:31"}
84
+ {"current_steps": 84, "total_steps": 160, "loss": 0.971, "lr": 1.0871557427476585e-05, "epoch": 1.0494972931167827, "percentage": 52.5, "elapsed_time": "9:14:37", "remaining_time": "8:21:47"}
85
+ {"current_steps": 85, "total_steps": 160, "loss": 0.9799, "lr": 1.0654031292301432e-05, "epoch": 1.0618716163959783, "percentage": 53.12, "elapsed_time": "9:21:13", "remaining_time": "8:15:11"}
86
+ {"current_steps": 86, "total_steps": 160, "loss": 0.975, "lr": 1.0436193873653362e-05, "epoch": 1.074245939675174, "percentage": 53.75, "elapsed_time": "9:27:50", "remaining_time": "8:08:36"}
87
+ {"current_steps": 87, "total_steps": 160, "loss": 0.9633, "lr": 1.0218148850345613e-05, "epoch": 1.0866202629543698, "percentage": 54.37, "elapsed_time": "9:34:21", "remaining_time": "8:01:56"}
88
+ {"current_steps": 88, "total_steps": 160, "loss": 0.9802, "lr": 1e-05, "epoch": 1.0989945862335653, "percentage": 55.0, "elapsed_time": "9:40:51", "remaining_time": "7:55:14"}
89
+ {"current_steps": 89, "total_steps": 160, "loss": 0.9617, "lr": 9.78185114965439e-06, "epoch": 1.111368909512761, "percentage": 55.62, "elapsed_time": "9:47:21", "remaining_time": "7:48:33"}
90
+ {"current_steps": 90, "total_steps": 160, "loss": 0.9729, "lr": 9.563806126346643e-06, "epoch": 1.1237432327919568, "percentage": 56.25, "elapsed_time": "9:53:51", "remaining_time": "7:41:53"}
91
+ {"current_steps": 91, "total_steps": 160, "loss": 0.9787, "lr": 9.34596870769857e-06, "epoch": 1.1361175560711523, "percentage": 56.88, "elapsed_time": "10:00:21", "remaining_time": "7:35:13"}
92
+ {"current_steps": 92, "total_steps": 160, "loss": 0.9715, "lr": 9.128442572523418e-06, "epoch": 1.148491879350348, "percentage": 57.5, "elapsed_time": "10:06:59", "remaining_time": "7:28:38"}
93
+ {"current_steps": 93, "total_steps": 160, "loss": 0.973, "lr": 8.911331251480357e-06, "epoch": 1.1608662026295438, "percentage": 58.13, "elapsed_time": "10:13:30", "remaining_time": "7:21:59"}
94
+ {"current_steps": 94, "total_steps": 160, "loss": 0.9718, "lr": 8.694738077799487e-06, "epoch": 1.1732405259087393, "percentage": 58.75, "elapsed_time": "10:20:04", "remaining_time": "7:15:22"}
95
+ {"current_steps": 95, "total_steps": 160, "loss": 0.9653, "lr": 8.478766138100834e-06, "epoch": 1.185614849187935, "percentage": 59.38, "elapsed_time": "10:26:35", "remaining_time": "7:08:43"}
96
+ {"current_steps": 96, "total_steps": 160, "loss": 0.9696, "lr": 8.263518223330698e-06, "epoch": 1.1979891724671308, "percentage": 60.0, "elapsed_time": "10:33:07", "remaining_time": "7:02:04"}
97
+ {"current_steps": 97, "total_steps": 160, "loss": 0.9661, "lr": 8.04909677983872e-06, "epoch": 1.2103634957463263, "percentage": 60.62, "elapsed_time": "10:39:38", "remaining_time": "6:55:26"}
98
+ {"current_steps": 98, "total_steps": 160, "loss": 0.972, "lr": 7.835603860618973e-06, "epoch": 1.222737819025522, "percentage": 61.25, "elapsed_time": "10:46:10", "remaining_time": "6:48:48"}
99
+ {"current_steps": 99, "total_steps": 160, "loss": 0.971, "lr": 7.623141076738271e-06, "epoch": 1.2351121423047178, "percentage": 61.88, "elapsed_time": "10:52:41", "remaining_time": "6:42:09"}
100
+ {"current_steps": 100, "total_steps": 160, "loss": 0.9619, "lr": 7.411809548974792e-06, "epoch": 1.2474864655839133, "percentage": 62.5, "elapsed_time": "10:59:10", "remaining_time": "6:35:30"}
101
+ {"current_steps": 101, "total_steps": 160, "loss": 0.958, "lr": 7.201709859690081e-06, "epoch": 1.259860788863109, "percentage": 63.12, "elapsed_time": "11:12:16", "remaining_time": "6:32:42"}
102
+ {"current_steps": 102, "total_steps": 160, "loss": 0.9727, "lr": 6.992942004957271e-06, "epoch": 1.2722351121423048, "percentage": 63.75, "elapsed_time": "11:18:49", "remaining_time": "6:26:00"}
103
+ {"current_steps": 103, "total_steps": 160, "loss": 0.9639, "lr": 6.785605346968387e-06, "epoch": 1.2846094354215003, "percentage": 64.38, "elapsed_time": "11:25:22", "remaining_time": "6:19:16"}
104
+ {"current_steps": 104, "total_steps": 160, "loss": 0.9648, "lr": 6.579798566743314e-06, "epoch": 1.296983758700696, "percentage": 65.0, "elapsed_time": "11:31:52", "remaining_time": "6:12:32"}
105
+ {"current_steps": 105, "total_steps": 160, "loss": 0.9695, "lr": 6.375619617162985e-06, "epoch": 1.3093580819798918, "percentage": 65.62, "elapsed_time": "11:38:23", "remaining_time": "6:05:49"}
106
+ {"current_steps": 106, "total_steps": 160, "loss": 0.9505, "lr": 6.173165676349103e-06, "epoch": 1.3217324052590875, "percentage": 66.25, "elapsed_time": "11:44:52", "remaining_time": "5:59:05"}
107
+ {"current_steps": 107, "total_steps": 160, "loss": 0.9694, "lr": 5.97253310141263e-06, "epoch": 1.334106728538283, "percentage": 66.88, "elapsed_time": "11:51:22", "remaining_time": "5:52:21"}
108
+ {"current_steps": 108, "total_steps": 160, "loss": 0.9609, "lr": 5.773817382593008e-06, "epoch": 1.3464810518174788, "percentage": 67.5, "elapsed_time": "11:57:52", "remaining_time": "5:45:38"}
109
+ {"current_steps": 109, "total_steps": 160, "loss": 0.962, "lr": 5.5771130978099896e-06, "epoch": 1.3588553750966743, "percentage": 68.12, "elapsed_time": "12:04:23", "remaining_time": "5:38:56"}
110
+ {"current_steps": 110, "total_steps": 160, "loss": 0.9764, "lr": 5.382513867649663e-06, "epoch": 1.37122969837587, "percentage": 68.75, "elapsed_time": "12:10:52", "remaining_time": "5:32:13"}
111
+ {"current_steps": 111, "total_steps": 160, "loss": 0.9574, "lr": 5.190112310806126e-06, "epoch": 1.3836040216550658, "percentage": 69.38, "elapsed_time": "12:17:22", "remaining_time": "5:25:30"}
112
+ {"current_steps": 112, "total_steps": 160, "loss": 0.968, "lr": 5.000000000000003e-06, "epoch": 1.3959783449342615, "percentage": 70.0, "elapsed_time": "12:23:52", "remaining_time": "5:18:48"}
113
+ {"current_steps": 113, "total_steps": 160, "loss": 0.9563, "lr": 4.812267418394784e-06, "epoch": 1.408352668213457, "percentage": 70.62, "elapsed_time": "12:30:25", "remaining_time": "5:12:07"}
114
+ {"current_steps": 114, "total_steps": 160, "loss": 0.9594, "lr": 4.627003916531761e-06, "epoch": 1.4207269914926528, "percentage": 71.25, "elapsed_time": "12:36:58", "remaining_time": "5:05:26"}
115
+ {"current_steps": 115, "total_steps": 160, "loss": 0.951, "lr": 4.444297669803981e-06, "epoch": 1.4331013147718483, "percentage": 71.88, "elapsed_time": "12:43:31", "remaining_time": "4:58:46"}
116
+ {"current_steps": 116, "total_steps": 160, "loss": 0.9445, "lr": 4.264235636489542e-06, "epoch": 1.445475638051044, "percentage": 72.5, "elapsed_time": "12:50:00", "remaining_time": "4:52:04"}
117
+ {"current_steps": 117, "total_steps": 160, "loss": 0.9681, "lr": 4.086903516364179e-06, "epoch": 1.4578499613302398, "percentage": 73.12, "elapsed_time": "12:56:31", "remaining_time": "4:45:23"}
118
+ {"current_steps": 118, "total_steps": 160, "loss": 0.9654, "lr": 3.912385709912794e-06, "epoch": 1.4702242846094355, "percentage": 73.75, "elapsed_time": "13:03:00", "remaining_time": "4:38:41"}
119
+ {"current_steps": 119, "total_steps": 160, "loss": 0.9589, "lr": 3.7407652781594094e-06, "epoch": 1.482598607888631, "percentage": 74.38, "elapsed_time": "13:09:31", "remaining_time": "4:32:01"}
120
+ {"current_steps": 120, "total_steps": 160, "loss": 0.9614, "lr": 3.5721239031346067e-06, "epoch": 1.4949729311678268, "percentage": 75.0, "elapsed_time": "13:16:01", "remaining_time": "4:25:20"}
121
+ {"current_steps": 121, "total_steps": 160, "loss": 0.9687, "lr": 3.4065418489993118e-06, "epoch": 1.5073472544470223, "percentage": 75.62, "elapsed_time": "13:22:32", "remaining_time": "4:18:40"}
122
+ {"current_steps": 122, "total_steps": 160, "loss": 0.9556, "lr": 3.2440979238433977e-06, "epoch": 1.519721577726218, "percentage": 76.25, "elapsed_time": "13:29:08", "remaining_time": "4:12:01"}
123
+ {"current_steps": 123, "total_steps": 160, "loss": 0.9579, "lr": 3.0848694421773075e-06, "epoch": 1.5320959010054138, "percentage": 76.88, "elapsed_time": "13:35:39", "remaining_time": "4:05:21"}
124
+ {"current_steps": 124, "total_steps": 160, "loss": 0.9647, "lr": 2.9289321881345257e-06, "epoch": 1.5444702242846096, "percentage": 77.5, "elapsed_time": "13:42:08", "remaining_time": "3:58:41"}
125
+ {"current_steps": 125, "total_steps": 160, "loss": 0.9512, "lr": 2.776360379402445e-06, "epoch": 1.556844547563805, "percentage": 78.12, "elapsed_time": "13:48:45", "remaining_time": "3:52:03"}
126
+ {"current_steps": 126, "total_steps": 160, "loss": 0.9643, "lr": 2.6272266318987606e-06, "epoch": 1.5692188708430008, "percentage": 78.75, "elapsed_time": "13:55:18", "remaining_time": "3:45:24"}
127
+ {"current_steps": 127, "total_steps": 160, "loss": 0.9416, "lr": 2.4816019252102274e-06, "epoch": 1.5815931941221963, "percentage": 79.38, "elapsed_time": "14:01:55", "remaining_time": "3:38:46"}
128
+ {"current_steps": 128, "total_steps": 160, "loss": 0.9655, "lr": 2.339555568810221e-06, "epoch": 1.593967517401392, "percentage": 80.0, "elapsed_time": "14:08:29", "remaining_time": "3:32:07"}
129
+ {"current_steps": 129, "total_steps": 160, "loss": 0.9618, "lr": 2.201155169071184e-06, "epoch": 1.6063418406805878, "percentage": 80.62, "elapsed_time": "14:14:59", "remaining_time": "3:25:27"}
130
+ {"current_steps": 130, "total_steps": 160, "loss": 0.9559, "lr": 2.0664665970876496e-06, "epoch": 1.6187161639597836, "percentage": 81.25, "elapsed_time": "14:21:31", "remaining_time": "3:18:48"}
131
+ {"current_steps": 131, "total_steps": 160, "loss": 0.9561, "lr": 1.9355539573251737e-06, "epoch": 1.631090487238979, "percentage": 81.88, "elapsed_time": "14:28:08", "remaining_time": "3:12:11"}
132
+ {"current_steps": 132, "total_steps": 160, "loss": 0.9613, "lr": 1.808479557110081e-06, "epoch": 1.6434648105181748, "percentage": 82.5, "elapsed_time": "14:34:43", "remaining_time": "3:05:32"}
133
+ {"current_steps": 133, "total_steps": 160, "loss": 0.9633, "lr": 1.6853038769745466e-06, "epoch": 1.6558391337973704, "percentage": 83.12, "elapsed_time": "14:41:19", "remaining_time": "2:58:54"}
134
+ {"current_steps": 134, "total_steps": 160, "loss": 0.9524, "lr": 1.566085541871145e-06, "epoch": 1.668213457076566, "percentage": 83.75, "elapsed_time": "14:47:51", "remaining_time": "2:52:16"}
135
+ {"current_steps": 135, "total_steps": 160, "loss": 0.9564, "lr": 1.4508812932705364e-06, "epoch": 1.6805877803557618, "percentage": 84.38, "elapsed_time": "14:54:21", "remaining_time": "2:45:37"}
136
+ {"current_steps": 136, "total_steps": 160, "loss": 0.9581, "lr": 1.339745962155613e-06, "epoch": 1.6929621036349576, "percentage": 85.0, "elapsed_time": "15:00:52", "remaining_time": "2:38:58"}
137
+ {"current_steps": 137, "total_steps": 160, "loss": 0.9515, "lr": 1.2327324429249232e-06, "epoch": 1.705336426914153, "percentage": 85.62, "elapsed_time": "15:07:27", "remaining_time": "2:32:20"}
138
+ {"current_steps": 138, "total_steps": 160, "loss": 0.965, "lr": 1.129891668217783e-06, "epoch": 1.7177107501933488, "percentage": 86.25, "elapsed_time": "15:14:01", "remaining_time": "2:25:42"}
139
+ {"current_steps": 139, "total_steps": 160, "loss": 0.9627, "lr": 1.0312725846731174e-06, "epoch": 1.7300850734725444, "percentage": 86.88, "elapsed_time": "15:20:34", "remaining_time": "2:19:04"}
140
+ {"current_steps": 140, "total_steps": 160, "loss": 0.9638, "lr": 9.369221296335007e-07, "epoch": 1.74245939675174, "percentage": 87.5, "elapsed_time": "15:27:08", "remaining_time": "2:12:26"}
141
+ {"current_steps": 141, "total_steps": 160, "loss": 0.9511, "lr": 8.468852088055291e-07, "epoch": 1.7548337200309359, "percentage": 88.12, "elapsed_time": "15:33:40", "remaining_time": "2:05:48"}
142
+ {"current_steps": 142, "total_steps": 160, "loss": 0.9513, "lr": 7.612046748871327e-07, "epoch": 1.7672080433101316, "percentage": 88.75, "elapsed_time": "15:40:12", "remaining_time": "1:59:10"}
143
+ {"current_steps": 143, "total_steps": 160, "loss": 0.9522, "lr": 6.799213071720156e-07, "epoch": 1.7795823665893271, "percentage": 89.38, "elapsed_time": "15:46:41", "remaining_time": "1:52:32"}
144
+ {"current_steps": 144, "total_steps": 160, "loss": 0.9581, "lr": 6.030737921409169e-07, "epoch": 1.7919566898685229, "percentage": 90.0, "elapsed_time": "15:53:14", "remaining_time": "1:45:54"}
145
+ {"current_steps": 145, "total_steps": 160, "loss": 0.9579, "lr": 5.306987050489442e-07, "epoch": 1.8043310131477184, "percentage": 90.62, "elapsed_time": "15:59:45", "remaining_time": "1:39:17"}
146
+ {"current_steps": 146, "total_steps": 160, "loss": 0.9709, "lr": 4.628304925177318e-07, "epoch": 1.8167053364269141, "percentage": 91.25, "elapsed_time": "16:06:14", "remaining_time": "1:32:39"}
147
+ {"current_steps": 147, "total_steps": 160, "loss": 0.9512, "lr": 3.99501456140714e-07, "epoch": 1.8290796597061099, "percentage": 91.88, "elapsed_time": "16:12:45", "remaining_time": "1:26:01"}
148
+ {"current_steps": 148, "total_steps": 160, "loss": 0.9525, "lr": 3.4074173710931804e-07, "epoch": 1.8414539829853056, "percentage": 92.5, "elapsed_time": "16:19:15", "remaining_time": "1:19:23"}
149
+ {"current_steps": 149, "total_steps": 160, "loss": 0.9463, "lr": 2.865793018673857e-07, "epoch": 1.8538283062645011, "percentage": 93.12, "elapsed_time": "16:25:52", "remaining_time": "1:12:46"}
150
+ {"current_steps": 150, "total_steps": 160, "loss": 0.9469, "lr": 2.370399288006664e-07, "epoch": 1.8662026295436969, "percentage": 93.75, "elapsed_time": "16:32:24", "remaining_time": "1:06:09"}
151
+ {"current_steps": 151, "total_steps": 160, "loss": 0.961, "lr": 1.921471959676957e-07, "epoch": 1.8785769528228924, "percentage": 94.38, "elapsed_time": "16:38:59", "remaining_time": "0:59:32"}
152
+ {"current_steps": 152, "total_steps": 160, "loss": 0.9465, "lr": 1.519224698779198e-07, "epoch": 1.8909512761020881, "percentage": 95.0, "elapsed_time": "16:45:33", "remaining_time": "0:52:55"}
153
+ {"current_steps": 153, "total_steps": 160, "loss": 0.9539, "lr": 1.1638489532239339e-07, "epoch": 1.9033255993812839, "percentage": 95.62, "elapsed_time": "16:52:04", "remaining_time": "0:46:18"}
154
+ {"current_steps": 154, "total_steps": 160, "loss": 0.9512, "lr": 8.555138626189619e-08, "epoch": 1.9156999226604796, "percentage": 96.25, "elapsed_time": "16:58:35", "remaining_time": "0:39:41"}
155
+ {"current_steps": 155, "total_steps": 160, "loss": 0.9656, "lr": 5.943661777680354e-08, "epoch": 1.9280742459396751, "percentage": 96.88, "elapsed_time": "17:05:07", "remaining_time": "0:33:04"}
156
+ {"current_steps": 156, "total_steps": 160, "loss": 0.9528, "lr": 3.805301908254455e-08, "epoch": 1.9404485692188709, "percentage": 97.5, "elapsed_time": "17:11:39", "remaining_time": "0:26:27"}
157
+ {"current_steps": 157, "total_steps": 160, "loss": 0.9609, "lr": 2.1410767613965212e-08, "epoch": 1.9528228924980664, "percentage": 98.12, "elapsed_time": "17:18:14", "remaining_time": "0:19:50"}
158
+ {"current_steps": 158, "total_steps": 160, "loss": 0.962, "lr": 9.517784181422018e-09, "epoch": 1.9651972157772621, "percentage": 98.75, "elapsed_time": "17:24:45", "remaining_time": "0:13:13"}
159
+ {"current_steps": 159, "total_steps": 160, "loss": 0.9612, "lr": 2.379729200908676e-09, "epoch": 1.9775715390564579, "percentage": 99.38, "elapsed_time": "17:31:16", "remaining_time": "0:06:36"}
160
+ {"current_steps": 160, "total_steps": 160, "loss": 0.9597, "lr": 0.0, "epoch": 1.9899458623356536, "percentage": 100.0, "elapsed_time": "17:37:46", "remaining_time": "0:00:00"}
161
+ {"current_steps": 160, "total_steps": 160, "epoch": 1.9899458623356536, "percentage": 100.0, "elapsed_time": "17:45:01", "remaining_time": "0:00:00"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc51ce48253c31706cfe677ddc5c90072d374066fd669930926b5d1ab2ddf913
3
  size 7736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05f1aa67890e57a74ebaa46fadabcff22deb3bb50e42f0179e1a1cfadaa403fd
3
  size 7736