furmaniak commited on
Commit
5bdc908
·
verified ·
1 Parent(s): 4a2d6c5

Training in progress, step 100

Browse files
model-00001-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc5854d3f1c991156c1931bea3b6fffb334d590219e11c61b5ef8478ec859b1c
3
  size 4933656472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d71eb25767550422205fe89bb697c423225ee25b93c9254bd16d6548fb017ce0
3
  size 4933656472
model-00002-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0140d1172722c350e2371b37abe2e89f4d32049e5afd6ae221479f190255a9d1
3
  size 4954690712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5727b54c6a608c1cd654fb530332a3e5e298be6f7e1ae3afb37e6124bc45f6c3
3
  size 4954690712
model-00003-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7db684bec19f273ecf19da1eb6db1b6aaf97b51d37bf094e439a1361d5333b8d
3
  size 4902241352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6547b62ef757ff2252f630beed71452dcb8a525a40f4bc0d6aa16cf0540f28e
3
  size 4902241352
model-00004-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4955507ba5976df09f7ed849a45680006ed183994a628d4604cc4422e7457e23
3
  size 4771169120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daf268d466e9891ea803f46d76b541a5f13804d9efc8ad1f36d8b71967756519
3
  size 4771169120
model-00005-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a13b05c94c3c61e4ec82d7cb1db5ad90c022830c6b2817ebfaeab0be52b57f0
3
  size 4771169120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c56935fca60f62e9b15c2fed62910b34e6c0dc41627f5cc0a80d1cdc2cffc05
3
  size 4771169120
model-00006-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c3cb65a71ee9a406ed45080f4a1c88bd97bcb97414f609bf746a75b16e4ffa2
3
  size 4986116216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:087c22f9e41a37e59ffe9a1ce5a1ce80f3d0e002b17b22883277b247cfa3fc88
3
  size 4986116216
trainer_log.jsonl CHANGED
@@ -1,118 +1,102 @@
1
- {"current_steps": 1, "total_steps": 117, "loss": 1.8884, "lr": 1.6666666666666667e-06, "epoch": 0.008547008547008548, "percentage": 0.85, "elapsed_time": "0:03:29", "remaining_time": "6:45:06"}
2
- {"current_steps": 2, "total_steps": 117, "loss": 1.8929, "lr": 3.3333333333333333e-06, "epoch": 0.017094017094017096, "percentage": 1.71, "elapsed_time": "0:06:43", "remaining_time": "6:26:44"}
3
- {"current_steps": 3, "total_steps": 117, "loss": 1.9025, "lr": 5e-06, "epoch": 0.02564102564102564, "percentage": 2.56, "elapsed_time": "0:09:59", "remaining_time": "6:19:27"}
4
- {"current_steps": 4, "total_steps": 117, "loss": 1.8795, "lr": 6.666666666666667e-06, "epoch": 0.03418803418803419, "percentage": 3.42, "elapsed_time": "0:13:13", "remaining_time": "6:13:42"}
5
- {"current_steps": 5, "total_steps": 117, "loss": 1.8705, "lr": 8.333333333333334e-06, "epoch": 0.042735042735042736, "percentage": 4.27, "elapsed_time": "0:16:25", "remaining_time": "6:07:48"}
6
- {"current_steps": 6, "total_steps": 117, "loss": 1.8572, "lr": 1e-05, "epoch": 0.05128205128205128, "percentage": 5.13, "elapsed_time": "0:19:36", "remaining_time": "6:02:43"}
7
- {"current_steps": 7, "total_steps": 117, "loss": 1.8696, "lr": 9.99799753559161e-06, "epoch": 0.05982905982905983, "percentage": 5.98, "elapsed_time": "0:22:48", "remaining_time": "5:58:17"}
8
- {"current_steps": 8, "total_steps": 117, "loss": 1.8535, "lr": 9.991991746311916e-06, "epoch": 0.06837606837606838, "percentage": 6.84, "elapsed_time": "0:25:58", "remaining_time": "5:53:58"}
9
- {"current_steps": 9, "total_steps": 117, "loss": 1.8623, "lr": 9.981987442712634e-06, "epoch": 0.07692307692307693, "percentage": 7.69, "elapsed_time": "0:29:09", "remaining_time": "5:49:49"}
10
- {"current_steps": 10, "total_steps": 117, "loss": 1.8575, "lr": 9.967992638098517e-06, "epoch": 0.08547008547008547, "percentage": 8.55, "elapsed_time": "0:32:18", "remaining_time": "5:45:44"}
11
- {"current_steps": 11, "total_steps": 117, "loss": 1.8533, "lr": 9.950018542108818e-06, "epoch": 0.09401709401709402, "percentage": 9.4, "elapsed_time": "0:35:27", "remaining_time": "5:41:44"}
12
- {"current_steps": 12, "total_steps": 117, "loss": 1.8447, "lr": 9.928079551738542e-06, "epoch": 0.10256410256410256, "percentage": 10.26, "elapsed_time": "0:38:36", "remaining_time": "5:37:46"}
13
- {"current_steps": 13, "total_steps": 117, "loss": 1.8458, "lr": 9.902193239806634e-06, "epoch": 0.1111111111111111, "percentage": 11.11, "elapsed_time": "0:41:47", "remaining_time": "5:34:16"}
14
- {"current_steps": 14, "total_steps": 117, "loss": 1.8447, "lr": 9.872380340880416e-06, "epoch": 0.11965811965811966, "percentage": 11.97, "elapsed_time": "0:44:57", "remaining_time": "5:30:42"}
15
- {"current_steps": 15, "total_steps": 117, "loss": 1.8474, "lr": 9.838664734667496e-06, "epoch": 0.1282051282051282, "percentage": 12.82, "elapsed_time": "0:48:05", "remaining_time": "5:27:01"}
16
- {"current_steps": 16, "total_steps": 117, "loss": 1.8424, "lr": 9.801073426888447e-06, "epoch": 0.13675213675213677, "percentage": 13.68, "elapsed_time": "0:51:14", "remaining_time": "5:23:30"}
17
- {"current_steps": 17, "total_steps": 117, "loss": 1.8274, "lr": 9.759636527645633e-06, "epoch": 0.1452991452991453, "percentage": 14.53, "elapsed_time": "0:54:23", "remaining_time": "5:19:58"}
18
- {"current_steps": 18, "total_steps": 117, "loss": 1.8262, "lr": 9.714387227305422e-06, "epoch": 0.15384615384615385, "percentage": 15.38, "elapsed_time": "0:57:34", "remaining_time": "5:16:41"}
19
- {"current_steps": 19, "total_steps": 117, "loss": 1.8331, "lr": 9.665361769913187e-06, "epoch": 0.1623931623931624, "percentage": 16.24, "elapsed_time": "1:00:44", "remaining_time": "5:13:17"}
20
- {"current_steps": 20, "total_steps": 117, "loss": 1.8278, "lr": 9.612599424162344e-06, "epoch": 0.17094017094017094, "percentage": 17.09, "elapsed_time": "1:03:55", "remaining_time": "5:10:00"}
21
- {"current_steps": 21, "total_steps": 117, "loss": 1.8238, "lr": 9.55614245194068e-06, "epoch": 0.1794871794871795, "percentage": 17.95, "elapsed_time": "1:07:03", "remaining_time": "5:06:31"}
22
- {"current_steps": 22, "total_steps": 117, "loss": 1.8282, "lr": 9.496036074479184e-06, "epoch": 0.18803418803418803, "percentage": 18.8, "elapsed_time": "1:10:13", "remaining_time": "5:03:13"}
23
- {"current_steps": 23, "total_steps": 117, "loss": 1.825, "lr": 9.432328436130493e-06, "epoch": 0.19658119658119658, "percentage": 19.66, "elapsed_time": "1:13:22", "remaining_time": "4:59:54"}
24
- {"current_steps": 24, "total_steps": 117, "loss": 1.8165, "lr": 9.365070565805941e-06, "epoch": 0.20512820512820512, "percentage": 20.51, "elapsed_time": "1:16:34", "remaining_time": "4:56:43"}
25
- {"current_steps": 25, "total_steps": 117, "loss": 1.8194, "lr": 9.294316336102132e-06, "epoch": 0.21367521367521367, "percentage": 21.37, "elapsed_time": "1:19:43", "remaining_time": "4:53:23"}
26
- {"current_steps": 26, "total_steps": 117, "loss": 1.822, "lr": 9.220122420149753e-06, "epoch": 0.2222222222222222, "percentage": 22.22, "elapsed_time": "1:22:54", "remaining_time": "4:50:09"}
27
- {"current_steps": 27, "total_steps": 117, "loss": 1.8218, "lr": 9.142548246219212e-06, "epoch": 0.23076923076923078, "percentage": 23.08, "elapsed_time": "1:26:05", "remaining_time": "4:46:59"}
28
- {"current_steps": 28, "total_steps": 117, "loss": 1.8245, "lr": 9.06165595011943e-06, "epoch": 0.23931623931623933, "percentage": 23.93, "elapsed_time": "1:29:16", "remaining_time": "4:43:46"}
29
- {"current_steps": 29, "total_steps": 117, "loss": 1.8087, "lr": 8.97751032542795e-06, "epoch": 0.24786324786324787, "percentage": 24.79, "elapsed_time": "1:32:26", "remaining_time": "4:40:31"}
30
- {"current_steps": 30, "total_steps": 117, "loss": 1.8097, "lr": 8.890178771592198e-06, "epoch": 0.2564102564102564, "percentage": 25.64, "elapsed_time": "1:35:37", "remaining_time": "4:37:19"}
31
- {"current_steps": 31, "total_steps": 117, "loss": 1.8207, "lr": 8.799731239943488e-06, "epoch": 0.26495726495726496, "percentage": 26.5, "elapsed_time": "1:38:48", "remaining_time": "4:34:05"}
32
- {"current_steps": 32, "total_steps": 117, "loss": 1.8124, "lr": 8.706240177667003e-06, "epoch": 0.27350427350427353, "percentage": 27.35, "elapsed_time": "1:41:58", "remaining_time": "4:30:51"}
33
- {"current_steps": 33, "total_steps": 117, "loss": 1.8184, "lr": 8.609780469772623e-06, "epoch": 0.28205128205128205, "percentage": 28.21, "elapsed_time": "1:45:07", "remaining_time": "4:27:34"}
34
- {"current_steps": 34, "total_steps": 117, "loss": 1.819, "lr": 8.510429379113114e-06, "epoch": 0.2905982905982906, "percentage": 29.06, "elapsed_time": "1:48:15", "remaining_time": "4:24:17"}
35
- {"current_steps": 35, "total_steps": 117, "loss": 1.8153, "lr": 8.408266484497664e-06, "epoch": 0.29914529914529914, "percentage": 29.91, "elapsed_time": "1:51:23", "remaining_time": "4:20:58"}
36
- {"current_steps": 36, "total_steps": 117, "loss": 1.8141, "lr": 8.303373616950408e-06, "epoch": 0.3076923076923077, "percentage": 30.77, "elapsed_time": "1:54:33", "remaining_time": "4:17:44"}
37
- {"current_steps": 37, "total_steps": 117, "loss": 1.8072, "lr": 8.195834794164925e-06, "epoch": 0.3162393162393162, "percentage": 31.62, "elapsed_time": "1:57:40", "remaining_time": "4:14:25"}
38
- {"current_steps": 38, "total_steps": 117, "loss": 1.8171, "lr": 8.085736153207277e-06, "epoch": 0.3247863247863248, "percentage": 32.48, "elapsed_time": "2:00:51", "remaining_time": "4:11:15"}
39
- {"current_steps": 39, "total_steps": 117, "loss": 1.8192, "lr": 7.973165881521435e-06, "epoch": 0.3333333333333333, "percentage": 33.33, "elapsed_time": "2:04:00", "remaining_time": "4:08:00"}
40
- {"current_steps": 40, "total_steps": 117, "loss": 1.8069, "lr": 7.858214146292394e-06, "epoch": 0.3418803418803419, "percentage": 34.19, "elapsed_time": "2:07:09", "remaining_time": "4:04:47"}
41
- {"current_steps": 41, "total_steps": 117, "loss": 1.8093, "lr": 7.74097302222355e-06, "epoch": 0.3504273504273504, "percentage": 35.04, "elapsed_time": "2:10:19", "remaining_time": "4:01:33"}
42
- {"current_steps": 42, "total_steps": 117, "loss": 1.8014, "lr": 7.621536417786159e-06, "epoch": 0.358974358974359, "percentage": 35.9, "elapsed_time": "2:13:29", "remaining_time": "3:58:23"}
43
- {"current_steps": 43, "total_steps": 117, "loss": 1.8108, "lr": 7.500000000000001e-06, "epoch": 0.36752136752136755, "percentage": 36.75, "elapsed_time": "2:16:38", "remaining_time": "3:55:09"}
44
- {"current_steps": 44, "total_steps": 117, "loss": 1.8069, "lr": 7.37646111780545e-06, "epoch": 0.37606837606837606, "percentage": 37.61, "elapsed_time": "2:19:47", "remaining_time": "3:51:56"}
45
- {"current_steps": 45, "total_steps": 117, "loss": 1.8057, "lr": 7.251018724088367e-06, "epoch": 0.38461538461538464, "percentage": 38.46, "elapsed_time": "2:22:56", "remaining_time": "3:48:43"}
46
- {"current_steps": 46, "total_steps": 117, "loss": 1.8065, "lr": 7.12377329642024e-06, "epoch": 0.39316239316239315, "percentage": 39.32, "elapsed_time": "2:26:05", "remaining_time": "3:45:29"}
47
- {"current_steps": 47, "total_steps": 117, "loss": 1.7997, "lr": 6.994826756577082e-06, "epoch": 0.4017094017094017, "percentage": 40.17, "elapsed_time": "2:29:13", "remaining_time": "3:42:15"}
48
- {"current_steps": 48, "total_steps": 117, "loss": 1.8073, "lr": 6.864282388901544e-06, "epoch": 0.41025641025641024, "percentage": 41.03, "elapsed_time": "2:32:22", "remaining_time": "3:39:01"}
49
- {"current_steps": 49, "total_steps": 117, "loss": 1.8056, "lr": 6.732244757573619e-06, "epoch": 0.4188034188034188, "percentage": 41.88, "elapsed_time": "2:35:30", "remaining_time": "3:35:47"}
50
- {"current_steps": 50, "total_steps": 117, "loss": 1.807, "lr": 6.598819622856227e-06, "epoch": 0.42735042735042733, "percentage": 42.74, "elapsed_time": "2:38:38", "remaining_time": "3:32:35"}
51
- {"current_steps": 51, "total_steps": 117, "loss": 1.8098, "lr": 6.464113856382752e-06, "epoch": 0.4358974358974359, "percentage": 43.59, "elapsed_time": "2:41:48", "remaining_time": "3:29:23"}
52
- {"current_steps": 52, "total_steps": 117, "loss": 1.8016, "lr": 6.328235355554382e-06, "epoch": 0.4444444444444444, "percentage": 44.44, "elapsed_time": "2:44:59", "remaining_time": "3:26:14"}
53
- {"current_steps": 53, "total_steps": 117, "loss": 1.8111, "lr": 6.191292957115825e-06, "epoch": 0.452991452991453, "percentage": 45.3, "elapsed_time": "2:48:09", "remaining_time": "3:23:03"}
54
- {"current_steps": 54, "total_steps": 117, "loss": 1.8038, "lr": 6.053396349978632e-06, "epoch": 0.46153846153846156, "percentage": 46.15, "elapsed_time": "2:51:18", "remaining_time": "3:19:51"}
55
- {"current_steps": 55, "total_steps": 117, "loss": 1.7871, "lr": 5.914655987361934e-06, "epoch": 0.4700854700854701, "percentage": 47.01, "elapsed_time": "2:54:27", "remaining_time": "3:16:39"}
56
- {"current_steps": 56, "total_steps": 117, "loss": 1.8018, "lr": 5.77518299832099e-06, "epoch": 0.47863247863247865, "percentage": 47.86, "elapsed_time": "2:57:36", "remaining_time": "3:13:27"}
57
- {"current_steps": 57, "total_steps": 117, "loss": 1.8044, "lr": 5.635089098734394e-06, "epoch": 0.48717948717948717, "percentage": 48.72, "elapsed_time": "3:00:45", "remaining_time": "3:10:16"}
58
- {"current_steps": 58, "total_steps": 117, "loss": 1.8005, "lr": 5.49448650182125e-06, "epoch": 0.49572649572649574, "percentage": 49.57, "elapsed_time": "3:03:54", "remaining_time": "3:07:05"}
59
- {"current_steps": 59, "total_steps": 117, "loss": 1.8026, "lr": 5.353487828259973e-06, "epoch": 0.5042735042735043, "percentage": 50.43, "elapsed_time": "3:07:03", "remaining_time": "3:03:52"}
60
- {"current_steps": 60, "total_steps": 117, "loss": 1.7954, "lr": 5.212206015980742e-06, "epoch": 0.5128205128205128, "percentage": 51.28, "elapsed_time": "3:10:11", "remaining_time": "3:00:40"}
61
- {"current_steps": 61, "total_steps": 117, "loss": 1.7961, "lr": 5.070754229703811e-06, "epoch": 0.5213675213675214, "percentage": 52.14, "elapsed_time": "3:13:18", "remaining_time": "2:57:28"}
62
- {"current_steps": 62, "total_steps": 117, "loss": 1.8036, "lr": 4.929245770296191e-06, "epoch": 0.5299145299145299, "percentage": 52.99, "elapsed_time": "3:16:27", "remaining_time": "2:54:16"}
63
- {"current_steps": 63, "total_steps": 117, "loss": 1.8029, "lr": 4.78779398401926e-06, "epoch": 0.5384615384615384, "percentage": 53.85, "elapsed_time": "3:19:36", "remaining_time": "2:51:05"}
64
- {"current_steps": 64, "total_steps": 117, "loss": 1.8026, "lr": 4.646512171740028e-06, "epoch": 0.5470085470085471, "percentage": 54.7, "elapsed_time": "3:22:44", "remaining_time": "2:47:53"}
65
- {"current_steps": 65, "total_steps": 117, "loss": 1.8079, "lr": 4.505513498178752e-06, "epoch": 0.5555555555555556, "percentage": 55.56, "elapsed_time": "3:25:51", "remaining_time": "2:44:41"}
66
- {"current_steps": 66, "total_steps": 117, "loss": 1.8008, "lr": 4.364910901265607e-06, "epoch": 0.5641025641025641, "percentage": 56.41, "elapsed_time": "3:29:00", "remaining_time": "2:41:30"}
67
- {"current_steps": 67, "total_steps": 117, "loss": 1.7983, "lr": 4.224817001679011e-06, "epoch": 0.5726495726495726, "percentage": 57.26, "elapsed_time": "3:32:12", "remaining_time": "2:38:21"}
68
- {"current_steps": 68, "total_steps": 117, "loss": 1.799, "lr": 4.085344012638067e-06, "epoch": 0.5811965811965812, "percentage": 58.12, "elapsed_time": "3:35:21", "remaining_time": "2:35:11"}
69
- {"current_steps": 69, "total_steps": 117, "loss": 1.7981, "lr": 3.94660365002137e-06, "epoch": 0.5897435897435898, "percentage": 58.97, "elapsed_time": "3:38:31", "remaining_time": "2:32:01"}
70
- {"current_steps": 70, "total_steps": 117, "loss": 1.7983, "lr": 3.808707042884176e-06, "epoch": 0.5982905982905983, "percentage": 59.83, "elapsed_time": "3:41:40", "remaining_time": "2:28:50"}
71
- {"current_steps": 71, "total_steps": 117, "loss": 1.7924, "lr": 3.6717646444456196e-06, "epoch": 0.6068376068376068, "percentage": 60.68, "elapsed_time": "3:44:51", "remaining_time": "2:25:41"}
72
- {"current_steps": 72, "total_steps": 117, "loss": 1.799, "lr": 3.5358861436172487e-06, "epoch": 0.6153846153846154, "percentage": 61.54, "elapsed_time": "3:48:00", "remaining_time": "2:22:30"}
73
- {"current_steps": 73, "total_steps": 117, "loss": 1.8005, "lr": 3.401180377143774e-06, "epoch": 0.6239316239316239, "percentage": 62.39, "elapsed_time": "3:51:11", "remaining_time": "2:19:20"}
74
- {"current_steps": 74, "total_steps": 117, "loss": 1.7956, "lr": 3.2677552424263836e-06, "epoch": 0.6324786324786325, "percentage": 63.25, "elapsed_time": "3:54:20", "remaining_time": "2:16:10"}
75
- {"current_steps": 75, "total_steps": 117, "loss": 1.798, "lr": 3.1357176110984578e-06, "epoch": 0.6410256410256411, "percentage": 64.1, "elapsed_time": "3:57:29", "remaining_time": "2:12:59"}
76
- {"current_steps": 76, "total_steps": 117, "loss": 1.7934, "lr": 3.0051732434229185e-06, "epoch": 0.6495726495726496, "percentage": 64.96, "elapsed_time": "4:00:37", "remaining_time": "2:09:48"}
77
- {"current_steps": 77, "total_steps": 117, "loss": 1.8012, "lr": 2.8762267035797607e-06, "epoch": 0.6581196581196581, "percentage": 65.81, "elapsed_time": "4:03:46", "remaining_time": "2:06:37"}
78
- {"current_steps": 78, "total_steps": 117, "loss": 1.7915, "lr": 2.748981275911633e-06, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "4:06:54", "remaining_time": "2:03:27"}
79
- {"current_steps": 79, "total_steps": 117, "loss": 1.7867, "lr": 2.6235388821945497e-06, "epoch": 0.6752136752136753, "percentage": 67.52, "elapsed_time": "4:10:05", "remaining_time": "2:00:17"}
80
- {"current_steps": 80, "total_steps": 117, "loss": 1.7952, "lr": 2.5000000000000015e-06, "epoch": 0.6837606837606838, "percentage": 68.38, "elapsed_time": "4:13:13", "remaining_time": "1:57:07"}
81
- {"current_steps": 81, "total_steps": 117, "loss": 1.8026, "lr": 2.3784635822138424e-06, "epoch": 0.6923076923076923, "percentage": 69.23, "elapsed_time": "4:16:22", "remaining_time": "1:53:56"}
82
- {"current_steps": 82, "total_steps": 117, "loss": 1.7956, "lr": 2.2590269777764516e-06, "epoch": 0.7008547008547008, "percentage": 70.09, "elapsed_time": "4:19:32", "remaining_time": "1:50:46"}
83
- {"current_steps": 83, "total_steps": 117, "loss": 1.7947, "lr": 2.141785853707607e-06, "epoch": 0.7094017094017094, "percentage": 70.94, "elapsed_time": "4:22:41", "remaining_time": "1:47:36"}
84
- {"current_steps": 84, "total_steps": 117, "loss": 1.7963, "lr": 2.0268341184785674e-06, "epoch": 0.717948717948718, "percentage": 71.79, "elapsed_time": "4:25:50", "remaining_time": "1:44:26"}
85
- {"current_steps": 85, "total_steps": 117, "loss": 1.7974, "lr": 1.9142638467927254e-06, "epoch": 0.7264957264957265, "percentage": 72.65, "elapsed_time": "4:28:59", "remaining_time": "1:41:15"}
86
- {"current_steps": 86, "total_steps": 117, "loss": 1.794, "lr": 1.8041652058350768e-06, "epoch": 0.7350427350427351, "percentage": 73.5, "elapsed_time": "4:32:07", "remaining_time": "1:38:05"}
87
- {"current_steps": 87, "total_steps": 117, "loss": 1.8017, "lr": 1.6966263830495939e-06, "epoch": 0.7435897435897436, "percentage": 74.36, "elapsed_time": "4:35:14", "remaining_time": "1:34:54"}
88
- {"current_steps": 88, "total_steps": 117, "loss": 1.7874, "lr": 1.5917335155023368e-06, "epoch": 0.7521367521367521, "percentage": 75.21, "elapsed_time": "4:38:24", "remaining_time": "1:31:44"}
89
- {"current_steps": 89, "total_steps": 117, "loss": 1.8012, "lr": 1.4895706208868876e-06, "epoch": 0.7606837606837606, "percentage": 76.07, "elapsed_time": "4:41:32", "remaining_time": "1:28:34"}
90
- {"current_steps": 90, "total_steps": 117, "loss": 1.8029, "lr": 1.390219530227378e-06, "epoch": 0.7692307692307693, "percentage": 76.92, "elapsed_time": "4:44:40", "remaining_time": "1:25:24"}
91
- {"current_steps": 91, "total_steps": 117, "loss": 1.7955, "lr": 1.2937598223330006e-06, "epoch": 0.7777777777777778, "percentage": 77.78, "elapsed_time": "4:47:48", "remaining_time": "1:22:13"}
92
- {"current_steps": 92, "total_steps": 117, "loss": 1.7919, "lr": 1.2002687600565138e-06, "epoch": 0.7863247863247863, "percentage": 78.63, "elapsed_time": "4:50:56", "remaining_time": "1:19:03"}
93
- {"current_steps": 93, "total_steps": 117, "loss": 1.794, "lr": 1.1098212284078037e-06, "epoch": 0.7948717948717948, "percentage": 79.49, "elapsed_time": "4:54:04", "remaining_time": "1:15:53"}
94
- {"current_steps": 94, "total_steps": 117, "loss": 1.7978, "lr": 1.0224896745720513e-06, "epoch": 0.8034188034188035, "percentage": 80.34, "elapsed_time": "4:57:12", "remaining_time": "1:12:43"}
95
- {"current_steps": 95, "total_steps": 117, "loss": 1.8013, "lr": 9.383440498805712e-07, "epoch": 0.811965811965812, "percentage": 81.2, "elapsed_time": "5:00:24", "remaining_time": "1:09:34"}
96
- {"current_steps": 96, "total_steps": 117, "loss": 1.7928, "lr": 8.574517537807897e-07, "epoch": 0.8205128205128205, "percentage": 82.05, "elapsed_time": "5:03:33", "remaining_time": "1:06:24"}
97
- {"current_steps": 97, "total_steps": 117, "loss": 1.7875, "lr": 7.798775798502484e-07, "epoch": 0.8290598290598291, "percentage": 82.91, "elapsed_time": "5:06:43", "remaining_time": "1:03:14"}
98
- {"current_steps": 98, "total_steps": 117, "loss": 1.7868, "lr": 7.056836638978698e-07, "epoch": 0.8376068376068376, "percentage": 83.76, "elapsed_time": "5:09:54", "remaining_time": "1:00:05"}
99
- {"current_steps": 99, "total_steps": 117, "loss": 1.7947, "lr": 6.349294341940593e-07, "epoch": 0.8461538461538461, "percentage": 84.62, "elapsed_time": "5:13:05", "remaining_time": "0:56:55"}
100
- {"current_steps": 100, "total_steps": 117, "loss": 1.7933, "lr": 5.676715638695063e-07, "epoch": 0.8547008547008547, "percentage": 85.47, "elapsed_time": "5:16:13", "remaining_time": "0:53:45"}
101
- {"current_steps": 101, "total_steps": 117, "loss": 1.7983, "lr": 5.039639255208156e-07, "epoch": 0.8632478632478633, "percentage": 86.32, "elapsed_time": "5:21:46", "remaining_time": "0:50:58"}
102
- {"current_steps": 102, "total_steps": 117, "loss": 1.7923, "lr": 4.43857548059321e-07, "epoch": 0.8717948717948718, "percentage": 87.18, "elapsed_time": "5:24:55", "remaining_time": "0:47:46"}
103
- {"current_steps": 103, "total_steps": 117, "loss": 1.8015, "lr": 3.87400575837657e-07, "epoch": 0.8803418803418803, "percentage": 88.03, "elapsed_time": "5:28:04", "remaining_time": "0:44:35"}
104
- {"current_steps": 104, "total_steps": 117, "loss": 1.7987, "lr": 3.346382300868134e-07, "epoch": 0.8888888888888888, "percentage": 88.89, "elapsed_time": "5:31:14", "remaining_time": "0:41:24"}
105
- {"current_steps": 105, "total_steps": 117, "loss": 1.801, "lr": 2.85612772694579e-07, "epoch": 0.8974358974358975, "percentage": 89.74, "elapsed_time": "5:34:25", "remaining_time": "0:38:13"}
106
- {"current_steps": 106, "total_steps": 117, "loss": 1.797, "lr": 2.403634723543674e-07, "epoch": 0.905982905982906, "percentage": 90.6, "elapsed_time": "5:37:36", "remaining_time": "0:35:02"}
107
- {"current_steps": 107, "total_steps": 117, "loss": 1.7963, "lr": 1.989265731115525e-07, "epoch": 0.9145299145299145, "percentage": 91.45, "elapsed_time": "5:40:48", "remaining_time": "0:31:51"}
108
- {"current_steps": 108, "total_steps": 117, "loss": 1.7919, "lr": 1.6133526533250566e-07, "epoch": 0.9230769230769231, "percentage": 92.31, "elapsed_time": "5:43:58", "remaining_time": "0:28:39"}
109
- {"current_steps": 109, "total_steps": 117, "loss": 1.7973, "lr": 1.2761965911958385e-07, "epoch": 0.9316239316239316, "percentage": 93.16, "elapsed_time": "5:47:09", "remaining_time": "0:25:28"}
110
- {"current_steps": 110, "total_steps": 117, "loss": 1.7944, "lr": 9.780676019336632e-08, "epoch": 0.9401709401709402, "percentage": 94.02, "elapsed_time": "5:50:21", "remaining_time": "0:22:17"}
111
- {"current_steps": 111, "total_steps": 117, "loss": 1.7929, "lr": 7.192044826145772e-08, "epoch": 0.9487179487179487, "percentage": 94.87, "elapsed_time": "5:53:32", "remaining_time": "0:19:06"}
112
- {"current_steps": 112, "total_steps": 117, "loss": 1.7953, "lr": 4.998145789118114e-08, "epoch": 0.9572649572649573, "percentage": 95.73, "elapsed_time": "5:56:42", "remaining_time": "0:15:55"}
113
- {"current_steps": 113, "total_steps": 117, "loss": 1.794, "lr": 3.2007361901485455e-08, "epoch": 0.9658119658119658, "percentage": 96.58, "elapsed_time": "5:59:52", "remaining_time": "0:12:44"}
114
- {"current_steps": 114, "total_steps": 117, "loss": 1.7915, "lr": 1.8012557287367394e-08, "epoch": 0.9743589743589743, "percentage": 97.44, "elapsed_time": "6:03:04", "remaining_time": "0:09:33"}
115
- {"current_steps": 115, "total_steps": 117, "loss": 1.7899, "lr": 8.008253688084888e-09, "epoch": 0.9829059829059829, "percentage": 98.29, "elapsed_time": "6:06:15", "remaining_time": "0:06:22"}
116
- {"current_steps": 116, "total_steps": 117, "loss": 1.7893, "lr": 2.002464408392135e-09, "epoch": 0.9914529914529915, "percentage": 99.15, "elapsed_time": "6:09:26", "remaining_time": "0:03:11"}
117
- {"current_steps": 117, "total_steps": 117, "loss": 1.7864, "lr": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "6:12:36", "remaining_time": "0:00:00"}
118
- {"current_steps": 117, "total_steps": 117, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "6:15:35", "remaining_time": "0:00:00"}
 
1
+ {"current_steps": 1, "total_steps": 550, "loss": 1.8898, "lr": 3.5714285714285716e-07, "epoch": 0.0018177686889343332, "percentage": 0.18, "elapsed_time": "0:03:25", "remaining_time": "1 day, 7:20:22"}
2
+ {"current_steps": 2, "total_steps": 550, "loss": 1.8867, "lr": 7.142857142857143e-07, "epoch": 0.0036355373778686664, "percentage": 0.36, "elapsed_time": "0:06:40", "remaining_time": "1 day, 6:30:39"}
3
+ {"current_steps": 3, "total_steps": 550, "loss": 1.8848, "lr": 1.0714285714285714e-06, "epoch": 0.0054533060668029995, "percentage": 0.55, "elapsed_time": "0:09:52", "remaining_time": "1 day, 5:59:21"}
4
+ {"current_steps": 4, "total_steps": 550, "loss": 1.888, "lr": 1.4285714285714286e-06, "epoch": 0.007271074755737333, "percentage": 0.73, "elapsed_time": "0:13:03", "remaining_time": "1 day, 5:43:05"}
5
+ {"current_steps": 5, "total_steps": 550, "loss": 1.8816, "lr": 1.7857142857142859e-06, "epoch": 0.009088843444671665, "percentage": 0.91, "elapsed_time": "0:16:16", "remaining_time": "1 day, 5:33:54"}
6
+ {"current_steps": 6, "total_steps": 550, "loss": 1.8851, "lr": 2.1428571428571427e-06, "epoch": 0.010906612133605999, "percentage": 1.09, "elapsed_time": "0:19:27", "remaining_time": "1 day, 5:24:27"}
7
+ {"current_steps": 7, "total_steps": 550, "loss": 1.8799, "lr": 2.5e-06, "epoch": 0.012724380822540331, "percentage": 1.27, "elapsed_time": "0:22:39", "remaining_time": "1 day, 5:17:57"}
8
+ {"current_steps": 8, "total_steps": 550, "loss": 1.8785, "lr": 2.8571428571428573e-06, "epoch": 0.014542149511474665, "percentage": 1.45, "elapsed_time": "0:25:51", "remaining_time": "1 day, 5:12:11"}
9
+ {"current_steps": 9, "total_steps": 550, "loss": 1.8763, "lr": 3.2142857142857147e-06, "epoch": 0.016359918200409, "percentage": 1.64, "elapsed_time": "0:29:03", "remaining_time": "1 day, 5:06:30"}
10
+ {"current_steps": 10, "total_steps": 550, "loss": 1.8676, "lr": 3.5714285714285718e-06, "epoch": 0.01817768688934333, "percentage": 1.82, "elapsed_time": "0:32:13", "remaining_time": "1 day, 5:00:21"}
11
+ {"current_steps": 11, "total_steps": 550, "loss": 1.8634, "lr": 3.928571428571429e-06, "epoch": 0.019995455578277664, "percentage": 2.0, "elapsed_time": "0:35:25", "remaining_time": "1 day, 4:55:59"}
12
+ {"current_steps": 12, "total_steps": 550, "loss": 1.864, "lr": 4.2857142857142855e-06, "epoch": 0.021813224267211998, "percentage": 2.18, "elapsed_time": "0:38:36", "remaining_time": "1 day, 4:50:54"}
13
+ {"current_steps": 13, "total_steps": 550, "loss": 1.8647, "lr": 4.642857142857144e-06, "epoch": 0.02363099295614633, "percentage": 2.36, "elapsed_time": "0:41:46", "remaining_time": "1 day, 4:45:46"}
14
+ {"current_steps": 14, "total_steps": 550, "loss": 1.8605, "lr": 5e-06, "epoch": 0.025448761645080663, "percentage": 2.55, "elapsed_time": "0:44:56", "remaining_time": "1 day, 4:40:44"}
15
+ {"current_steps": 15, "total_steps": 550, "loss": 1.8648, "lr": 5.357142857142857e-06, "epoch": 0.027266530334014997, "percentage": 2.73, "elapsed_time": "0:48:07", "remaining_time": "1 day, 4:36:38"}
16
+ {"current_steps": 16, "total_steps": 550, "loss": 1.8536, "lr": 5.7142857142857145e-06, "epoch": 0.02908429902294933, "percentage": 2.91, "elapsed_time": "0:51:17", "remaining_time": "1 day, 4:32:06"}
17
+ {"current_steps": 17, "total_steps": 550, "loss": 1.8485, "lr": 6.071428571428571e-06, "epoch": 0.03090206771188366, "percentage": 3.09, "elapsed_time": "0:54:29", "remaining_time": "1 day, 4:28:19"}
18
+ {"current_steps": 18, "total_steps": 550, "loss": 1.8536, "lr": 6.4285714285714295e-06, "epoch": 0.032719836400818, "percentage": 3.27, "elapsed_time": "0:57:39", "remaining_time": "1 day, 4:23:56"}
19
+ {"current_steps": 19, "total_steps": 550, "loss": 1.8491, "lr": 6.785714285714287e-06, "epoch": 0.03453760508975233, "percentage": 3.45, "elapsed_time": "1:00:49", "remaining_time": "1 day, 4:19:43"}
20
+ {"current_steps": 20, "total_steps": 550, "loss": 1.8361, "lr": 7.1428571428571436e-06, "epoch": 0.03635537377868666, "percentage": 3.64, "elapsed_time": "1:03:59", "remaining_time": "1 day, 4:15:34"}
21
+ {"current_steps": 21, "total_steps": 550, "loss": 1.8522, "lr": 7.500000000000001e-06, "epoch": 0.038173142467621, "percentage": 3.82, "elapsed_time": "1:07:10", "remaining_time": "1 day, 4:12:12"}
22
+ {"current_steps": 22, "total_steps": 550, "loss": 1.8391, "lr": 7.857142857142858e-06, "epoch": 0.03999091115655533, "percentage": 4.0, "elapsed_time": "1:10:21", "remaining_time": "1 day, 4:08:33"}
23
+ {"current_steps": 23, "total_steps": 550, "loss": 1.8345, "lr": 8.214285714285714e-06, "epoch": 0.04180867984548966, "percentage": 4.18, "elapsed_time": "1:13:33", "remaining_time": "1 day, 4:05:29"}
24
+ {"current_steps": 24, "total_steps": 550, "loss": 1.8342, "lr": 8.571428571428571e-06, "epoch": 0.043626448534423996, "percentage": 4.36, "elapsed_time": "1:16:45", "remaining_time": "1 day, 4:02:12"}
25
+ {"current_steps": 25, "total_steps": 550, "loss": 1.8399, "lr": 8.92857142857143e-06, "epoch": 0.04544421722335833, "percentage": 4.55, "elapsed_time": "1:19:54", "remaining_time": "1 day, 3:58:10"}
26
+ {"current_steps": 26, "total_steps": 550, "loss": 1.833, "lr": 9.285714285714288e-06, "epoch": 0.04726198591229266, "percentage": 4.73, "elapsed_time": "1:23:06", "remaining_time": "1 day, 3:54:55"}
27
+ {"current_steps": 27, "total_steps": 550, "loss": 1.8342, "lr": 9.642857142857144e-06, "epoch": 0.049079754601226995, "percentage": 4.91, "elapsed_time": "1:26:17", "remaining_time": "1 day, 3:51:20"}
28
+ {"current_steps": 28, "total_steps": 550, "loss": 1.8313, "lr": 1e-05, "epoch": 0.050897523290161326, "percentage": 5.09, "elapsed_time": "1:29:29", "remaining_time": "1 day, 3:48:31"}
29
+ {"current_steps": 29, "total_steps": 550, "loss": 1.8291, "lr": 9.999909448127131e-06, "epoch": 0.05271529197909566, "percentage": 5.27, "elapsed_time": "1:32:39", "remaining_time": "1 day, 3:44:39"}
30
+ {"current_steps": 30, "total_steps": 550, "loss": 1.8185, "lr": 9.999637795788383e-06, "epoch": 0.054533060668029994, "percentage": 5.45, "elapsed_time": "1:35:49", "remaining_time": "1 day, 3:41:01"}
31
+ {"current_steps": 31, "total_steps": 550, "loss": 1.8261, "lr": 9.999185052823207e-06, "epoch": 0.056350829356964324, "percentage": 5.64, "elapsed_time": "1:38:59", "remaining_time": "1 day, 3:37:25"}
32
+ {"current_steps": 32, "total_steps": 550, "loss": 1.8237, "lr": 9.99855123563029e-06, "epoch": 0.05816859804589866, "percentage": 5.82, "elapsed_time": "1:42:10", "remaining_time": "1 day, 3:33:57"}
33
+ {"current_steps": 33, "total_steps": 550, "loss": 1.827, "lr": 9.997736367166967e-06, "epoch": 0.05998636673483299, "percentage": 6.0, "elapsed_time": "1:45:21", "remaining_time": "1 day, 3:30:44"}
34
+ {"current_steps": 34, "total_steps": 550, "loss": 1.8257, "lr": 9.996740476948386e-06, "epoch": 0.06180413542376732, "percentage": 6.18, "elapsed_time": "1:48:32", "remaining_time": "1 day, 3:27:15"}
35
+ {"current_steps": 35, "total_steps": 550, "loss": 1.819, "lr": 9.995563601046434e-06, "epoch": 0.06362190411270166, "percentage": 6.36, "elapsed_time": "1:51:42", "remaining_time": "1 day, 3:23:49"}
36
+ {"current_steps": 36, "total_steps": 550, "loss": 1.8136, "lr": 9.994205782088438e-06, "epoch": 0.065439672801636, "percentage": 6.55, "elapsed_time": "1:54:54", "remaining_time": "1 day, 3:20:37"}
37
+ {"current_steps": 37, "total_steps": 550, "loss": 1.8206, "lr": 9.99266706925562e-06, "epoch": 0.06725744149057032, "percentage": 6.73, "elapsed_time": "1:58:06", "remaining_time": "1 day, 3:17:37"}
38
+ {"current_steps": 38, "total_steps": 550, "loss": 1.8281, "lr": 9.990947518281312e-06, "epoch": 0.06907521017950466, "percentage": 6.91, "elapsed_time": "2:01:16", "remaining_time": "1 day, 3:13:59"}
39
+ {"current_steps": 39, "total_steps": 550, "loss": 1.82, "lr": 9.989047191448934e-06, "epoch": 0.070892978868439, "percentage": 7.09, "elapsed_time": "2:04:25", "remaining_time": "1 day, 3:10:23"}
40
+ {"current_steps": 40, "total_steps": 550, "loss": 1.8079, "lr": 9.986966157589751e-06, "epoch": 0.07271074755737332, "percentage": 7.27, "elapsed_time": "2:07:37", "remaining_time": "1 day, 3:07:09"}
41
+ {"current_steps": 41, "total_steps": 550, "loss": 1.8088, "lr": 9.984704492080366e-06, "epoch": 0.07452851624630766, "percentage": 7.45, "elapsed_time": "2:10:48", "remaining_time": "1 day, 3:03:56"}
42
+ {"current_steps": 42, "total_steps": 550, "loss": 1.8153, "lr": 9.982262276840002e-06, "epoch": 0.076346284935242, "percentage": 7.64, "elapsed_time": "2:14:00", "remaining_time": "1 day, 3:00:49"}
43
+ {"current_steps": 43, "total_steps": 550, "loss": 1.8082, "lr": 9.979639600327522e-06, "epoch": 0.07816405362417632, "percentage": 7.82, "elapsed_time": "2:17:10", "remaining_time": "1 day, 2:57:27"}
44
+ {"current_steps": 44, "total_steps": 550, "loss": 1.8087, "lr": 9.976836557538234e-06, "epoch": 0.07998182231311066, "percentage": 8.0, "elapsed_time": "2:20:22", "remaining_time": "1 day, 2:54:18"}
45
+ {"current_steps": 45, "total_steps": 550, "loss": 1.8132, "lr": 9.973853250000449e-06, "epoch": 0.081799591002045, "percentage": 8.18, "elapsed_time": "2:23:31", "remaining_time": "1 day, 2:50:41"}
46
+ {"current_steps": 46, "total_steps": 550, "loss": 1.8077, "lr": 9.970689785771798e-06, "epoch": 0.08361735969097932, "percentage": 8.36, "elapsed_time": "2:26:44", "remaining_time": "1 day, 2:47:48"}
47
+ {"current_steps": 47, "total_steps": 550, "loss": 1.8063, "lr": 9.967346279435328e-06, "epoch": 0.08543512837991366, "percentage": 8.55, "elapsed_time": "2:29:54", "remaining_time": "1 day, 2:44:17"}
48
+ {"current_steps": 48, "total_steps": 550, "loss": 1.8036, "lr": 9.963822852095344e-06, "epoch": 0.08725289706884799, "percentage": 8.73, "elapsed_time": "2:33:03", "remaining_time": "1 day, 2:40:45"}
49
+ {"current_steps": 49, "total_steps": 550, "loss": 1.8135, "lr": 9.960119631373023e-06, "epoch": 0.08907066575778232, "percentage": 8.91, "elapsed_time": "2:36:13", "remaining_time": "1 day, 2:37:20"}
50
+ {"current_steps": 50, "total_steps": 550, "loss": 1.8115, "lr": 9.95623675140179e-06, "epoch": 0.09088843444671665, "percentage": 9.09, "elapsed_time": "2:39:24", "remaining_time": "1 day, 2:34:08"}
51
+ {"current_steps": 51, "total_steps": 550, "loss": 1.8087, "lr": 9.952174352822474e-06, "epoch": 0.09270620313565099, "percentage": 9.27, "elapsed_time": "2:42:36", "remaining_time": "1 day, 2:30:56"}
52
+ {"current_steps": 52, "total_steps": 550, "loss": 1.8093, "lr": 9.947932582778188e-06, "epoch": 0.09452397182458531, "percentage": 9.45, "elapsed_time": "2:45:46", "remaining_time": "1 day, 2:27:34"}
53
+ {"current_steps": 53, "total_steps": 550, "loss": 1.8008, "lr": 9.943511594909024e-06, "epoch": 0.09634174051351965, "percentage": 9.64, "elapsed_time": "2:48:59", "remaining_time": "1 day, 2:24:38"}
54
+ {"current_steps": 54, "total_steps": 550, "loss": 1.8075, "lr": 9.938911549346473e-06, "epoch": 0.09815950920245399, "percentage": 9.82, "elapsed_time": "2:52:08", "remaining_time": "1 day, 2:21:05"}
55
+ {"current_steps": 55, "total_steps": 550, "loss": 1.8065, "lr": 9.934132612707631e-06, "epoch": 0.09997727789138833, "percentage": 10.0, "elapsed_time": "2:55:18", "remaining_time": "1 day, 2:17:44"}
56
+ {"current_steps": 56, "total_steps": 550, "loss": 1.8066, "lr": 9.929174958089167e-06, "epoch": 0.10179504658032265, "percentage": 10.18, "elapsed_time": "2:58:28", "remaining_time": "1 day, 2:14:23"}
57
+ {"current_steps": 57, "total_steps": 550, "loss": 1.8089, "lr": 9.924038765061042e-06, "epoch": 0.10361281526925699, "percentage": 10.36, "elapsed_time": "3:01:38", "remaining_time": "1 day, 2:11:03"}
58
+ {"current_steps": 58, "total_steps": 550, "loss": 1.8063, "lr": 9.918724219660013e-06, "epoch": 0.10543058395819133, "percentage": 10.55, "elapsed_time": "3:04:49", "remaining_time": "1 day, 2:07:51"}
59
+ {"current_steps": 59, "total_steps": 550, "loss": 1.7952, "lr": 9.913231514382902e-06, "epoch": 0.10724835264712565, "percentage": 10.73, "elapsed_time": "3:08:02", "remaining_time": "1 day, 2:04:51"}
60
+ {"current_steps": 60, "total_steps": 550, "loss": 1.797, "lr": 9.907560848179607e-06, "epoch": 0.10906612133605999, "percentage": 10.91, "elapsed_time": "3:11:14", "remaining_time": "1 day, 2:01:48"}
61
+ {"current_steps": 61, "total_steps": 550, "loss": 1.7966, "lr": 9.901712426445901e-06, "epoch": 0.11088389002499432, "percentage": 11.09, "elapsed_time": "3:14:24", "remaining_time": "1 day, 1:58:26"}
62
+ {"current_steps": 62, "total_steps": 550, "loss": 1.8097, "lr": 9.895686461016007e-06, "epoch": 0.11270165871392865, "percentage": 11.27, "elapsed_time": "3:17:34", "remaining_time": "1 day, 1:55:04"}
63
+ {"current_steps": 63, "total_steps": 550, "loss": 1.7984, "lr": 9.889483170154903e-06, "epoch": 0.11451942740286299, "percentage": 11.45, "elapsed_time": "3:20:44", "remaining_time": "1 day, 1:51:46"}
64
+ {"current_steps": 64, "total_steps": 550, "loss": 1.8013, "lr": 9.883102778550434e-06, "epoch": 0.11633719609179732, "percentage": 11.64, "elapsed_time": "3:23:54", "remaining_time": "1 day, 1:48:25"}
65
+ {"current_steps": 65, "total_steps": 550, "loss": 1.7993, "lr": 9.876545517305163e-06, "epoch": 0.11815496478073165, "percentage": 11.82, "elapsed_time": "3:27:04", "remaining_time": "1 day, 1:45:04"}
66
+ {"current_steps": 66, "total_steps": 550, "loss": 1.7968, "lr": 9.869811623928001e-06, "epoch": 0.11997273346966598, "percentage": 12.0, "elapsed_time": "3:30:14", "remaining_time": "1 day, 1:41:45"}
67
+ {"current_steps": 67, "total_steps": 550, "loss": 1.7947, "lr": 9.862901342325617e-06, "epoch": 0.12179050215860032, "percentage": 12.18, "elapsed_time": "3:33:25", "remaining_time": "1 day, 1:38:35"}
68
+ {"current_steps": 68, "total_steps": 550, "loss": 1.8011, "lr": 9.855814922793583e-06, "epoch": 0.12360827084753465, "percentage": 12.36, "elapsed_time": "3:36:35", "remaining_time": "1 day, 1:35:12"}
69
+ {"current_steps": 69, "total_steps": 550, "loss": 1.7956, "lr": 9.848552622007326e-06, "epoch": 0.125426039536469, "percentage": 12.55, "elapsed_time": "3:39:44", "remaining_time": "1 day, 1:31:51"}
70
+ {"current_steps": 70, "total_steps": 550, "loss": 1.7961, "lr": 9.841114703012817e-06, "epoch": 0.12724380822540332, "percentage": 12.73, "elapsed_time": "3:42:55", "remaining_time": "1 day, 1:28:35"}
71
+ {"current_steps": 71, "total_steps": 550, "loss": 1.7981, "lr": 9.83350143521706e-06, "epoch": 0.12906157691433764, "percentage": 12.91, "elapsed_time": "3:46:06", "remaining_time": "1 day, 1:25:26"}
72
+ {"current_steps": 72, "total_steps": 550, "loss": 1.8042, "lr": 9.82571309437831e-06, "epoch": 0.130879345603272, "percentage": 13.09, "elapsed_time": "3:49:17", "remaining_time": "1 day, 1:22:11"}
73
+ {"current_steps": 73, "total_steps": 550, "loss": 1.793, "lr": 9.817749962596115e-06, "epoch": 0.13269711429220632, "percentage": 13.27, "elapsed_time": "3:52:27", "remaining_time": "1 day, 1:18:54"}
74
+ {"current_steps": 74, "total_steps": 550, "loss": 1.8074, "lr": 9.809612328301071e-06, "epoch": 0.13451488298114064, "percentage": 13.45, "elapsed_time": "3:55:36", "remaining_time": "1 day, 1:15:31"}
75
+ {"current_steps": 75, "total_steps": 550, "loss": 1.7973, "lr": 9.801300486244385e-06, "epoch": 0.136332651670075, "percentage": 13.64, "elapsed_time": "3:58:45", "remaining_time": "1 day, 1:12:07"}
76
+ {"current_steps": 76, "total_steps": 550, "loss": 1.7973, "lr": 9.792814737487207e-06, "epoch": 0.13815042035900932, "percentage": 13.82, "elapsed_time": "4:01:54", "remaining_time": "1 day, 1:08:47"}
77
+ {"current_steps": 77, "total_steps": 550, "loss": 1.7986, "lr": 9.784155389389713e-06, "epoch": 0.13996818904794364, "percentage": 14.0, "elapsed_time": "4:05:04", "remaining_time": "1 day, 1:05:24"}
78
+ {"current_steps": 78, "total_steps": 550, "loss": 1.7937, "lr": 9.775322755599979e-06, "epoch": 0.141785957736878, "percentage": 14.18, "elapsed_time": "4:08:13", "remaining_time": "1 day, 1:02:02"}
79
+ {"current_steps": 79, "total_steps": 550, "loss": 1.7976, "lr": 9.766317156042615e-06, "epoch": 0.14360372642581232, "percentage": 14.36, "elapsed_time": "4:11:21", "remaining_time": "1 day, 0:58:37"}
80
+ {"current_steps": 80, "total_steps": 550, "loss": 1.7915, "lr": 9.757138916907184e-06, "epoch": 0.14542149511474664, "percentage": 14.55, "elapsed_time": "4:14:31", "remaining_time": "1 day, 0:55:21"}
81
+ {"current_steps": 81, "total_steps": 550, "loss": 1.8053, "lr": 9.747788370636389e-06, "epoch": 0.147239263803681, "percentage": 14.73, "elapsed_time": "4:17:40", "remaining_time": "1 day, 0:52:00"}
82
+ {"current_steps": 82, "total_steps": 550, "loss": 1.7908, "lr": 9.738265855914014e-06, "epoch": 0.14905703249261532, "percentage": 14.91, "elapsed_time": "4:20:50", "remaining_time": "1 day, 0:48:42"}
83
+ {"current_steps": 83, "total_steps": 550, "loss": 1.7888, "lr": 9.728571717652677e-06, "epoch": 0.15087480118154964, "percentage": 15.09, "elapsed_time": "4:23:59", "remaining_time": "1 day, 0:45:22"}
84
+ {"current_steps": 84, "total_steps": 550, "loss": 1.7911, "lr": 9.718706306981332e-06, "epoch": 0.152692569870484, "percentage": 15.27, "elapsed_time": "4:27:08", "remaining_time": "1 day, 0:41:57"}
85
+ {"current_steps": 85, "total_steps": 550, "loss": 1.8017, "lr": 9.708669981232542e-06, "epoch": 0.15451033855941831, "percentage": 15.45, "elapsed_time": "4:30:16", "remaining_time": "1 day, 0:38:31"}
86
+ {"current_steps": 86, "total_steps": 550, "loss": 1.7979, "lr": 9.698463103929542e-06, "epoch": 0.15632810724835264, "percentage": 15.64, "elapsed_time": "4:33:24", "remaining_time": "1 day, 0:35:08"}
87
+ {"current_steps": 87, "total_steps": 550, "loss": 1.7872, "lr": 9.688086044773079e-06, "epoch": 0.158145875937287, "percentage": 15.82, "elapsed_time": "4:36:34", "remaining_time": "1 day, 0:31:54"}
88
+ {"current_steps": 88, "total_steps": 550, "loss": 1.794, "lr": 9.677539179628005e-06, "epoch": 0.1599636446262213, "percentage": 16.0, "elapsed_time": "4:39:43", "remaining_time": "1 day, 0:28:34"}
89
+ {"current_steps": 89, "total_steps": 550, "loss": 1.7981, "lr": 9.66682289050968e-06, "epoch": 0.16178141331515564, "percentage": 16.18, "elapsed_time": "4:42:53", "remaining_time": "1 day, 0:25:20"}
90
+ {"current_steps": 90, "total_steps": 550, "loss": 1.7943, "lr": 9.655937565570124e-06, "epoch": 0.16359918200409, "percentage": 16.36, "elapsed_time": "4:46:05", "remaining_time": "1 day, 0:22:15"}
91
+ {"current_steps": 91, "total_steps": 550, "loss": 1.7873, "lr": 9.644883599083959e-06, "epoch": 0.1654169506930243, "percentage": 16.55, "elapsed_time": "4:49:15", "remaining_time": "1 day, 0:19:01"}
92
+ {"current_steps": 92, "total_steps": 550, "loss": 1.7959, "lr": 9.63366139143413e-06, "epoch": 0.16723471938195864, "percentage": 16.73, "elapsed_time": "4:52:27", "remaining_time": "1 day, 0:15:54"}
93
+ {"current_steps": 93, "total_steps": 550, "loss": 1.7883, "lr": 9.622271349097413e-06, "epoch": 0.169052488070893, "percentage": 16.91, "elapsed_time": "4:55:38", "remaining_time": "1 day, 0:12:47"}
94
+ {"current_steps": 94, "total_steps": 550, "loss": 1.7864, "lr": 9.610713884629667e-06, "epoch": 0.1708702567598273, "percentage": 17.09, "elapsed_time": "4:58:50", "remaining_time": "1 day, 0:09:41"}
95
+ {"current_steps": 95, "total_steps": 550, "loss": 1.7871, "lr": 9.598989416650915e-06, "epoch": 0.17268802544876163, "percentage": 17.27, "elapsed_time": "5:02:02", "remaining_time": "1 day, 0:06:36"}
96
+ {"current_steps": 96, "total_steps": 550, "loss": 1.7804, "lr": 9.587098369830171e-06, "epoch": 0.17450579413769599, "percentage": 17.45, "elapsed_time": "5:05:15", "remaining_time": "1 day, 0:03:36"}
97
+ {"current_steps": 97, "total_steps": 550, "loss": 1.7858, "lr": 9.575041174870062e-06, "epoch": 0.1763235628266303, "percentage": 17.64, "elapsed_time": "5:08:26", "remaining_time": "1 day, 0:00:28"}
98
+ {"current_steps": 98, "total_steps": 550, "loss": 1.7823, "lr": 9.562818268491216e-06, "epoch": 0.17814133151556463, "percentage": 17.82, "elapsed_time": "5:11:39", "remaining_time": "23:57:25"}
99
+ {"current_steps": 99, "total_steps": 550, "loss": 1.7882, "lr": 9.550430093416465e-06, "epoch": 0.17995910020449898, "percentage": 18.0, "elapsed_time": "5:14:48", "remaining_time": "23:54:08"}
100
+ {"current_steps": 100, "total_steps": 550, "loss": 1.7836, "lr": 9.537877098354787e-06, "epoch": 0.1817768688934333, "percentage": 18.18, "elapsed_time": "5:17:58", "remaining_time": "23:50:52"}
101
+ {"current_steps": 101, "total_steps": 550, "loss": 1.7843, "lr": 9.525159737985066e-06, "epoch": 0.18359463758236763, "percentage": 18.36, "elapsed_time": "5:24:39", "remaining_time": "1 day, 0:03:17"}
102
+ {"current_steps": 102, "total_steps": 550, "loss": 1.7835, "lr": 9.512278472939627e-06, "epoch": 0.18541240627130198, "percentage": 18.55, "elapsed_time": "5:27:49", "remaining_time": "23:59:51"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbcb0763afe7ddb533417233ceab289a75850df67ec6d1a045ba6d98406b7a67
3
- size 7875
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3f7716b5bb67b032e521b14589c540c09ad80ea315f78f0457c4ad79c3ed75e
3
+ size 7672