gsmyrnis commited on
Commit
6589cb2
·
verified ·
1 Parent(s): 7c401c0

Training in progress, epoch 0

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f731ca782b6dbade195e1404a644a857523c3712efbc5155bda0fab320167353
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db24cf62c687c65bd405f2992ce91cea20e4854776905f300db496ba68e1636b
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78275d0c4fb8c347882bfa5a0cba1ea5cd9a1d38dcecf67972864891e14a1937
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2168a2007ac7107210994cc6a9857a8a19fff0e0a052b4048f43e60307b3c2fa
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:178b282610de3e0386f2bf28ac0f7be9e257c9b5065b7b5e5feade0ad46c55ec
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b45d19532fe893a0abe2ccec22bb79c13284dca1c92f2a6c4d74b2b4b45fbd4
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac6434dc335625b6fac58fe1f5ffd681aeaf112fea777a5cc3de6edc4720274b
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:512b5d0932cc6a7a0a6f1faaed400fac2b620942fc6b1b207a76a8c974128b25
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1,220 +1,117 @@
1
- {"current_steps": 1, "total_steps": 219, "loss": 0.472, "lr": 4.5454545454545457e-07, "epoch": 0.0136986301369863, "percentage": 0.46, "elapsed_time": "0:00:02", "remaining_time": "0:09:51"}
2
- {"current_steps": 2, "total_steps": 219, "loss": 0.4526, "lr": 9.090909090909091e-07, "epoch": 0.0273972602739726, "percentage": 0.91, "elapsed_time": "0:00:04", "remaining_time": "0:07:48"}
3
- {"current_steps": 3, "total_steps": 219, "loss": 0.4436, "lr": 1.3636363636363636e-06, "epoch": 0.0410958904109589, "percentage": 1.37, "elapsed_time": "0:00:05", "remaining_time": "0:06:54"}
4
- {"current_steps": 4, "total_steps": 219, "loss": 0.494, "lr": 1.8181818181818183e-06, "epoch": 0.0547945205479452, "percentage": 1.83, "elapsed_time": "0:00:07", "remaining_time": "0:06:20"}
5
- {"current_steps": 5, "total_steps": 219, "loss": 0.4486, "lr": 2.2727272727272728e-06, "epoch": 0.0684931506849315, "percentage": 2.28, "elapsed_time": "0:00:08", "remaining_time": "0:06:05"}
6
- {"current_steps": 6, "total_steps": 219, "loss": 0.418, "lr": 2.7272727272727272e-06, "epoch": 0.0821917808219178, "percentage": 2.74, "elapsed_time": "0:00:09", "remaining_time": "0:05:49"}
7
- {"current_steps": 7, "total_steps": 219, "loss": 0.4354, "lr": 3.181818181818182e-06, "epoch": 0.0958904109589041, "percentage": 3.2, "elapsed_time": "0:00:11", "remaining_time": "0:05:38"}
8
- {"current_steps": 8, "total_steps": 219, "loss": 0.4127, "lr": 3.6363636363636366e-06, "epoch": 0.1095890410958904, "percentage": 3.65, "elapsed_time": "0:00:12", "remaining_time": "0:05:28"}
9
- {"current_steps": 9, "total_steps": 219, "loss": 0.387, "lr": 4.0909090909090915e-06, "epoch": 0.1232876712328767, "percentage": 4.11, "elapsed_time": "0:00:13", "remaining_time": "0:05:26"}
10
- {"current_steps": 10, "total_steps": 219, "loss": 0.414, "lr": 4.5454545454545455e-06, "epoch": 0.136986301369863, "percentage": 4.57, "elapsed_time": "0:00:15", "remaining_time": "0:05:21"}
11
- {"current_steps": 11, "total_steps": 219, "loss": 0.4015, "lr": 5e-06, "epoch": 0.1506849315068493, "percentage": 5.02, "elapsed_time": "0:00:16", "remaining_time": "0:05:14"}
12
- {"current_steps": 12, "total_steps": 219, "loss": 0.3787, "lr": 5.4545454545454545e-06, "epoch": 0.1643835616438356, "percentage": 5.48, "elapsed_time": "0:00:17", "remaining_time": "0:05:09"}
13
- {"current_steps": 13, "total_steps": 219, "loss": 0.3654, "lr": 5.90909090909091e-06, "epoch": 0.1780821917808219, "percentage": 5.94, "elapsed_time": "0:00:19", "remaining_time": "0:05:06"}
14
- {"current_steps": 14, "total_steps": 219, "loss": 0.3886, "lr": 6.363636363636364e-06, "epoch": 0.1917808219178082, "percentage": 6.39, "elapsed_time": "0:00:20", "remaining_time": "0:05:02"}
15
- {"current_steps": 15, "total_steps": 219, "loss": 0.368, "lr": 6.818181818181818e-06, "epoch": 0.2054794520547945, "percentage": 6.85, "elapsed_time": "0:00:21", "remaining_time": "0:04:59"}
16
- {"current_steps": 16, "total_steps": 219, "loss": 0.3584, "lr": 7.272727272727273e-06, "epoch": 0.2191780821917808, "percentage": 7.31, "elapsed_time": "0:00:23", "remaining_time": "0:04:55"}
17
- {"current_steps": 17, "total_steps": 219, "loss": 0.3403, "lr": 7.727272727272727e-06, "epoch": 0.2328767123287671, "percentage": 7.76, "elapsed_time": "0:00:24", "remaining_time": "0:04:52"}
18
- {"current_steps": 18, "total_steps": 219, "loss": 0.3206, "lr": 8.181818181818183e-06, "epoch": 0.2465753424657534, "percentage": 8.22, "elapsed_time": "0:00:25", "remaining_time": "0:04:49"}
19
- {"current_steps": 19, "total_steps": 219, "loss": 0.3002, "lr": 8.636363636363637e-06, "epoch": 0.2602739726027397, "percentage": 8.68, "elapsed_time": "0:00:27", "remaining_time": "0:04:46"}
20
- {"current_steps": 20, "total_steps": 219, "loss": 0.3244, "lr": 9.090909090909091e-06, "epoch": 0.273972602739726, "percentage": 9.13, "elapsed_time": "0:00:28", "remaining_time": "0:04:43"}
21
- {"current_steps": 21, "total_steps": 219, "loss": 0.3761, "lr": 9.545454545454547e-06, "epoch": 0.2876712328767123, "percentage": 9.59, "elapsed_time": "0:00:29", "remaining_time": "0:04:42"}
22
- {"current_steps": 22, "total_steps": 219, "loss": 0.3035, "lr": 1e-05, "epoch": 0.3013698630136986, "percentage": 10.05, "elapsed_time": "0:00:31", "remaining_time": "0:04:40"}
23
- {"current_steps": 23, "total_steps": 219, "loss": 0.3365, "lr": 9.999364232830053e-06, "epoch": 0.3150684931506849, "percentage": 10.5, "elapsed_time": "0:00:32", "remaining_time": "0:04:38"}
24
- {"current_steps": 24, "total_steps": 219, "loss": 0.3114, "lr": 9.997457093000165e-06, "epoch": 0.3287671232876712, "percentage": 10.96, "elapsed_time": "0:00:34", "remaining_time": "0:04:37"}
25
- {"current_steps": 25, "total_steps": 219, "loss": 0.3489, "lr": 9.994279065509094e-06, "epoch": 0.3424657534246575, "percentage": 11.42, "elapsed_time": "0:00:35", "remaining_time": "0:04:34"}
26
- {"current_steps": 26, "total_steps": 219, "loss": 0.3447, "lr": 9.989830958551058e-06, "epoch": 0.3561643835616438, "percentage": 11.87, "elapsed_time": "0:00:36", "remaining_time": "0:04:32"}
27
- {"current_steps": 27, "total_steps": 219, "loss": 0.3154, "lr": 9.984113903310206e-06, "epoch": 0.3698630136986301, "percentage": 12.33, "elapsed_time": "0:00:37", "remaining_time": "0:04:29"}
28
- {"current_steps": 28, "total_steps": 219, "loss": 0.3445, "lr": 9.977129353672951e-06, "epoch": 0.3835616438356164, "percentage": 12.79, "elapsed_time": "0:00:39", "remaining_time": "0:04:27"}
29
- {"current_steps": 29, "total_steps": 219, "loss": 0.3465, "lr": 9.968879085858234e-06, "epoch": 0.3972602739726027, "percentage": 13.24, "elapsed_time": "0:00:40", "remaining_time": "0:04:25"}
30
- {"current_steps": 30, "total_steps": 219, "loss": 0.3273, "lr": 9.959365197965824e-06, "epoch": 0.410958904109589, "percentage": 13.7, "elapsed_time": "0:00:41", "remaining_time": "0:04:23"}
31
- {"current_steps": 31, "total_steps": 219, "loss": 0.3304, "lr": 9.948590109442755e-06, "epoch": 0.4246575342465753, "percentage": 14.16, "elapsed_time": "0:00:43", "remaining_time": "0:04:21"}
32
- {"current_steps": 32, "total_steps": 219, "loss": 0.3329, "lr": 9.936556560468037e-06, "epoch": 0.4383561643835616, "percentage": 14.61, "elapsed_time": "0:00:44", "remaining_time": "0:04:19"}
33
- {"current_steps": 33, "total_steps": 219, "loss": 0.3268, "lr": 9.923267611255824e-06, "epoch": 0.4520547945205479, "percentage": 15.07, "elapsed_time": "0:00:45", "remaining_time": "0:04:18"}
34
- {"current_steps": 34, "total_steps": 219, "loss": 0.3683, "lr": 9.908726641277167e-06, "epoch": 0.4657534246575342, "percentage": 15.53, "elapsed_time": "0:00:47", "remaining_time": "0:04:16"}
35
- {"current_steps": 35, "total_steps": 219, "loss": 0.3313, "lr": 9.8929373484006e-06, "epoch": 0.4794520547945205, "percentage": 15.98, "elapsed_time": "0:00:48", "remaining_time": "0:04:14"}
36
- {"current_steps": 36, "total_steps": 219, "loss": 0.3306, "lr": 9.875903747951742e-06, "epoch": 0.4931506849315068, "percentage": 16.44, "elapsed_time": "0:00:49", "remaining_time": "0:04:12"}
37
- {"current_steps": 37, "total_steps": 219, "loss": 0.3117, "lr": 9.857630171692175e-06, "epoch": 0.5068493150684932, "percentage": 16.89, "elapsed_time": "0:00:51", "remaining_time": "0:04:11"}
38
- {"current_steps": 38, "total_steps": 219, "loss": 0.3357, "lr": 9.83812126671784e-06, "epoch": 0.5205479452054794, "percentage": 17.35, "elapsed_time": "0:00:52", "remaining_time": "0:04:10"}
39
- {"current_steps": 39, "total_steps": 219, "loss": 0.3769, "lr": 9.81738199427726e-06, "epoch": 0.5342465753424658, "percentage": 17.81, "elapsed_time": "0:00:53", "remaining_time": "0:04:08"}
40
- {"current_steps": 40, "total_steps": 219, "loss": 0.3469, "lr": 9.795417628509857e-06, "epoch": 0.547945205479452, "percentage": 18.26, "elapsed_time": "0:00:55", "remaining_time": "0:04:06"}
41
- {"current_steps": 41, "total_steps": 219, "loss": 0.3305, "lr": 9.772233755104695e-06, "epoch": 0.5616438356164384, "percentage": 18.72, "elapsed_time": "0:00:56", "remaining_time": "0:04:04"}
42
- {"current_steps": 42, "total_steps": 219, "loss": 0.3312, "lr": 9.747836269880005e-06, "epoch": 0.5753424657534246, "percentage": 19.18, "elapsed_time": "0:00:57", "remaining_time": "0:04:03"}
43
- {"current_steps": 43, "total_steps": 219, "loss": 0.3713, "lr": 9.722231377283841e-06, "epoch": 0.589041095890411, "percentage": 19.63, "elapsed_time": "0:00:59", "remaining_time": "0:04:02"}
44
- {"current_steps": 44, "total_steps": 219, "loss": 0.3817, "lr": 9.695425588816248e-06, "epoch": 0.6027397260273972, "percentage": 20.09, "elapsed_time": "0:01:00", "remaining_time": "0:04:00"}
45
- {"current_steps": 45, "total_steps": 219, "loss": 0.3504, "lr": 9.667425721373333e-06, "epoch": 0.6164383561643836, "percentage": 20.55, "elapsed_time": "0:01:01", "remaining_time": "0:03:59"}
46
- {"current_steps": 46, "total_steps": 219, "loss": 0.3246, "lr": 9.638238895513687e-06, "epoch": 0.6301369863013698, "percentage": 21.0, "elapsed_time": "0:01:03", "remaining_time": "0:03:57"}
47
- {"current_steps": 47, "total_steps": 219, "loss": 0.3301, "lr": 9.607872533647584e-06, "epoch": 0.6438356164383562, "percentage": 21.46, "elapsed_time": "0:01:04", "remaining_time": "0:03:56"}
48
- {"current_steps": 48, "total_steps": 219, "loss": 0.3264, "lr": 9.5763343581494e-06, "epoch": 0.6575342465753424, "percentage": 21.92, "elapsed_time": "0:01:05", "remaining_time": "0:03:54"}
49
- {"current_steps": 49, "total_steps": 219, "loss": 0.315, "lr": 9.543632389393767e-06, "epoch": 0.6712328767123288, "percentage": 22.37, "elapsed_time": "0:01:07", "remaining_time": "0:03:52"}
50
- {"current_steps": 50, "total_steps": 219, "loss": 0.3348, "lr": 9.50977494371594e-06, "epoch": 0.684931506849315, "percentage": 22.83, "elapsed_time": "0:01:08", "remaining_time": "0:03:51"}
51
- {"current_steps": 51, "total_steps": 219, "loss": 0.3885, "lr": 9.474770631296882e-06, "epoch": 0.6986301369863014, "percentage": 23.29, "elapsed_time": "0:01:09", "remaining_time": "0:03:50"}
52
- {"current_steps": 52, "total_steps": 219, "loss": 0.351, "lr": 9.438628353973654e-06, "epoch": 0.7123287671232876, "percentage": 23.74, "elapsed_time": "0:01:11", "remaining_time": "0:03:48"}
53
- {"current_steps": 53, "total_steps": 219, "loss": 0.2853, "lr": 9.4013573029756e-06, "epoch": 0.726027397260274, "percentage": 24.2, "elapsed_time": "0:01:12", "remaining_time": "0:03:46"}
54
- {"current_steps": 54, "total_steps": 219, "loss": 0.3421, "lr": 9.36296695658697e-06, "epoch": 0.7397260273972602, "percentage": 24.66, "elapsed_time": "0:01:13", "remaining_time": "0:03:45"}
55
- {"current_steps": 55, "total_steps": 219, "loss": 0.3127, "lr": 9.323467077736513e-06, "epoch": 0.7534246575342466, "percentage": 25.11, "elapsed_time": "0:01:15", "remaining_time": "0:03:43"}
56
- {"current_steps": 56, "total_steps": 219, "loss": 0.3773, "lr": 9.282867711514703e-06, "epoch": 0.7671232876712328, "percentage": 25.57, "elapsed_time": "0:01:16", "remaining_time": "0:03:42"}
57
- {"current_steps": 57, "total_steps": 219, "loss": 0.2957, "lr": 9.241179182619207e-06, "epoch": 0.7808219178082192, "percentage": 26.03, "elapsed_time": "0:01:17", "remaining_time": "0:03:40"}
58
- {"current_steps": 58, "total_steps": 219, "loss": 0.3309, "lr": 9.19841209272924e-06, "epoch": 0.7945205479452054, "percentage": 26.48, "elapsed_time": "0:01:18", "remaining_time": "0:03:39"}
59
- {"current_steps": 59, "total_steps": 219, "loss": 0.3175, "lr": 9.154577317809483e-06, "epoch": 0.8082191780821918, "percentage": 26.94, "elapsed_time": "0:01:20", "remaining_time": "0:03:37"}
60
- {"current_steps": 60, "total_steps": 219, "loss": 0.3083, "lr": 9.109686005344258e-06, "epoch": 0.821917808219178, "percentage": 27.4, "elapsed_time": "0:01:21", "remaining_time": "0:03:36"}
61
- {"current_steps": 61, "total_steps": 219, "loss": 0.326, "lr": 9.063749571502633e-06, "epoch": 0.8356164383561644, "percentage": 27.85, "elapsed_time": "0:01:23", "remaining_time": "0:03:34"}
62
- {"current_steps": 62, "total_steps": 219, "loss": 0.3308, "lr": 9.016779698235227e-06, "epoch": 0.8493150684931506, "percentage": 28.31, "elapsed_time": "0:01:24", "remaining_time": "0:03:33"}
63
- {"current_steps": 63, "total_steps": 219, "loss": 0.3217, "lr": 8.9687883303034e-06, "epoch": 0.863013698630137, "percentage": 28.77, "elapsed_time": "0:01:25", "remaining_time": "0:03:31"}
64
- {"current_steps": 64, "total_steps": 219, "loss": 0.292, "lr": 8.919787672241619e-06, "epoch": 0.8767123287671232, "percentage": 29.22, "elapsed_time": "0:01:27", "remaining_time": "0:03:30"}
65
- {"current_steps": 65, "total_steps": 219, "loss": 0.3156, "lr": 8.869790185253766e-06, "epoch": 0.8904109589041096, "percentage": 29.68, "elapsed_time": "0:01:28", "remaining_time": "0:03:29"}
66
- {"current_steps": 66, "total_steps": 219, "loss": 0.3835, "lr": 8.818808584044163e-06, "epoch": 0.9041095890410958, "percentage": 30.14, "elapsed_time": "0:01:29", "remaining_time": "0:03:28"}
67
- {"current_steps": 67, "total_steps": 219, "loss": 0.3118, "lr": 8.76685583358414e-06, "epoch": 0.9178082191780822, "percentage": 30.59, "elapsed_time": "0:01:31", "remaining_time": "0:03:26"}
68
- {"current_steps": 68, "total_steps": 219, "loss": 0.2837, "lr": 8.713945145814948e-06, "epoch": 0.9315068493150684, "percentage": 31.05, "elapsed_time": "0:01:32", "remaining_time": "0:03:26"}
69
- {"current_steps": 69, "total_steps": 219, "loss": 0.3545, "lr": 8.660089976287875e-06, "epoch": 0.9452054794520548, "percentage": 31.51, "elapsed_time": "0:01:34", "remaining_time": "0:03:25"}
70
- {"current_steps": 70, "total_steps": 219, "loss": 0.347, "lr": 8.60530402074241e-06, "epoch": 0.958904109589041, "percentage": 31.96, "elapsed_time": "0:01:35", "remaining_time": "0:03:23"}
71
- {"current_steps": 71, "total_steps": 219, "loss": 0.3328, "lr": 8.549601211623316e-06, "epoch": 0.9726027397260274, "percentage": 32.42, "elapsed_time": "0:01:36", "remaining_time": "0:03:22"}
72
- {"current_steps": 72, "total_steps": 219, "loss": 0.317, "lr": 8.492995714537519e-06, "epoch": 0.9863013698630136, "percentage": 32.88, "elapsed_time": "0:01:39", "remaining_time": "0:03:23"}
73
- {"current_steps": 73, "total_steps": 219, "loss": 0.3426, "lr": 8.43550192465169e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:01:41", "remaining_time": "0:03:22"}
74
- {"current_steps": 74, "total_steps": 219, "loss": 0.2593, "lr": 8.377134463031468e-06, "epoch": 1.0136986301369864, "percentage": 33.79, "elapsed_time": "0:02:41", "remaining_time": "0:05:16"}
75
- {"current_steps": 75, "total_steps": 219, "loss": 0.2759, "lr": 8.317908172923207e-06, "epoch": 1.0273972602739727, "percentage": 34.25, "elapsed_time": "0:02:42", "remaining_time": "0:05:12"}
76
- {"current_steps": 76, "total_steps": 219, "loss": 0.3252, "lr": 8.257838115979244e-06, "epoch": 1.0410958904109588, "percentage": 34.7, "elapsed_time": "0:02:44", "remaining_time": "0:05:08"}
77
- {"current_steps": 77, "total_steps": 219, "loss": 0.2972, "lr": 8.196939568427624e-06, "epoch": 1.0547945205479452, "percentage": 35.16, "elapsed_time": "0:02:45", "remaining_time": "0:05:05"}
78
- {"current_steps": 78, "total_steps": 219, "loss": 0.2969, "lr": 8.135228017187238e-06, "epoch": 1.0684931506849316, "percentage": 35.62, "elapsed_time": "0:02:46", "remaining_time": "0:05:01"}
79
- {"current_steps": 79, "total_steps": 219, "loss": 0.2835, "lr": 8.0727191559294e-06, "epoch": 1.0821917808219177, "percentage": 36.07, "elapsed_time": "0:02:48", "remaining_time": "0:04:58"}
80
- {"current_steps": 80, "total_steps": 219, "loss": 0.3078, "lr": 8.009428881086836e-06, "epoch": 1.095890410958904, "percentage": 36.53, "elapsed_time": "0:02:49", "remaining_time": "0:04:54"}
81
- {"current_steps": 81, "total_steps": 219, "loss": 0.2332, "lr": 7.945373287811116e-06, "epoch": 1.1095890410958904, "percentage": 36.99, "elapsed_time": "0:02:50", "remaining_time": "0:04:51"}
82
- {"current_steps": 82, "total_steps": 219, "loss": 0.2494, "lr": 7.880568665879542e-06, "epoch": 1.1232876712328768, "percentage": 37.44, "elapsed_time": "0:02:52", "remaining_time": "0:04:47"}
83
- {"current_steps": 83, "total_steps": 219, "loss": 0.3014, "lr": 7.81503149555255e-06, "epoch": 1.1369863013698631, "percentage": 37.9, "elapsed_time": "0:02:53", "remaining_time": "0:04:44"}
84
- {"current_steps": 84, "total_steps": 219, "loss": 0.2684, "lr": 7.748778443382658e-06, "epoch": 1.1506849315068493, "percentage": 38.36, "elapsed_time": "0:02:54", "remaining_time": "0:04:41"}
85
- {"current_steps": 85, "total_steps": 219, "loss": 0.2688, "lr": 7.68182635797606e-06, "epoch": 1.1643835616438356, "percentage": 38.81, "elapsed_time": "0:02:56", "remaining_time": "0:04:37"}
86
- {"current_steps": 86, "total_steps": 219, "loss": 0.2822, "lr": 7.6141922657079045e-06, "epoch": 1.178082191780822, "percentage": 39.27, "elapsed_time": "0:02:57", "remaining_time": "0:04:34"}
87
- {"current_steps": 87, "total_steps": 219, "loss": 0.2939, "lr": 7.545893366392358e-06, "epoch": 1.191780821917808, "percentage": 39.73, "elapsed_time": "0:02:58", "remaining_time": "0:04:31"}
88
- {"current_steps": 88, "total_steps": 219, "loss": 0.2571, "lr": 7.476947028908595e-06, "epoch": 1.2054794520547945, "percentage": 40.18, "elapsed_time": "0:03:00", "remaining_time": "0:04:28"}
89
- {"current_steps": 89, "total_steps": 219, "loss": 0.2285, "lr": 7.407370786783757e-06, "epoch": 1.2191780821917808, "percentage": 40.64, "elapsed_time": "0:03:01", "remaining_time": "0:04:25"}
90
- {"current_steps": 90, "total_steps": 219, "loss": 0.2908, "lr": 7.33718233373407e-06, "epoch": 1.2328767123287672, "percentage": 41.1, "elapsed_time": "0:03:02", "remaining_time": "0:04:21"}
91
- {"current_steps": 91, "total_steps": 219, "loss": 0.2572, "lr": 7.266399519165193e-06, "epoch": 1.2465753424657535, "percentage": 41.55, "elapsed_time": "0:03:04", "remaining_time": "0:04:18"}
92
- {"current_steps": 92, "total_steps": 219, "loss": 0.2675, "lr": 7.195040343633006e-06, "epoch": 1.2602739726027397, "percentage": 42.01, "elapsed_time": "0:03:05", "remaining_time": "0:04:15"}
93
- {"current_steps": 93, "total_steps": 219, "loss": 0.278, "lr": 7.123122954265942e-06, "epoch": 1.273972602739726, "percentage": 42.47, "elapsed_time": "0:03:06", "remaining_time": "0:04:12"}
94
- {"current_steps": 94, "total_steps": 219, "loss": 0.2649, "lr": 7.050665640150045e-06, "epoch": 1.2876712328767124, "percentage": 42.92, "elapsed_time": "0:03:07", "remaining_time": "0:04:09"}
95
- {"current_steps": 95, "total_steps": 219, "loss": 0.275, "lr": 6.977686827677926e-06, "epoch": 1.3013698630136985, "percentage": 43.38, "elapsed_time": "0:03:09", "remaining_time": "0:04:07"}
96
- {"current_steps": 96, "total_steps": 219, "loss": 0.2633, "lr": 6.904205075862816e-06, "epoch": 1.3150684931506849, "percentage": 43.84, "elapsed_time": "0:03:10", "remaining_time": "0:04:04"}
97
- {"current_steps": 97, "total_steps": 219, "loss": 0.2421, "lr": 6.830239071618874e-06, "epoch": 1.3287671232876712, "percentage": 44.29, "elapsed_time": "0:03:12", "remaining_time": "0:04:01"}
98
- {"current_steps": 98, "total_steps": 219, "loss": 0.2533, "lr": 6.755807625008974e-06, "epoch": 1.3424657534246576, "percentage": 44.75, "elapsed_time": "0:03:14", "remaining_time": "0:03:59"}
99
- {"current_steps": 99, "total_steps": 219, "loss": 0.2923, "lr": 6.680929664461184e-06, "epoch": 1.356164383561644, "percentage": 45.21, "elapsed_time": "0:03:15", "remaining_time": "0:03:56"}
100
- {"current_steps": 100, "total_steps": 219, "loss": 0.2928, "lr": 6.6056242319551315e-06, "epoch": 1.36986301369863, "percentage": 45.66, "elapsed_time": "0:03:16", "remaining_time": "0:03:53"}
101
- {"current_steps": 101, "total_steps": 219, "loss": 0.3264, "lr": 6.529910478179499e-06, "epoch": 1.3835616438356164, "percentage": 46.12, "elapsed_time": "0:03:17", "remaining_time": "0:03:51"}
102
- {"current_steps": 102, "total_steps": 219, "loss": 0.258, "lr": 6.45380765766187e-06, "epoch": 1.3972602739726028, "percentage": 46.58, "elapsed_time": "0:03:19", "remaining_time": "0:03:48"}
103
- {"current_steps": 103, "total_steps": 219, "loss": 0.2556, "lr": 6.377335123872177e-06, "epoch": 1.410958904109589, "percentage": 47.03, "elapsed_time": "0:03:20", "remaining_time": "0:03:46"}
104
- {"current_steps": 104, "total_steps": 219, "loss": 0.2864, "lr": 6.300512324300975e-06, "epoch": 1.4246575342465753, "percentage": 47.49, "elapsed_time": "0:03:22", "remaining_time": "0:03:43"}
105
- {"current_steps": 105, "total_steps": 219, "loss": 0.2552, "lr": 6.223358795513812e-06, "epoch": 1.4383561643835616, "percentage": 47.95, "elapsed_time": "0:03:23", "remaining_time": "0:03:40"}
106
- {"current_steps": 106, "total_steps": 219, "loss": 0.245, "lr": 6.145894158182945e-06, "epoch": 1.452054794520548, "percentage": 48.4, "elapsed_time": "0:03:24", "remaining_time": "0:03:38"}
107
- {"current_steps": 107, "total_steps": 219, "loss": 0.2753, "lr": 6.0681381120976745e-06, "epoch": 1.4657534246575343, "percentage": 48.86, "elapsed_time": "0:03:26", "remaining_time": "0:03:35"}
108
- {"current_steps": 108, "total_steps": 219, "loss": 0.2808, "lr": 5.990110431154549e-06, "epoch": 1.4794520547945205, "percentage": 49.32, "elapsed_time": "0:03:27", "remaining_time": "0:03:33"}
109
- {"current_steps": 109, "total_steps": 219, "loss": 0.2591, "lr": 5.9118309583287205e-06, "epoch": 1.4931506849315068, "percentage": 49.77, "elapsed_time": "0:03:28", "remaining_time": "0:03:30"}
110
- {"current_steps": 110, "total_steps": 219, "loss": 0.3354, "lr": 5.8333196006277536e-06, "epoch": 1.5068493150684932, "percentage": 50.23, "elapsed_time": "0:03:30", "remaining_time": "0:03:28"}
111
- {"current_steps": 111, "total_steps": 219, "loss": 0.2526, "lr": 5.754596324029125e-06, "epoch": 1.5205479452054793, "percentage": 50.68, "elapsed_time": "0:03:31", "remaining_time": "0:03:25"}
112
- {"current_steps": 112, "total_steps": 219, "loss": 0.2537, "lr": 5.675681148402743e-06, "epoch": 1.5342465753424657, "percentage": 51.14, "elapsed_time": "0:03:32", "remaining_time": "0:03:23"}
113
- {"current_steps": 113, "total_steps": 219, "loss": 0.3343, "lr": 5.596594142419759e-06, "epoch": 1.547945205479452, "percentage": 51.6, "elapsed_time": "0:03:34", "remaining_time": "0:03:20"}
114
- {"current_steps": 114, "total_steps": 219, "loss": 0.2454, "lr": 5.517355418448961e-06, "epoch": 1.5616438356164384, "percentage": 52.05, "elapsed_time": "0:03:35", "remaining_time": "0:03:18"}
115
- {"current_steps": 115, "total_steps": 219, "loss": 0.2782, "lr": 5.437985127442065e-06, "epoch": 1.5753424657534247, "percentage": 52.51, "elapsed_time": "0:03:36", "remaining_time": "0:03:16"}
116
- {"current_steps": 116, "total_steps": 219, "loss": 0.2633, "lr": 5.3585034538091885e-06, "epoch": 1.589041095890411, "percentage": 52.97, "elapsed_time": "0:03:38", "remaining_time": "0:03:13"}
117
- {"current_steps": 117, "total_steps": 219, "loss": 0.2261, "lr": 5.278930610285813e-06, "epoch": 1.6027397260273972, "percentage": 53.42, "elapsed_time": "0:03:39", "remaining_time": "0:03:11"}
118
- {"current_steps": 118, "total_steps": 219, "loss": 0.2315, "lr": 5.199286832792553e-06, "epoch": 1.6164383561643836, "percentage": 53.88, "elapsed_time": "0:03:40", "remaining_time": "0:03:09"}
119
- {"current_steps": 119, "total_steps": 219, "loss": 0.295, "lr": 5.119592375289015e-06, "epoch": 1.6301369863013697, "percentage": 54.34, "elapsed_time": "0:03:43", "remaining_time": "0:03:07"}
120
- {"current_steps": 120, "total_steps": 219, "loss": 0.2276, "lr": 5.039867504623084e-06, "epoch": 1.643835616438356, "percentage": 54.79, "elapsed_time": "0:03:44", "remaining_time": "0:03:05"}
121
- {"current_steps": 121, "total_steps": 219, "loss": 0.276, "lr": 4.960132495376919e-06, "epoch": 1.6575342465753424, "percentage": 55.25, "elapsed_time": "0:03:46", "remaining_time": "0:03:03"}
122
- {"current_steps": 122, "total_steps": 219, "loss": 0.2886, "lr": 4.880407624710986e-06, "epoch": 1.6712328767123288, "percentage": 55.71, "elapsed_time": "0:03:47", "remaining_time": "0:03:00"}
123
- {"current_steps": 123, "total_steps": 219, "loss": 0.2911, "lr": 4.800713167207449e-06, "epoch": 1.6849315068493151, "percentage": 56.16, "elapsed_time": "0:03:49", "remaining_time": "0:02:58"}
124
- {"current_steps": 124, "total_steps": 219, "loss": 0.2931, "lr": 4.721069389714188e-06, "epoch": 1.6986301369863015, "percentage": 56.62, "elapsed_time": "0:03:50", "remaining_time": "0:02:56"}
125
- {"current_steps": 125, "total_steps": 219, "loss": 0.2429, "lr": 4.641496546190813e-06, "epoch": 1.7123287671232876, "percentage": 57.08, "elapsed_time": "0:03:51", "remaining_time": "0:02:54"}
126
- {"current_steps": 126, "total_steps": 219, "loss": 0.2898, "lr": 4.562014872557936e-06, "epoch": 1.726027397260274, "percentage": 57.53, "elapsed_time": "0:03:53", "remaining_time": "0:02:51"}
127
- {"current_steps": 127, "total_steps": 219, "loss": 0.2853, "lr": 4.48264458155104e-06, "epoch": 1.7397260273972601, "percentage": 57.99, "elapsed_time": "0:03:54", "remaining_time": "0:02:49"}
128
- {"current_steps": 128, "total_steps": 219, "loss": 0.2457, "lr": 4.403405857580243e-06, "epoch": 1.7534246575342465, "percentage": 58.45, "elapsed_time": "0:03:55", "remaining_time": "0:02:47"}
129
- {"current_steps": 129, "total_steps": 219, "loss": 0.282, "lr": 4.3243188515972575e-06, "epoch": 1.7671232876712328, "percentage": 58.9, "elapsed_time": "0:03:57", "remaining_time": "0:02:45"}
130
- {"current_steps": 130, "total_steps": 219, "loss": 0.2653, "lr": 4.245403675970877e-06, "epoch": 1.7808219178082192, "percentage": 59.36, "elapsed_time": "0:03:58", "remaining_time": "0:02:43"}
131
- {"current_steps": 131, "total_steps": 219, "loss": 0.2535, "lr": 4.166680399372248e-06, "epoch": 1.7945205479452055, "percentage": 59.82, "elapsed_time": "0:04:00", "remaining_time": "0:02:41"}
132
- {"current_steps": 132, "total_steps": 219, "loss": 0.2786, "lr": 4.08816904167128e-06, "epoch": 1.808219178082192, "percentage": 60.27, "elapsed_time": "0:04:01", "remaining_time": "0:02:39"}
133
- {"current_steps": 133, "total_steps": 219, "loss": 0.2588, "lr": 4.009889568845453e-06, "epoch": 1.821917808219178, "percentage": 60.73, "elapsed_time": "0:04:02", "remaining_time": "0:02:36"}
134
- {"current_steps": 134, "total_steps": 219, "loss": 0.276, "lr": 3.9318618879023255e-06, "epoch": 1.8356164383561644, "percentage": 61.19, "elapsed_time": "0:04:04", "remaining_time": "0:02:34"}
135
- {"current_steps": 135, "total_steps": 219, "loss": 0.2486, "lr": 3.854105841817056e-06, "epoch": 1.8493150684931505, "percentage": 61.64, "elapsed_time": "0:04:05", "remaining_time": "0:02:32"}
136
- {"current_steps": 136, "total_steps": 219, "loss": 0.3044, "lr": 3.776641204486191e-06, "epoch": 1.8630136986301369, "percentage": 62.1, "elapsed_time": "0:04:06", "remaining_time": "0:02:30"}
137
- {"current_steps": 137, "total_steps": 219, "loss": 0.2668, "lr": 3.699487675699027e-06, "epoch": 1.8767123287671232, "percentage": 62.56, "elapsed_time": "0:04:08", "remaining_time": "0:02:28"}
138
- {"current_steps": 138, "total_steps": 219, "loss": 0.263, "lr": 3.6226648761278238e-06, "epoch": 1.8904109589041096, "percentage": 63.01, "elapsed_time": "0:04:09", "remaining_time": "0:02:26"}
139
- {"current_steps": 139, "total_steps": 219, "loss": 0.2641, "lr": 3.5461923423381313e-06, "epoch": 1.904109589041096, "percentage": 63.47, "elapsed_time": "0:04:10", "remaining_time": "0:02:24"}
140
- {"current_steps": 140, "total_steps": 219, "loss": 0.2841, "lr": 3.4700895218205026e-06, "epoch": 1.9178082191780823, "percentage": 63.93, "elapsed_time": "0:04:12", "remaining_time": "0:02:22"}
141
- {"current_steps": 141, "total_steps": 219, "loss": 0.2793, "lr": 3.3943757680448697e-06, "epoch": 1.9315068493150684, "percentage": 64.38, "elapsed_time": "0:04:13", "remaining_time": "0:02:20"}
142
- {"current_steps": 142, "total_steps": 219, "loss": 0.2646, "lr": 3.3190703355388165e-06, "epoch": 1.9452054794520548, "percentage": 64.84, "elapsed_time": "0:04:14", "remaining_time": "0:02:18"}
143
- {"current_steps": 143, "total_steps": 219, "loss": 0.2544, "lr": 3.244192374991027e-06, "epoch": 1.958904109589041, "percentage": 65.3, "elapsed_time": "0:04:16", "remaining_time": "0:02:16"}
144
- {"current_steps": 144, "total_steps": 219, "loss": 0.2838, "lr": 3.169760928381127e-06, "epoch": 1.9726027397260273, "percentage": 65.75, "elapsed_time": "0:04:17", "remaining_time": "0:02:14"}
145
- {"current_steps": 145, "total_steps": 219, "loss": 0.2582, "lr": 3.0957949241371845e-06, "epoch": 1.9863013698630136, "percentage": 66.21, "elapsed_time": "0:04:18", "remaining_time": "0:02:12"}
146
- {"current_steps": 146, "total_steps": 219, "loss": 0.2092, "lr": 3.0223131723220756e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:04:20", "remaining_time": "0:02:10"}
147
- {"current_steps": 147, "total_steps": 219, "loss": 0.2165, "lr": 2.949334359849957e-06, "epoch": 2.0136986301369864, "percentage": 67.12, "elapsed_time": "0:05:19", "remaining_time": "0:02:36"}
148
- {"current_steps": 148, "total_steps": 219, "loss": 0.2247, "lr": 2.876877045734058e-06, "epoch": 2.0273972602739727, "percentage": 67.58, "elapsed_time": "0:05:20", "remaining_time": "0:02:33"}
149
- {"current_steps": 149, "total_steps": 219, "loss": 0.1997, "lr": 2.8049596563669936e-06, "epoch": 2.041095890410959, "percentage": 68.04, "elapsed_time": "0:05:22", "remaining_time": "0:02:31"}
150
- {"current_steps": 150, "total_steps": 219, "loss": 0.2302, "lr": 2.7336004808348094e-06, "epoch": 2.0547945205479454, "percentage": 68.49, "elapsed_time": "0:05:23", "remaining_time": "0:02:28"}
151
- {"current_steps": 151, "total_steps": 219, "loss": 0.2337, "lr": 2.662817666265932e-06, "epoch": 2.0684931506849313, "percentage": 68.95, "elapsed_time": "0:05:24", "remaining_time": "0:02:26"}
152
- {"current_steps": 152, "total_steps": 219, "loss": 0.2303, "lr": 2.5926292132162432e-06, "epoch": 2.0821917808219177, "percentage": 69.41, "elapsed_time": "0:05:26", "remaining_time": "0:02:23"}
153
- {"current_steps": 153, "total_steps": 219, "loss": 0.2373, "lr": 2.5230529710914074e-06, "epoch": 2.095890410958904, "percentage": 69.86, "elapsed_time": "0:05:27", "remaining_time": "0:02:21"}
154
- {"current_steps": 154, "total_steps": 219, "loss": 0.1983, "lr": 2.4541066336076434e-06, "epoch": 2.1095890410958904, "percentage": 70.32, "elapsed_time": "0:05:28", "remaining_time": "0:02:18"}
155
- {"current_steps": 155, "total_steps": 219, "loss": 0.3069, "lr": 2.385807734292097e-06, "epoch": 2.1232876712328768, "percentage": 70.78, "elapsed_time": "0:05:30", "remaining_time": "0:02:16"}
156
- {"current_steps": 156, "total_steps": 219, "loss": 0.2487, "lr": 2.318173642023939e-06, "epoch": 2.136986301369863, "percentage": 71.23, "elapsed_time": "0:05:31", "remaining_time": "0:02:13"}
157
- {"current_steps": 157, "total_steps": 219, "loss": 0.2513, "lr": 2.251221556617344e-06, "epoch": 2.1506849315068495, "percentage": 71.69, "elapsed_time": "0:05:33", "remaining_time": "0:02:11"}
158
- {"current_steps": 158, "total_steps": 219, "loss": 0.2337, "lr": 2.184968504447453e-06, "epoch": 2.1643835616438354, "percentage": 72.15, "elapsed_time": "0:05:34", "remaining_time": "0:02:09"}
159
- {"current_steps": 159, "total_steps": 219, "loss": 0.1819, "lr": 2.11943133412046e-06, "epoch": 2.1780821917808217, "percentage": 72.6, "elapsed_time": "0:05:36", "remaining_time": "0:02:06"}
160
- {"current_steps": 160, "total_steps": 219, "loss": 0.2157, "lr": 2.0546267121888863e-06, "epoch": 2.191780821917808, "percentage": 73.06, "elapsed_time": "0:05:38", "remaining_time": "0:02:04"}
161
- {"current_steps": 161, "total_steps": 219, "loss": 0.2337, "lr": 1.990571118913166e-06, "epoch": 2.2054794520547945, "percentage": 73.52, "elapsed_time": "0:05:40", "remaining_time": "0:02:02"}
162
- {"current_steps": 162, "total_steps": 219, "loss": 0.2319, "lr": 1.9272808440706024e-06, "epoch": 2.219178082191781, "percentage": 73.97, "elapsed_time": "0:05:41", "remaining_time": "0:02:00"}
163
- {"current_steps": 163, "total_steps": 219, "loss": 0.2067, "lr": 1.864771982812763e-06, "epoch": 2.232876712328767, "percentage": 74.43, "elapsed_time": "0:05:42", "remaining_time": "0:01:57"}
164
- {"current_steps": 164, "total_steps": 219, "loss": 0.1983, "lr": 1.8030604315723765e-06, "epoch": 2.2465753424657535, "percentage": 74.89, "elapsed_time": "0:05:44", "remaining_time": "0:01:55"}
165
- {"current_steps": 165, "total_steps": 219, "loss": 0.2062, "lr": 1.7421618840207576e-06, "epoch": 2.26027397260274, "percentage": 75.34, "elapsed_time": "0:05:45", "remaining_time": "0:01:53"}
166
- {"current_steps": 166, "total_steps": 219, "loss": 0.2391, "lr": 1.682091827076796e-06, "epoch": 2.2739726027397262, "percentage": 75.8, "elapsed_time": "0:05:46", "remaining_time": "0:01:50"}
167
- {"current_steps": 167, "total_steps": 219, "loss": 0.2615, "lr": 1.6228655369685342e-06, "epoch": 2.287671232876712, "percentage": 76.26, "elapsed_time": "0:05:48", "remaining_time": "0:01:48"}
168
- {"current_steps": 168, "total_steps": 219, "loss": 0.2346, "lr": 1.5644980753483109e-06, "epoch": 2.3013698630136985, "percentage": 76.71, "elapsed_time": "0:05:49", "remaining_time": "0:01:46"}
169
- {"current_steps": 169, "total_steps": 219, "loss": 0.2281, "lr": 1.5070042854624833e-06, "epoch": 2.315068493150685, "percentage": 77.17, "elapsed_time": "0:05:50", "remaining_time": "0:01:43"}
170
- {"current_steps": 170, "total_steps": 219, "loss": 0.2411, "lr": 1.4503987883766857e-06, "epoch": 2.328767123287671, "percentage": 77.63, "elapsed_time": "0:05:52", "remaining_time": "0:01:41"}
171
- {"current_steps": 171, "total_steps": 219, "loss": 0.214, "lr": 1.3946959792575915e-06, "epoch": 2.3424657534246576, "percentage": 78.08, "elapsed_time": "0:05:53", "remaining_time": "0:01:39"}
172
- {"current_steps": 172, "total_steps": 219, "loss": 0.1733, "lr": 1.3399100237121266e-06, "epoch": 2.356164383561644, "percentage": 78.54, "elapsed_time": "0:05:54", "remaining_time": "0:01:36"}
173
- {"current_steps": 173, "total_steps": 219, "loss": 0.191, "lr": 1.2860548541850542e-06, "epoch": 2.3698630136986303, "percentage": 79.0, "elapsed_time": "0:05:56", "remaining_time": "0:01:34"}
174
- {"current_steps": 174, "total_steps": 219, "loss": 0.2372, "lr": 1.233144166415861e-06, "epoch": 2.383561643835616, "percentage": 79.45, "elapsed_time": "0:05:57", "remaining_time": "0:01:32"}
175
- {"current_steps": 175, "total_steps": 219, "loss": 0.187, "lr": 1.1811914159558374e-06, "epoch": 2.3972602739726026, "percentage": 79.91, "elapsed_time": "0:05:58", "remaining_time": "0:01:30"}
176
- {"current_steps": 176, "total_steps": 219, "loss": 0.2357, "lr": 1.1302098147462348e-06, "epoch": 2.410958904109589, "percentage": 80.37, "elapsed_time": "0:06:00", "remaining_time": "0:01:27"}
177
- {"current_steps": 177, "total_steps": 219, "loss": 0.2322, "lr": 1.080212327758382e-06, "epoch": 2.4246575342465753, "percentage": 80.82, "elapsed_time": "0:06:01", "remaining_time": "0:01:25"}
178
- {"current_steps": 178, "total_steps": 219, "loss": 0.1893, "lr": 1.0312116696966012e-06, "epoch": 2.4383561643835616, "percentage": 81.28, "elapsed_time": "0:06:02", "remaining_time": "0:01:23"}
179
- {"current_steps": 179, "total_steps": 219, "loss": 0.2097, "lr": 9.832203017647746e-07, "epoch": 2.452054794520548, "percentage": 81.74, "elapsed_time": "0:06:04", "remaining_time": "0:01:21"}
180
- {"current_steps": 180, "total_steps": 219, "loss": 0.187, "lr": 9.362504284973683e-07, "epoch": 2.4657534246575343, "percentage": 82.19, "elapsed_time": "0:06:05", "remaining_time": "0:01:19"}
181
- {"current_steps": 181, "total_steps": 219, "loss": 0.2157, "lr": 8.903139946557437e-07, "epoch": 2.4794520547945207, "percentage": 82.65, "elapsed_time": "0:06:06", "remaining_time": "0:01:16"}
182
- {"current_steps": 182, "total_steps": 219, "loss": 0.2315, "lr": 8.454226821905171e-07, "epoch": 2.493150684931507, "percentage": 83.11, "elapsed_time": "0:06:07", "remaining_time": "0:01:14"}
183
- {"current_steps": 183, "total_steps": 219, "loss": 0.2128, "lr": 8.015879072707611e-07, "epoch": 2.506849315068493, "percentage": 83.56, "elapsed_time": "0:06:09", "remaining_time": "0:01:12"}
184
- {"current_steps": 184, "total_steps": 219, "loss": 0.21, "lr": 7.588208173807943e-07, "epoch": 2.5205479452054793, "percentage": 84.02, "elapsed_time": "0:06:10", "remaining_time": "0:01:10"}
185
- {"current_steps": 185, "total_steps": 219, "loss": 0.227, "lr": 7.171322884852988e-07, "epoch": 2.5342465753424657, "percentage": 84.47, "elapsed_time": "0:06:11", "remaining_time": "0:01:08"}
186
- {"current_steps": 186, "total_steps": 219, "loss": 0.2004, "lr": 6.765329222634892e-07, "epoch": 2.547945205479452, "percentage": 84.93, "elapsed_time": "0:06:13", "remaining_time": "0:01:06"}
187
- {"current_steps": 187, "total_steps": 219, "loss": 0.2319, "lr": 6.370330434130317e-07, "epoch": 2.5616438356164384, "percentage": 85.39, "elapsed_time": "0:06:14", "remaining_time": "0:01:04"}
188
- {"current_steps": 188, "total_steps": 219, "loss": 0.242, "lr": 5.986426970244009e-07, "epoch": 2.5753424657534247, "percentage": 85.84, "elapsed_time": "0:06:15", "remaining_time": "0:01:01"}
189
- {"current_steps": 189, "total_steps": 219, "loss": 0.1823, "lr": 5.613716460263485e-07, "epoch": 2.589041095890411, "percentage": 86.3, "elapsed_time": "0:06:17", "remaining_time": "0:00:59"}
190
- {"current_steps": 190, "total_steps": 219, "loss": 0.2112, "lr": 5.252293687031196e-07, "epoch": 2.602739726027397, "percentage": 86.76, "elapsed_time": "0:06:18", "remaining_time": "0:00:57"}
191
- {"current_steps": 191, "total_steps": 219, "loss": 0.2016, "lr": 4.902250562840622e-07, "epoch": 2.616438356164384, "percentage": 87.21, "elapsed_time": "0:06:20", "remaining_time": "0:00:55"}
192
- {"current_steps": 192, "total_steps": 219, "loss": 0.2507, "lr": 4.5636761060623314e-07, "epoch": 2.6301369863013697, "percentage": 87.67, "elapsed_time": "0:06:21", "remaining_time": "0:00:53"}
193
- {"current_steps": 193, "total_steps": 219, "loss": 0.2042, "lr": 4.2366564185060134e-07, "epoch": 2.643835616438356, "percentage": 88.13, "elapsed_time": "0:06:22", "remaining_time": "0:00:51"}
194
- {"current_steps": 194, "total_steps": 219, "loss": 0.2087, "lr": 3.921274663524183e-07, "epoch": 2.6575342465753424, "percentage": 88.58, "elapsed_time": "0:06:24", "remaining_time": "0:00:49"}
195
- {"current_steps": 195, "total_steps": 219, "loss": 0.2578, "lr": 3.61761104486314e-07, "epoch": 2.671232876712329, "percentage": 89.04, "elapsed_time": "0:06:25", "remaining_time": "0:00:47"}
196
- {"current_steps": 196, "total_steps": 219, "loss": 0.2471, "lr": 3.3257427862666894e-07, "epoch": 2.684931506849315, "percentage": 89.5, "elapsed_time": "0:06:26", "remaining_time": "0:00:45"}
197
- {"current_steps": 197, "total_steps": 219, "loss": 0.2304, "lr": 3.045744111837529e-07, "epoch": 2.6986301369863015, "percentage": 89.95, "elapsed_time": "0:06:28", "remaining_time": "0:00:43"}
198
- {"current_steps": 198, "total_steps": 219, "loss": 0.1633, "lr": 2.777686227161591e-07, "epoch": 2.712328767123288, "percentage": 90.41, "elapsed_time": "0:06:29", "remaining_time": "0:00:41"}
199
- {"current_steps": 199, "total_steps": 219, "loss": 0.2266, "lr": 2.5216373011999697e-07, "epoch": 2.7260273972602738, "percentage": 90.87, "elapsed_time": "0:06:30", "remaining_time": "0:00:39"}
200
- {"current_steps": 200, "total_steps": 219, "loss": 0.234, "lr": 2.2776624489530664e-07, "epoch": 2.73972602739726, "percentage": 91.32, "elapsed_time": "0:06:31", "remaining_time": "0:00:37"}
201
- {"current_steps": 201, "total_steps": 219, "loss": 0.2286, "lr": 2.0458237149014347e-07, "epoch": 2.7534246575342465, "percentage": 91.78, "elapsed_time": "0:06:33", "remaining_time": "0:00:35"}
202
- {"current_steps": 202, "total_steps": 219, "loss": 0.2296, "lr": 1.8261800572274001e-07, "epoch": 2.767123287671233, "percentage": 92.24, "elapsed_time": "0:06:34", "remaining_time": "0:00:33"}
203
- {"current_steps": 203, "total_steps": 219, "loss": 0.2116, "lr": 1.6187873328216142e-07, "epoch": 2.780821917808219, "percentage": 92.69, "elapsed_time": "0:06:35", "remaining_time": "0:00:31"}
204
- {"current_steps": 204, "total_steps": 219, "loss": 0.2032, "lr": 1.4236982830782676e-07, "epoch": 2.7945205479452055, "percentage": 93.15, "elapsed_time": "0:06:37", "remaining_time": "0:00:29"}
205
- {"current_steps": 205, "total_steps": 219, "loss": 0.2345, "lr": 1.2409625204825802e-07, "epoch": 2.808219178082192, "percentage": 93.61, "elapsed_time": "0:06:38", "remaining_time": "0:00:27"}
206
- {"current_steps": 206, "total_steps": 219, "loss": 0.19, "lr": 1.0706265159939944e-07, "epoch": 2.821917808219178, "percentage": 94.06, "elapsed_time": "0:06:39", "remaining_time": "0:00:25"}
207
- {"current_steps": 207, "total_steps": 219, "loss": 0.1803, "lr": 9.12733587228326e-08, "epoch": 2.8356164383561646, "percentage": 94.52, "elapsed_time": "0:06:41", "remaining_time": "0:00:23"}
208
- {"current_steps": 208, "total_steps": 219, "loss": 0.1956, "lr": 7.673238874417676e-08, "epoch": 2.8493150684931505, "percentage": 94.98, "elapsed_time": "0:06:42", "remaining_time": "0:00:21"}
209
- {"current_steps": 209, "total_steps": 219, "loss": 0.2221, "lr": 6.344343953196386e-08, "epoch": 2.863013698630137, "percentage": 95.43, "elapsed_time": "0:06:43", "remaining_time": "0:00:19"}
210
- {"current_steps": 210, "total_steps": 219, "loss": 0.2437, "lr": 5.1409890557246876e-08, "epoch": 2.8767123287671232, "percentage": 95.89, "elapsed_time": "0:06:45", "remaining_time": "0:00:17"}
211
- {"current_steps": 211, "total_steps": 219, "loss": 0.2314, "lr": 4.063480203417625e-08, "epoch": 2.8904109589041096, "percentage": 96.35, "elapsed_time": "0:06:46", "remaining_time": "0:00:15"}
212
- {"current_steps": 212, "total_steps": 219, "loss": 0.249, "lr": 3.1120914141766214e-08, "epoch": 2.904109589041096, "percentage": 96.8, "elapsed_time": "0:06:47", "remaining_time": "0:00:13"}
213
- {"current_steps": 213, "total_steps": 219, "loss": 0.2131, "lr": 2.287064632705005e-08, "epoch": 2.9178082191780823, "percentage": 97.26, "elapsed_time": "0:06:49", "remaining_time": "0:00:11"}
214
- {"current_steps": 214, "total_steps": 219, "loss": 0.2178, "lr": 1.588609668979446e-08, "epoch": 2.9315068493150687, "percentage": 97.72, "elapsed_time": "0:06:50", "remaining_time": "0:00:09"}
215
- {"current_steps": 215, "total_steps": 219, "loss": 0.2207, "lr": 1.016904144894304e-08, "epoch": 2.9452054794520546, "percentage": 98.17, "elapsed_time": "0:06:52", "remaining_time": "0:00:07"}
216
- {"current_steps": 216, "total_steps": 219, "loss": 0.2142, "lr": 5.720934490907604e-09, "epoch": 2.958904109589041, "percentage": 98.63, "elapsed_time": "0:06:53", "remaining_time": "0:00:05"}
217
- {"current_steps": 217, "total_steps": 219, "loss": 0.2298, "lr": 2.542906999836725e-09, "epoch": 2.9726027397260273, "percentage": 99.09, "elapsed_time": "0:06:54", "remaining_time": "0:00:03"}
218
- {"current_steps": 218, "total_steps": 219, "loss": 0.2056, "lr": 6.357671699486201e-10, "epoch": 2.9863013698630136, "percentage": 99.54, "elapsed_time": "0:06:56", "remaining_time": "0:00:01"}
219
- {"current_steps": 219, "total_steps": 219, "loss": 0.1987, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:06:57", "remaining_time": "0:00:00"}
220
- {"current_steps": 219, "total_steps": 219, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:09:06", "remaining_time": "0:00:00"}
 
1
+ {"current_steps": 1, "total_steps": 216, "loss": 0.4904, "lr": 4.5454545454545457e-07, "epoch": 0.013824884792626729, "percentage": 0.46, "elapsed_time": "0:00:06", "remaining_time": "0:23:47"}
2
+ {"current_steps": 2, "total_steps": 216, "loss": 0.4586, "lr": 9.090909090909091e-07, "epoch": 0.027649769585253458, "percentage": 0.93, "elapsed_time": "0:00:10", "remaining_time": "0:18:01"}
3
+ {"current_steps": 3, "total_steps": 216, "loss": 0.4491, "lr": 1.3636363636363636e-06, "epoch": 0.041474654377880185, "percentage": 1.39, "elapsed_time": "0:00:13", "remaining_time": "0:15:57"}
4
+ {"current_steps": 4, "total_steps": 216, "loss": 0.495, "lr": 1.8181818181818183e-06, "epoch": 0.055299539170506916, "percentage": 1.85, "elapsed_time": "0:00:16", "remaining_time": "0:14:59"}
5
+ {"current_steps": 5, "total_steps": 216, "loss": 0.4518, "lr": 2.2727272727272728e-06, "epoch": 0.06912442396313365, "percentage": 2.31, "elapsed_time": "0:00:20", "remaining_time": "0:14:22"}
6
+ {"current_steps": 6, "total_steps": 216, "loss": 0.4245, "lr": 2.7272727272727272e-06, "epoch": 0.08294930875576037, "percentage": 2.78, "elapsed_time": "0:00:23", "remaining_time": "0:13:56"}
7
+ {"current_steps": 7, "total_steps": 216, "loss": 0.4485, "lr": 3.181818181818182e-06, "epoch": 0.0967741935483871, "percentage": 3.24, "elapsed_time": "0:00:27", "remaining_time": "0:13:36"}
8
+ {"current_steps": 8, "total_steps": 216, "loss": 0.4126, "lr": 3.6363636363636366e-06, "epoch": 0.11059907834101383, "percentage": 3.7, "elapsed_time": "0:00:30", "remaining_time": "0:13:18"}
9
+ {"current_steps": 9, "total_steps": 216, "loss": 0.3782, "lr": 4.0909090909090915e-06, "epoch": 0.12442396313364056, "percentage": 4.17, "elapsed_time": "0:00:34", "remaining_time": "0:13:05"}
10
+ {"current_steps": 10, "total_steps": 216, "loss": 0.4114, "lr": 4.5454545454545455e-06, "epoch": 0.1382488479262673, "percentage": 4.63, "elapsed_time": "0:00:37", "remaining_time": "0:12:53"}
11
+ {"current_steps": 11, "total_steps": 216, "loss": 0.4018, "lr": 5e-06, "epoch": 0.15207373271889402, "percentage": 5.09, "elapsed_time": "0:00:40", "remaining_time": "0:12:42"}
12
+ {"current_steps": 12, "total_steps": 216, "loss": 0.3739, "lr": 5.4545454545454545e-06, "epoch": 0.16589861751152074, "percentage": 5.56, "elapsed_time": "0:00:44", "remaining_time": "0:12:33"}
13
+ {"current_steps": 13, "total_steps": 216, "loss": 0.3516, "lr": 5.90909090909091e-06, "epoch": 0.17972350230414746, "percentage": 6.02, "elapsed_time": "0:00:47", "remaining_time": "0:12:25"}
14
+ {"current_steps": 14, "total_steps": 216, "loss": 0.3873, "lr": 6.363636363636364e-06, "epoch": 0.1935483870967742, "percentage": 6.48, "elapsed_time": "0:00:51", "remaining_time": "0:12:18"}
15
+ {"current_steps": 15, "total_steps": 216, "loss": 0.3635, "lr": 6.818181818181818e-06, "epoch": 0.2073732718894009, "percentage": 6.94, "elapsed_time": "0:00:54", "remaining_time": "0:12:10"}
16
+ {"current_steps": 16, "total_steps": 216, "loss": 0.3538, "lr": 7.272727272727273e-06, "epoch": 0.22119815668202766, "percentage": 7.41, "elapsed_time": "0:00:57", "remaining_time": "0:12:04"}
17
+ {"current_steps": 17, "total_steps": 216, "loss": 0.3322, "lr": 7.727272727272727e-06, "epoch": 0.2350230414746544, "percentage": 7.87, "elapsed_time": "0:01:01", "remaining_time": "0:11:58"}
18
+ {"current_steps": 18, "total_steps": 216, "loss": 0.3175, "lr": 8.181818181818183e-06, "epoch": 0.2488479262672811, "percentage": 8.33, "elapsed_time": "0:01:04", "remaining_time": "0:11:52"}
19
+ {"current_steps": 19, "total_steps": 216, "loss": 0.2943, "lr": 8.636363636363637e-06, "epoch": 0.2626728110599078, "percentage": 8.8, "elapsed_time": "0:01:08", "remaining_time": "0:11:46"}
20
+ {"current_steps": 20, "total_steps": 216, "loss": 0.3269, "lr": 9.090909090909091e-06, "epoch": 0.2764976958525346, "percentage": 9.26, "elapsed_time": "0:01:11", "remaining_time": "0:11:40"}
21
+ {"current_steps": 21, "total_steps": 216, "loss": 0.3665, "lr": 9.545454545454547e-06, "epoch": 0.2903225806451613, "percentage": 9.72, "elapsed_time": "0:01:14", "remaining_time": "0:11:35"}
22
+ {"current_steps": 22, "total_steps": 216, "loss": 0.3081, "lr": 1e-05, "epoch": 0.30414746543778803, "percentage": 10.19, "elapsed_time": "0:01:18", "remaining_time": "0:11:30"}
23
+ {"current_steps": 23, "total_steps": 216, "loss": 0.3216, "lr": 9.999344418328161e-06, "epoch": 0.31797235023041476, "percentage": 10.65, "elapsed_time": "0:01:21", "remaining_time": "0:11:25"}
24
+ {"current_steps": 24, "total_steps": 216, "loss": 0.322, "lr": 9.997377845227577e-06, "epoch": 0.3317972350230415, "percentage": 11.11, "elapsed_time": "0:01:25", "remaining_time": "0:11:21"}
25
+ {"current_steps": 25, "total_steps": 216, "loss": 0.3406, "lr": 9.994100796397954e-06, "epoch": 0.3456221198156682, "percentage": 11.57, "elapsed_time": "0:01:28", "remaining_time": "0:11:16"}
26
+ {"current_steps": 26, "total_steps": 216, "loss": 0.342, "lr": 9.98951413118856e-06, "epoch": 0.35944700460829493, "percentage": 12.04, "elapsed_time": "0:01:32", "remaining_time": "0:11:12"}
27
+ {"current_steps": 27, "total_steps": 216, "loss": 0.3228, "lr": 9.983619052372847e-06, "epoch": 0.37327188940092165, "percentage": 12.5, "elapsed_time": "0:01:35", "remaining_time": "0:11:07"}
28
+ {"current_steps": 28, "total_steps": 216, "loss": 0.34, "lr": 9.97641710583307e-06, "epoch": 0.3870967741935484, "percentage": 12.96, "elapsed_time": "0:01:38", "remaining_time": "0:11:02"}
29
+ {"current_steps": 29, "total_steps": 216, "loss": 0.3624, "lr": 9.96791018015489e-06, "epoch": 0.4009216589861751, "percentage": 13.43, "elapsed_time": "0:01:42", "remaining_time": "0:10:58"}
30
+ {"current_steps": 30, "total_steps": 216, "loss": 0.3362, "lr": 9.958100506132127e-06, "epoch": 0.4147465437788018, "percentage": 13.89, "elapsed_time": "0:01:45", "remaining_time": "0:10:54"}
31
+ {"current_steps": 31, "total_steps": 216, "loss": 0.3306, "lr": 9.946990656181782e-06, "epoch": 0.42857142857142855, "percentage": 14.35, "elapsed_time": "0:01:48", "remaining_time": "0:10:49"}
32
+ {"current_steps": 32, "total_steps": 216, "loss": 0.333, "lr": 9.934583543669454e-06, "epoch": 0.4423963133640553, "percentage": 14.81, "elapsed_time": "0:01:52", "remaining_time": "0:10:45"}
33
+ {"current_steps": 33, "total_steps": 216, "loss": 0.3297, "lr": 9.920882422145372e-06, "epoch": 0.45622119815668205, "percentage": 15.28, "elapsed_time": "0:01:55", "remaining_time": "0:10:41"}
34
+ {"current_steps": 34, "total_steps": 216, "loss": 0.3474, "lr": 9.905890884491196e-06, "epoch": 0.4700460829493088, "percentage": 15.74, "elapsed_time": "0:01:59", "remaining_time": "0:10:37"}
35
+ {"current_steps": 35, "total_steps": 216, "loss": 0.3366, "lr": 9.889612861977855e-06, "epoch": 0.4838709677419355, "percentage": 16.2, "elapsed_time": "0:02:02", "remaining_time": "0:10:33"}
36
+ {"current_steps": 36, "total_steps": 216, "loss": 0.3247, "lr": 9.872052623234632e-06, "epoch": 0.4976958525345622, "percentage": 16.67, "elapsed_time": "0:02:05", "remaining_time": "0:10:28"}
37
+ {"current_steps": 37, "total_steps": 216, "loss": 0.3035, "lr": 9.853214773129796e-06, "epoch": 0.511520737327189, "percentage": 17.13, "elapsed_time": "0:02:09", "remaining_time": "0:10:25"}
38
+ {"current_steps": 38, "total_steps": 216, "loss": 0.3222, "lr": 9.833104251563058e-06, "epoch": 0.5253456221198156, "percentage": 17.59, "elapsed_time": "0:02:12", "remaining_time": "0:10:20"}
39
+ {"current_steps": 39, "total_steps": 216, "loss": 0.3557, "lr": 9.811726332170153e-06, "epoch": 0.5391705069124424, "percentage": 18.06, "elapsed_time": "0:02:15", "remaining_time": "0:10:17"}
40
+ {"current_steps": 40, "total_steps": 216, "loss": 0.3392, "lr": 9.789086620939936e-06, "epoch": 0.5529953917050692, "percentage": 18.52, "elapsed_time": "0:02:19", "remaining_time": "0:10:12"}
41
+ {"current_steps": 41, "total_steps": 216, "loss": 0.3305, "lr": 9.765191054744305e-06, "epoch": 0.5668202764976958, "percentage": 18.98, "elapsed_time": "0:02:22", "remaining_time": "0:10:08"}
42
+ {"current_steps": 42, "total_steps": 216, "loss": 0.3387, "lr": 9.740045899781353e-06, "epoch": 0.5806451612903226, "percentage": 19.44, "elapsed_time": "0:02:26", "remaining_time": "0:10:05"}
43
+ {"current_steps": 43, "total_steps": 216, "loss": 0.378, "lr": 9.713657749932172e-06, "epoch": 0.5944700460829493, "percentage": 19.91, "elapsed_time": "0:02:29", "remaining_time": "0:10:01"}
44
+ {"current_steps": 44, "total_steps": 216, "loss": 0.3808, "lr": 9.68603352503172e-06, "epoch": 0.6082949308755761, "percentage": 20.37, "elapsed_time": "0:02:32", "remaining_time": "0:09:57"}
45
+ {"current_steps": 45, "total_steps": 216, "loss": 0.3561, "lr": 9.657180469054213e-06, "epoch": 0.6221198156682027, "percentage": 20.83, "elapsed_time": "0:02:36", "remaining_time": "0:09:53"}
46
+ {"current_steps": 46, "total_steps": 216, "loss": 0.3224, "lr": 9.627106148213521e-06, "epoch": 0.6359447004608295, "percentage": 21.3, "elapsed_time": "0:02:39", "remaining_time": "0:09:49"}
47
+ {"current_steps": 47, "total_steps": 216, "loss": 0.3502, "lr": 9.595818448979061e-06, "epoch": 0.6497695852534562, "percentage": 21.76, "elapsed_time": "0:02:43", "remaining_time": "0:09:46"}
48
+ {"current_steps": 48, "total_steps": 216, "loss": 0.3172, "lr": 9.563325576007702e-06, "epoch": 0.663594470046083, "percentage": 22.22, "elapsed_time": "0:02:46", "remaining_time": "0:09:42"}
49
+ {"current_steps": 49, "total_steps": 216, "loss": 0.3078, "lr": 9.529636049992235e-06, "epoch": 0.6774193548387096, "percentage": 22.69, "elapsed_time": "0:02:49", "remaining_time": "0:09:38"}
50
+ {"current_steps": 50, "total_steps": 216, "loss": 0.3378, "lr": 9.494758705426978e-06, "epoch": 0.6912442396313364, "percentage": 23.15, "elapsed_time": "0:02:53", "remaining_time": "0:09:34"}
51
+ {"current_steps": 51, "total_steps": 216, "loss": 0.3749, "lr": 9.458702688291072e-06, "epoch": 0.7050691244239631, "percentage": 23.61, "elapsed_time": "0:02:56", "remaining_time": "0:09:31"}
52
+ {"current_steps": 52, "total_steps": 216, "loss": 0.3646, "lr": 9.421477453650118e-06, "epoch": 0.7188940092165899, "percentage": 24.07, "elapsed_time": "0:02:59", "remaining_time": "0:09:27"}
53
+ {"current_steps": 53, "total_steps": 216, "loss": 0.2952, "lr": 9.38309276317674e-06, "epoch": 0.7327188940092166, "percentage": 24.54, "elapsed_time": "0:03:03", "remaining_time": "0:09:23"}
54
+ {"current_steps": 54, "total_steps": 216, "loss": 0.3402, "lr": 9.343558682590757e-06, "epoch": 0.7465437788018433, "percentage": 25.0, "elapsed_time": "0:03:06", "remaining_time": "0:09:20"}
55
+ {"current_steps": 55, "total_steps": 216, "loss": 0.3157, "lr": 9.302885579019626e-06, "epoch": 0.7603686635944701, "percentage": 25.46, "elapsed_time": "0:03:10", "remaining_time": "0:09:16"}
56
+ {"current_steps": 56, "total_steps": 216, "loss": 0.3724, "lr": 9.261084118279846e-06, "epoch": 0.7741935483870968, "percentage": 25.93, "elapsed_time": "0:03:13", "remaining_time": "0:09:12"}
57
+ {"current_steps": 57, "total_steps": 216, "loss": 0.2915, "lr": 9.218165262080024e-06, "epoch": 0.7880184331797235, "percentage": 26.39, "elapsed_time": "0:03:16", "remaining_time": "0:09:09"}
58
+ {"current_steps": 58, "total_steps": 216, "loss": 0.3374, "lr": 9.174140265146356e-06, "epoch": 0.8018433179723502, "percentage": 26.85, "elapsed_time": "0:03:20", "remaining_time": "0:09:05"}
59
+ {"current_steps": 59, "total_steps": 216, "loss": 0.3119, "lr": 9.129020672271283e-06, "epoch": 0.815668202764977, "percentage": 27.31, "elapsed_time": "0:03:23", "remaining_time": "0:09:02"}
60
+ {"current_steps": 60, "total_steps": 216, "loss": 0.3139, "lr": 9.082818315286054e-06, "epoch": 0.8294930875576036, "percentage": 27.78, "elapsed_time": "0:03:27", "remaining_time": "0:08:58"}
61
+ {"current_steps": 61, "total_steps": 216, "loss": 0.3391, "lr": 9.035545309958048e-06, "epoch": 0.8433179723502304, "percentage": 28.24, "elapsed_time": "0:03:30", "remaining_time": "0:08:54"}
62
+ {"current_steps": 62, "total_steps": 216, "loss": 0.3385, "lr": 8.987214052813605e-06, "epoch": 0.8571428571428571, "percentage": 28.7, "elapsed_time": "0:03:33", "remaining_time": "0:08:51"}
63
+ {"current_steps": 63, "total_steps": 216, "loss": 0.3216, "lr": 8.937837217887273e-06, "epoch": 0.8709677419354839, "percentage": 29.17, "elapsed_time": "0:03:37", "remaining_time": "0:08:47"}
64
+ {"current_steps": 64, "total_steps": 216, "loss": 0.2931, "lr": 8.887427753398249e-06, "epoch": 0.8847926267281107, "percentage": 29.63, "elapsed_time": "0:03:40", "remaining_time": "0:08:44"}
65
+ {"current_steps": 65, "total_steps": 216, "loss": 0.3172, "lr": 8.83599887835493e-06, "epoch": 0.8986175115207373, "percentage": 30.09, "elapsed_time": "0:03:44", "remaining_time": "0:08:40"}
66
+ {"current_steps": 66, "total_steps": 216, "loss": 0.3882, "lr": 8.783564079088478e-06, "epoch": 0.9124423963133641, "percentage": 30.56, "elapsed_time": "0:03:47", "remaining_time": "0:08:37"}
67
+ {"current_steps": 67, "total_steps": 216, "loss": 0.2963, "lr": 8.730137105716231e-06, "epoch": 0.9262672811059908, "percentage": 31.02, "elapsed_time": "0:03:50", "remaining_time": "0:08:33"}
68
+ {"current_steps": 68, "total_steps": 216, "loss": 0.2824, "lr": 8.675731968536004e-06, "epoch": 0.9400921658986175, "percentage": 31.48, "elapsed_time": "0:03:54", "remaining_time": "0:08:30"}
69
+ {"current_steps": 69, "total_steps": 216, "loss": 0.3439, "lr": 8.620362934352109e-06, "epoch": 0.9539170506912442, "percentage": 31.94, "elapsed_time": "0:03:57", "remaining_time": "0:08:26"}
70
+ {"current_steps": 70, "total_steps": 216, "loss": 0.345, "lr": 8.564044522734147e-06, "epoch": 0.967741935483871, "percentage": 32.41, "elapsed_time": "0:04:01", "remaining_time": "0:08:23"}
71
+ {"current_steps": 71, "total_steps": 216, "loss": 0.3383, "lr": 8.506791502209497e-06, "epoch": 0.9815668202764977, "percentage": 32.87, "elapsed_time": "0:04:04", "remaining_time": "0:08:19"}
72
+ {"current_steps": 72, "total_steps": 216, "loss": 0.31, "lr": 8.448618886390523e-06, "epoch": 0.9953917050691244, "percentage": 33.33, "elapsed_time": "0:04:08", "remaining_time": "0:08:16"}
73
+ {"current_steps": 73, "total_steps": 216, "loss": 0.4918, "lr": 8.389541930037516e-06, "epoch": 1.0092165898617511, "percentage": 33.8, "elapsed_time": "0:05:10", "remaining_time": "0:10:08"}
74
+ {"current_steps": 74, "total_steps": 216, "loss": 0.284, "lr": 8.329576125058406e-06, "epoch": 1.023041474654378, "percentage": 34.26, "elapsed_time": "0:05:14", "remaining_time": "0:10:03"}
75
+ {"current_steps": 75, "total_steps": 216, "loss": 0.2914, "lr": 8.268737196446264e-06, "epoch": 1.0368663594470047, "percentage": 34.72, "elapsed_time": "0:05:17", "remaining_time": "0:09:57"}
76
+ {"current_steps": 76, "total_steps": 216, "loss": 0.2723, "lr": 8.207041098155701e-06, "epoch": 1.0506912442396312, "percentage": 35.19, "elapsed_time": "0:05:21", "remaining_time": "0:09:51"}
77
+ {"current_steps": 77, "total_steps": 216, "loss": 0.3119, "lr": 8.144504008919224e-06, "epoch": 1.064516129032258, "percentage": 35.65, "elapsed_time": "0:05:24", "remaining_time": "0:09:45"}
78
+ {"current_steps": 78, "total_steps": 216, "loss": 0.2598, "lr": 8.081142328004638e-06, "epoch": 1.0783410138248848, "percentage": 36.11, "elapsed_time": "0:05:28", "remaining_time": "0:09:40"}
79
+ {"current_steps": 79, "total_steps": 216, "loss": 0.322, "lr": 8.016972670914624e-06, "epoch": 1.0921658986175116, "percentage": 36.57, "elapsed_time": "0:05:31", "remaining_time": "0:09:34"}
80
+ {"current_steps": 80, "total_steps": 216, "loss": 0.2509, "lr": 7.952011865029614e-06, "epoch": 1.1059907834101383, "percentage": 37.04, "elapsed_time": "0:05:34", "remaining_time": "0:09:29"}
81
+ {"current_steps": 81, "total_steps": 216, "loss": 0.2206, "lr": 7.886276945195098e-06, "epoch": 1.119815668202765, "percentage": 37.5, "elapsed_time": "0:05:38", "remaining_time": "0:09:24"}
82
+ {"current_steps": 82, "total_steps": 216, "loss": 0.2954, "lr": 7.819785149254534e-06, "epoch": 1.1336405529953917, "percentage": 37.96, "elapsed_time": "0:05:41", "remaining_time": "0:09:18"}
83
+ {"current_steps": 83, "total_steps": 216, "loss": 0.2628, "lr": 7.752553913529019e-06, "epoch": 1.1474654377880185, "percentage": 38.43, "elapsed_time": "0:05:45", "remaining_time": "0:09:13"}
84
+ {"current_steps": 84, "total_steps": 216, "loss": 0.3206, "lr": 7.68460086824492e-06, "epoch": 1.1612903225806452, "percentage": 38.89, "elapsed_time": "0:05:48", "remaining_time": "0:09:08"}
85
+ {"current_steps": 85, "total_steps": 216, "loss": 0.2363, "lr": 7.61594383291065e-06, "epoch": 1.1751152073732718, "percentage": 39.35, "elapsed_time": "0:05:52", "remaining_time": "0:09:03"}
86
+ {"current_steps": 86, "total_steps": 216, "loss": 0.3353, "lr": 7.546600811643816e-06, "epoch": 1.1889400921658986, "percentage": 39.81, "elapsed_time": "0:05:55", "remaining_time": "0:08:57"}
87
+ {"current_steps": 87, "total_steps": 216, "loss": 0.2618, "lr": 7.476589988449939e-06, "epoch": 1.2027649769585254, "percentage": 40.28, "elapsed_time": "0:05:59", "remaining_time": "0:08:52"}
88
+ {"current_steps": 88, "total_steps": 216, "loss": 0.2639, "lr": 7.405929722454026e-06, "epoch": 1.2165898617511521, "percentage": 40.74, "elapsed_time": "0:06:02", "remaining_time": "0:08:47"}
89
+ {"current_steps": 89, "total_steps": 216, "loss": 0.2477, "lr": 7.334638543086203e-06, "epoch": 1.230414746543779, "percentage": 41.2, "elapsed_time": "0:06:06", "remaining_time": "0:08:42"}
90
+ {"current_steps": 90, "total_steps": 216, "loss": 0.2437, "lr": 7.262735145222696e-06, "epoch": 1.2442396313364055, "percentage": 41.67, "elapsed_time": "0:06:09", "remaining_time": "0:08:37"}
91
+ {"current_steps": 91, "total_steps": 216, "loss": 0.2625, "lr": 7.190238384283413e-06, "epoch": 1.2580645161290323, "percentage": 42.13, "elapsed_time": "0:06:13", "remaining_time": "0:08:32"}
92
+ {"current_steps": 92, "total_steps": 216, "loss": 0.2838, "lr": 7.117167271287453e-06, "epoch": 1.271889400921659, "percentage": 42.59, "elapsed_time": "0:06:16", "remaining_time": "0:08:27"}
93
+ {"current_steps": 93, "total_steps": 216, "loss": 0.2596, "lr": 7.043540967867782e-06, "epoch": 1.2857142857142856, "percentage": 43.06, "elapsed_time": "0:06:20", "remaining_time": "0:08:22"}
94
+ {"current_steps": 94, "total_steps": 216, "loss": 0.295, "lr": 6.969378781246436e-06, "epoch": 1.2995391705069124, "percentage": 43.52, "elapsed_time": "0:06:23", "remaining_time": "0:08:17"}
95
+ {"current_steps": 95, "total_steps": 216, "loss": 0.2478, "lr": 6.894700159171535e-06, "epoch": 1.3133640552995391, "percentage": 43.98, "elapsed_time": "0:06:27", "remaining_time": "0:08:13"}
96
+ {"current_steps": 96, "total_steps": 216, "loss": 0.2375, "lr": 6.819524684817439e-06, "epoch": 1.327188940092166, "percentage": 44.44, "elapsed_time": "0:06:30", "remaining_time": "0:08:08"}
97
+ {"current_steps": 97, "total_steps": 216, "loss": 0.293, "lr": 6.743872071649411e-06, "epoch": 1.3410138248847927, "percentage": 44.91, "elapsed_time": "0:06:34", "remaining_time": "0:08:03"}
98
+ {"current_steps": 98, "total_steps": 216, "loss": 0.2759, "lr": 6.667762158254104e-06, "epoch": 1.3548387096774195, "percentage": 45.37, "elapsed_time": "0:06:37", "remaining_time": "0:07:58"}
99
+ {"current_steps": 99, "total_steps": 216, "loss": 0.2919, "lr": 6.591214903137221e-06, "epoch": 1.368663594470046, "percentage": 45.83, "elapsed_time": "0:06:41", "remaining_time": "0:07:54"}
100
+ {"current_steps": 100, "total_steps": 216, "loss": 0.3236, "lr": 6.514250379489754e-06, "epoch": 1.3824884792626728, "percentage": 46.3, "elapsed_time": "0:06:44", "remaining_time": "0:07:49"}
101
+ {"current_steps": 101, "total_steps": 216, "loss": 0.2599, "lr": 6.436888769924142e-06, "epoch": 1.3963133640552996, "percentage": 46.76, "elapsed_time": "0:06:47", "remaining_time": "0:07:44"}
102
+ {"current_steps": 102, "total_steps": 216, "loss": 0.2881, "lr": 6.3591503611817155e-06, "epoch": 1.4101382488479262, "percentage": 47.22, "elapsed_time": "0:06:51", "remaining_time": "0:07:39"}
103
+ {"current_steps": 103, "total_steps": 216, "loss": 0.2528, "lr": 6.281055538812861e-06, "epoch": 1.423963133640553, "percentage": 47.69, "elapsed_time": "0:06:54", "remaining_time": "0:07:35"}
104
+ {"current_steps": 104, "total_steps": 216, "loss": 0.2586, "lr": 6.202624781831269e-06, "epoch": 1.4377880184331797, "percentage": 48.15, "elapsed_time": "0:06:58", "remaining_time": "0:07:30"}
105
+ {"current_steps": 105, "total_steps": 216, "loss": 0.2933, "lr": 6.123878657343648e-06, "epoch": 1.4516129032258065, "percentage": 48.61, "elapsed_time": "0:07:01", "remaining_time": "0:07:25"}
106
+ {"current_steps": 106, "total_steps": 216, "loss": 0.2682, "lr": 6.044837815156377e-06, "epoch": 1.4654377880184333, "percentage": 49.07, "elapsed_time": "0:07:05", "remaining_time": "0:07:21"}
107
+ {"current_steps": 107, "total_steps": 216, "loss": 0.2574, "lr": 5.965522982360441e-06, "epoch": 1.4792626728110598, "percentage": 49.54, "elapsed_time": "0:07:08", "remaining_time": "0:07:16"}
108
+ {"current_steps": 108, "total_steps": 216, "loss": 0.256, "lr": 5.885954957896115e-06, "epoch": 1.4930875576036866, "percentage": 50.0, "elapsed_time": "0:07:12", "remaining_time": "0:07:12"}
109
+ {"current_steps": 109, "total_steps": 216, "loss": 0.3367, "lr": 5.806154607098799e-06, "epoch": 1.5069124423963134, "percentage": 50.46, "elapsed_time": "0:07:15", "remaining_time": "0:07:07"}
110
+ {"current_steps": 110, "total_steps": 216, "loss": 0.2801, "lr": 5.726142856227453e-06, "epoch": 1.52073732718894, "percentage": 50.93, "elapsed_time": "0:07:19", "remaining_time": "0:07:03"}
111
+ {"current_steps": 111, "total_steps": 216, "loss": 0.2512, "lr": 5.645940686977033e-06, "epoch": 1.5345622119815667, "percentage": 51.39, "elapsed_time": "0:07:22", "remaining_time": "0:06:58"}
112
+ {"current_steps": 112, "total_steps": 216, "loss": 0.2938, "lr": 5.5655691309764225e-06, "epoch": 1.5483870967741935, "percentage": 51.85, "elapsed_time": "0:07:26", "remaining_time": "0:06:54"}
113
+ {"current_steps": 113, "total_steps": 216, "loss": 0.2598, "lr": 5.485049264273241e-06, "epoch": 1.5622119815668203, "percentage": 52.31, "elapsed_time": "0:07:29", "remaining_time": "0:06:49"}
114
+ {"current_steps": 114, "total_steps": 216, "loss": 0.2587, "lr": 5.404402201807022e-06, "epoch": 1.576036866359447, "percentage": 52.78, "elapsed_time": "0:07:32", "remaining_time": "0:06:45"}
115
+ {"current_steps": 115, "total_steps": 216, "loss": 0.2917, "lr": 5.323649091872179e-06, "epoch": 1.5898617511520738, "percentage": 53.24, "elapsed_time": "0:07:36", "remaining_time": "0:06:40"}
116
+ {"current_steps": 116, "total_steps": 216, "loss": 0.2357, "lr": 5.242811110572243e-06, "epoch": 1.6036866359447006, "percentage": 53.7, "elapsed_time": "0:07:39", "remaining_time": "0:06:36"}
117
+ {"current_steps": 117, "total_steps": 216, "loss": 0.2259, "lr": 5.161909456266781e-06, "epoch": 1.6175115207373272, "percentage": 54.17, "elapsed_time": "0:07:43", "remaining_time": "0:06:31"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:068cb1b51236a064603b57f3353fdf5080f8a630a6847994129d2d7cabd6b163
3
  size 7288
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a91811e6e07dfcc842e6192d8eeb61b5cea677543130cfcef6e39900b918e368
3
  size 7288