File size: 12,303 Bytes
a560675
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
{"current_steps": 10, "total_steps": 555, "loss": 0.9678, "learning_rate": 1.7857142857142859e-06, "epoch": 0.05398110661268556, "percentage": 1.8, "elapsed_time": "0:00:45", "remaining_time": "0:41:11"}
{"current_steps": 20, "total_steps": 555, "loss": 0.6964, "learning_rate": 3.5714285714285718e-06, "epoch": 0.10796221322537113, "percentage": 3.6, "elapsed_time": "0:01:32", "remaining_time": "0:41:21"}
{"current_steps": 30, "total_steps": 555, "loss": 0.4919, "learning_rate": 5.357142857142857e-06, "epoch": 0.16194331983805668, "percentage": 5.41, "elapsed_time": "0:02:21", "remaining_time": "0:41:18"}
{"current_steps": 40, "total_steps": 555, "loss": 0.4628, "learning_rate": 7.1428571428571436e-06, "epoch": 0.21592442645074225, "percentage": 7.21, "elapsed_time": "0:03:12", "remaining_time": "0:41:22"}
{"current_steps": 50, "total_steps": 555, "loss": 0.3842, "learning_rate": 8.92857142857143e-06, "epoch": 0.2699055330634278, "percentage": 9.01, "elapsed_time": "0:03:55", "remaining_time": "0:39:39"}
{"current_steps": 60, "total_steps": 555, "loss": 0.4654, "learning_rate": 9.998414611537682e-06, "epoch": 0.32388663967611336, "percentage": 10.81, "elapsed_time": "0:04:44", "remaining_time": "0:39:08"}
{"current_steps": 70, "total_steps": 555, "loss": 0.3943, "learning_rate": 9.980590535514234e-06, "epoch": 0.37786774628879893, "percentage": 12.61, "elapsed_time": "0:05:32", "remaining_time": "0:38:20"}
{"current_steps": 80, "total_steps": 555, "loss": 0.3839, "learning_rate": 9.943031509146825e-06, "epoch": 0.4318488529014845, "percentage": 14.41, "elapsed_time": "0:06:12", "remaining_time": "0:36:51"}
{"current_steps": 90, "total_steps": 555, "loss": 0.3731, "learning_rate": 9.885886355253758e-06, "epoch": 0.48582995951417, "percentage": 16.22, "elapsed_time": "0:06:59", "remaining_time": "0:36:05"}
{"current_steps": 100, "total_steps": 555, "loss": 0.3932, "learning_rate": 9.809381504168235e-06, "epoch": 0.5398110661268556, "percentage": 18.02, "elapsed_time": "0:07:41", "remaining_time": "0:34:59"}
{"current_steps": 100, "total_steps": 555, "eval_loss": 0.3728838264942169, "epoch": 0.5398110661268556, "percentage": 18.02, "elapsed_time": "0:08:17", "remaining_time": "0:37:43"}
{"current_steps": 110, "total_steps": 555, "loss": 0.4067, "learning_rate": 9.713820096537226e-06, "epoch": 0.5937921727395412, "percentage": 19.82, "elapsed_time": "0:09:24", "remaining_time": "0:38:02"}
{"current_steps": 120, "total_steps": 555, "loss": 0.3586, "learning_rate": 9.599580782165598e-06, "epoch": 0.6477732793522267, "percentage": 21.62, "elapsed_time": "0:10:09", "remaining_time": "0:36:47"}
{"current_steps": 130, "total_steps": 555, "loss": 0.3675, "learning_rate": 9.467116219664893e-06, "epoch": 0.7017543859649122, "percentage": 23.42, "elapsed_time": "0:10:54", "remaining_time": "0:35:41"}
{"current_steps": 140, "total_steps": 555, "loss": 0.3823, "learning_rate": 9.316951282851708e-06, "epoch": 0.7557354925775979, "percentage": 25.23, "elapsed_time": "0:11:36", "remaining_time": "0:34:23"}
{"current_steps": 150, "total_steps": 555, "loss": 0.3965, "learning_rate": 9.149680981002609e-06, "epoch": 0.8097165991902834, "percentage": 27.03, "elapsed_time": "0:12:21", "remaining_time": "0:33:22"}
{"current_steps": 160, "total_steps": 555, "loss": 0.3643, "learning_rate": 8.965968101206291e-06, "epoch": 0.863697705802969, "percentage": 28.83, "elapsed_time": "0:13:10", "remaining_time": "0:32:32"}
{"current_steps": 170, "total_steps": 555, "loss": 0.3892, "learning_rate": 8.76654058215486e-06, "epoch": 0.9176788124156545, "percentage": 30.63, "elapsed_time": "0:13:59", "remaining_time": "0:31:41"}
{"current_steps": 180, "total_steps": 555, "loss": 0.3469, "learning_rate": 8.552188629780245e-06, "epoch": 0.97165991902834, "percentage": 32.43, "elapsed_time": "0:14:47", "remaining_time": "0:30:49"}
{"current_steps": 190, "total_steps": 555, "loss": 0.3549, "learning_rate": 8.323761586164695e-06, "epoch": 1.0256410256410255, "percentage": 34.23, "elapsed_time": "0:15:34", "remaining_time": "0:29:55"}
{"current_steps": 200, "total_steps": 555, "loss": 0.235, "learning_rate": 8.082164564131844e-06, "epoch": 1.0796221322537112, "percentage": 36.04, "elapsed_time": "0:16:24", "remaining_time": "0:29:06"}
{"current_steps": 200, "total_steps": 555, "eval_loss": 0.36726805567741394, "epoch": 1.0796221322537112, "percentage": 36.04, "elapsed_time": "0:16:59", "remaining_time": "0:30:09"}
{"current_steps": 210, "total_steps": 555, "loss": 0.2505, "learning_rate": 7.8283548608534e-06, "epoch": 1.1336032388663968, "percentage": 37.84, "elapsed_time": "0:18:11", "remaining_time": "0:29:53"}
{"current_steps": 220, "total_steps": 555, "loss": 0.2495, "learning_rate": 7.563338164682036e-06, "epoch": 1.1875843454790824, "percentage": 39.64, "elapsed_time": "0:19:02", "remaining_time": "0:29:00"}
{"current_steps": 230, "total_steps": 555, "loss": 0.2302, "learning_rate": 7.2881645702404625e-06, "epoch": 1.2415654520917678, "percentage": 41.44, "elapsed_time": "0:19:44", "remaining_time": "0:27:53"}
{"current_steps": 240, "total_steps": 555, "loss": 0.2603, "learning_rate": 7.003924417556344e-06, "epoch": 1.2955465587044535, "percentage": 43.24, "elapsed_time": "0:20:31", "remaining_time": "0:26:56"}
{"current_steps": 250, "total_steps": 555, "loss": 0.2452, "learning_rate": 6.711743971729967e-06, "epoch": 1.349527665317139, "percentage": 45.05, "elapsed_time": "0:21:16", "remaining_time": "0:25:57"}
{"current_steps": 260, "total_steps": 555, "loss": 0.2402, "learning_rate": 6.412780960253437e-06, "epoch": 1.4035087719298245, "percentage": 46.85, "elapsed_time": "0:22:01", "remaining_time": "0:24:59"}
{"current_steps": 270, "total_steps": 555, "loss": 0.2366, "learning_rate": 6.108219985664161e-06, "epoch": 1.45748987854251, "percentage": 48.65, "elapsed_time": "0:22:45", "remaining_time": "0:24:01"}
{"current_steps": 280, "total_steps": 555, "loss": 0.2307, "learning_rate": 5.799267831709442e-06, "epoch": 1.5114709851551957, "percentage": 50.45, "elapsed_time": "0:23:33", "remaining_time": "0:23:08"}
{"current_steps": 290, "total_steps": 555, "loss": 0.2561, "learning_rate": 5.487148681620862e-06, "epoch": 1.5654520917678814, "percentage": 52.25, "elapsed_time": "0:24:17", "remaining_time": "0:22:11"}
{"current_steps": 300, "total_steps": 555, "loss": 0.2243, "learning_rate": 5.173099267445452e-06, "epoch": 1.6194331983805668, "percentage": 54.05, "elapsed_time": "0:25:00", "remaining_time": "0:21:15"}
{"current_steps": 300, "total_steps": 555, "eval_loss": 0.3492150604724884, "epoch": 1.6194331983805668, "percentage": 54.05, "elapsed_time": "0:25:36", "remaining_time": "0:21:45"}
{"current_steps": 310, "total_steps": 555, "loss": 0.2575, "learning_rate": 4.8583639696537815e-06, "epoch": 1.6734143049932524, "percentage": 55.86, "elapsed_time": "0:26:46", "remaining_time": "0:21:09"}
{"current_steps": 320, "total_steps": 555, "loss": 0.2749, "learning_rate": 4.544189886442163e-06, "epoch": 1.7273954116059378, "percentage": 57.66, "elapsed_time": "0:27:31", "remaining_time": "0:20:12"}
{"current_steps": 330, "total_steps": 555, "loss": 0.2442, "learning_rate": 4.23182189226621e-06, "epoch": 1.7813765182186234, "percentage": 59.46, "elapsed_time": "0:28:18", "remaining_time": "0:19:17"}
{"current_steps": 340, "total_steps": 555, "loss": 0.2275, "learning_rate": 3.9224977051856906e-06, "epoch": 1.835357624831309, "percentage": 61.26, "elapsed_time": "0:28:58", "remaining_time": "0:18:19"}
{"current_steps": 350, "total_steps": 555, "loss": 0.2461, "learning_rate": 3.6174429825656687e-06, "epoch": 1.8893387314439947, "percentage": 63.06, "elapsed_time": "0:29:46", "remaining_time": "0:17:26"}
{"current_steps": 360, "total_steps": 555, "loss": 0.24, "learning_rate": 3.317866464566607e-06, "epoch": 1.9433198380566803, "percentage": 64.86, "elapsed_time": "0:30:32", "remaining_time": "0:16:32"}
{"current_steps": 370, "total_steps": 555, "loss": 0.2394, "learning_rate": 3.0249551846667207e-06, "epoch": 1.9973009446693657, "percentage": 66.67, "elapsed_time": "0:31:19", "remaining_time": "0:15:39"}
{"current_steps": 380, "total_steps": 555, "loss": 0.1461, "learning_rate": 2.7398697661942632e-06, "epoch": 2.051282051282051, "percentage": 68.47, "elapsed_time": "0:32:03", "remaining_time": "0:14:45"}
{"current_steps": 390, "total_steps": 555, "loss": 0.1443, "learning_rate": 2.4637398235066527e-06, "epoch": 2.1052631578947367, "percentage": 70.27, "elapsed_time": "0:32:50", "remaining_time": "0:13:53"}
{"current_steps": 400, "total_steps": 555, "loss": 0.1416, "learning_rate": 2.19765948603866e-06, "epoch": 2.1592442645074224, "percentage": 72.07, "elapsed_time": "0:33:37", "remaining_time": "0:13:01"}
{"current_steps": 400, "total_steps": 555, "eval_loss": 0.37677058577537537, "epoch": 2.1592442645074224, "percentage": 72.07, "elapsed_time": "0:34:13", "remaining_time": "0:13:15"}
{"current_steps": 410, "total_steps": 555, "loss": 0.1282, "learning_rate": 1.9426830629550244e-06, "epoch": 2.213225371120108, "percentage": 73.87, "elapsed_time": "0:35:21", "remaining_time": "0:12:30"}
{"current_steps": 420, "total_steps": 555, "loss": 0.1444, "learning_rate": 1.699820865585814e-06, "epoch": 2.2672064777327936, "percentage": 75.68, "elapsed_time": "0:35:59", "remaining_time": "0:11:34"}
{"current_steps": 430, "total_steps": 555, "loss": 0.135, "learning_rate": 1.470035204197517e-06, "epoch": 2.3211875843454792, "percentage": 77.48, "elapsed_time": "0:36:45", "remaining_time": "0:10:41"}
{"current_steps": 440, "total_steps": 555, "loss": 0.124, "learning_rate": 1.2542365749622048e-06, "epoch": 2.375168690958165, "percentage": 79.28, "elapsed_time": "0:37:34", "remaining_time": "0:09:49"}
{"current_steps": 450, "total_steps": 555, "loss": 0.1336, "learning_rate": 1.0532800522333902e-06, "epoch": 2.42914979757085, "percentage": 81.08, "elapsed_time": "0:38:19", "remaining_time": "0:08:56"}
{"current_steps": 460, "total_steps": 555, "loss": 0.1265, "learning_rate": 8.679619004237111e-07, "epoch": 2.4831309041835357, "percentage": 82.88, "elapsed_time": "0:39:04", "remaining_time": "0:08:04"}
{"current_steps": 470, "total_steps": 555, "loss": 0.1378, "learning_rate": 6.990164189094589e-07, "epoch": 2.5371120107962213, "percentage": 84.68, "elapsed_time": "0:39:49", "remaining_time": "0:07:12"}
{"current_steps": 480, "total_steps": 555, "loss": 0.1156, "learning_rate": 5.471130324636115e-07, "epoch": 2.591093117408907, "percentage": 86.49, "elapsed_time": "0:40:39", "remaining_time": "0:06:21"}
{"current_steps": 490, "total_steps": 555, "loss": 0.1174, "learning_rate": 4.12853638746134e-07, "epoch": 2.6450742240215925, "percentage": 88.29, "elapsed_time": "0:41:22", "remaining_time": "0:05:29"}
{"current_steps": 500, "total_steps": 555, "loss": 0.1247, "learning_rate": 2.9677022336181414e-07, "epoch": 2.699055330634278, "percentage": 90.09, "elapsed_time": "0:42:17", "remaining_time": "0:04:39"}
{"current_steps": 500, "total_steps": 555, "eval_loss": 0.384060263633728, "epoch": 2.699055330634278, "percentage": 90.09, "elapsed_time": "0:42:53", "remaining_time": "0:04:43"}
{"current_steps": 510, "total_steps": 555, "loss": 0.1213, "learning_rate": 1.993227519356189e-07, "epoch": 2.753036437246964, "percentage": 91.89, "elapsed_time": "0:44:02", "remaining_time": "0:03:53"}
{"current_steps": 520, "total_steps": 555, "loss": 0.1303, "learning_rate": 1.2089734755797611e-07, "epoch": 2.807017543859649, "percentage": 93.69, "elapsed_time": "0:44:48", "remaining_time": "0:03:00"}
{"current_steps": 530, "total_steps": 555, "loss": 0.1234, "learning_rate": 6.180476082162656e-08, "epoch": 2.8609986504723346, "percentage": 95.5, "elapsed_time": "0:45:35", "remaining_time": "0:02:09"}
{"current_steps": 540, "total_steps": 555, "loss": 0.1329, "learning_rate": 2.227913851230057e-08, "epoch": 2.91497975708502, "percentage": 97.3, "elapsed_time": "0:46:16", "remaining_time": "0:01:17"}
{"current_steps": 550, "total_steps": 555, "loss": 0.139, "learning_rate": 2.4770958321568283e-09, "epoch": 2.968960863697706, "percentage": 99.1, "elapsed_time": "0:47:05", "remaining_time": "0:00:25"}
{"current_steps": 555, "total_steps": 555, "epoch": 2.9959514170040484, "percentage": 100.0, "elapsed_time": "0:47:51", "remaining_time": "0:00:00"}