sedrickkeh commited on
Commit
b489075
·
verified ·
1 Parent(s): 4b8278a

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf0c25c85922ea2f2f611ee9cdd50b8b1045cffc9dec7bf6557d20a7d09825f0
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a34a9e5b25cd1055ae7aa0bfcf0a258f56c65dd7df68759753bf70c20f84ff4
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f146dca0ef08a3acf5a781f005c038a3432eeedbb21ebb8a878184d03de2b80
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f32c62b39bf8f4073dcadb2b49178f70ad45348736cee00ac3795f7b813b259a
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a953b7d295c2c30ac799f485a1405aed614a8fa304453faba84d63826f9b43b
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4be9c18016feb23c1d34f5732268794381043bc2366fa72b1022896a648c8a5d
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f144ff612a09e03b2dbde7c1801c0b3b4d9c72b4df6a2c338353f758b9fdd15e
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bef089507508ddaa4833aed8a2ad3bb0991e46b9f6b42c37e0d4ee6ce781585
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -55,3 +55,31 @@
55
  {"current_steps": 55, "total_steps": 84, "loss": 0.7228, "lr": 2.6057118107127402e-05, "epoch": 1.9262472885032538, "percentage": 65.48, "elapsed_time": "2:23:34", "remaining_time": "1:15:42"}
56
  {"current_steps": 56, "total_steps": 84, "loss": 0.7208, "lr": 2.4499376541915883e-05, "epoch": 1.9609544468546638, "percentage": 66.67, "elapsed_time": "2:26:07", "remaining_time": "1:13:03"}
57
  {"current_steps": 57, "total_steps": 84, "loss": 1.1849, "lr": 2.2968828337397095e-05, "epoch": 2.013015184381779, "percentage": 67.86, "elapsed_time": "2:30:19", "remaining_time": "1:11:12"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  {"current_steps": 55, "total_steps": 84, "loss": 0.7228, "lr": 2.6057118107127402e-05, "epoch": 1.9262472885032538, "percentage": 65.48, "elapsed_time": "2:23:34", "remaining_time": "1:15:42"}
56
  {"current_steps": 56, "total_steps": 84, "loss": 0.7208, "lr": 2.4499376541915883e-05, "epoch": 1.9609544468546638, "percentage": 66.67, "elapsed_time": "2:26:07", "remaining_time": "1:13:03"}
57
  {"current_steps": 57, "total_steps": 84, "loss": 1.1849, "lr": 2.2968828337397095e-05, "epoch": 2.013015184381779, "percentage": 67.86, "elapsed_time": "2:30:19", "remaining_time": "1:11:12"}
58
+ {"current_steps": 58, "total_steps": 84, "loss": 0.6845, "lr": 2.1468158595205543e-05, "epoch": 2.0477223427331888, "percentage": 69.05, "elapsed_time": "2:32:52", "remaining_time": "1:08:31"}
59
+ {"current_steps": 59, "total_steps": 84, "loss": 0.681, "lr": 2.0000000000000012e-05, "epoch": 2.0824295010845986, "percentage": 70.24, "elapsed_time": "2:35:26", "remaining_time": "1:05:51"}
60
+ {"current_steps": 60, "total_steps": 84, "loss": 0.6803, "lr": 1.8566928200840128e-05, "epoch": 2.117136659436009, "percentage": 71.43, "elapsed_time": "2:37:59", "remaining_time": "1:03:11"}
61
+ {"current_steps": 61, "total_steps": 84, "loss": 0.6756, "lr": 1.7171457292622736e-05, "epoch": 2.1518438177874186, "percentage": 72.62, "elapsed_time": "2:40:33", "remaining_time": "1:00:32"}
62
+ {"current_steps": 62, "total_steps": 84, "loss": 0.6713, "lr": 1.5816035405505007e-05, "epoch": 2.1865509761388284, "percentage": 73.81, "elapsed_time": "2:43:06", "remaining_time": "0:57:52"}
63
+ {"current_steps": 63, "total_steps": 84, "loss": 0.6778, "lr": 1.4503040410052412e-05, "epoch": 2.2212581344902387, "percentage": 75.0, "elapsed_time": "2:45:39", "remaining_time": "0:55:13"}
64
+ {"current_steps": 64, "total_steps": 84, "loss": 0.6733, "lr": 1.3234775745645684e-05, "epoch": 2.2559652928416485, "percentage": 76.19, "elapsed_time": "2:48:12", "remaining_time": "0:52:33"}
65
+ {"current_steps": 65, "total_steps": 84, "loss": 0.673, "lr": 1.201346637946538e-05, "epoch": 2.2906724511930587, "percentage": 77.38, "elapsed_time": "2:50:45", "remaining_time": "0:49:54"}
66
+ {"current_steps": 66, "total_steps": 84, "loss": 0.6758, "lr": 1.0841254903143547e-05, "epoch": 2.3253796095444685, "percentage": 78.57, "elapsed_time": "2:53:18", "remaining_time": "0:47:15"}
67
+ {"current_steps": 67, "total_steps": 84, "loss": 0.6708, "lr": 9.720197773929749e-06, "epoch": 2.3600867678958783, "percentage": 79.76, "elapsed_time": "2:55:51", "remaining_time": "0:44:37"}
68
+ {"current_steps": 68, "total_steps": 84, "loss": 0.6694, "lr": 8.652261706966412e-06, "epoch": 2.3947939262472886, "percentage": 80.95, "elapsed_time": "2:58:26", "remaining_time": "0:41:59"}
69
+ {"current_steps": 69, "total_steps": 84, "loss": 0.6749, "lr": 7.639320225002106e-06, "epoch": 2.4295010845986984, "percentage": 82.14, "elapsed_time": "3:00:59", "remaining_time": "0:39:20"}
70
+ {"current_steps": 70, "total_steps": 84, "loss": 0.6752, "lr": 6.6831503715960235e-06, "epoch": 2.4642082429501087, "percentage": 83.33, "elapsed_time": "3:03:33", "remaining_time": "0:36:42"}
71
+ {"current_steps": 71, "total_steps": 84, "loss": 0.6781, "lr": 5.785429593579736e-06, "epoch": 2.4989154013015185, "percentage": 84.52, "elapsed_time": "3:06:06", "remaining_time": "0:34:04"}
72
+ {"current_steps": 72, "total_steps": 84, "loss": 0.6716, "lr": 4.947732798245466e-06, "epoch": 2.5336225596529283, "percentage": 85.71, "elapsed_time": "3:08:40", "remaining_time": "0:31:26"}
73
+ {"current_steps": 73, "total_steps": 84, "loss": 0.6779, "lr": 4.171529590423484e-06, "epoch": 2.5683297180043385, "percentage": 86.9, "elapsed_time": "3:11:13", "remaining_time": "0:28:48"}
74
+ {"current_steps": 74, "total_steps": 84, "loss": 0.6805, "lr": 3.458181694295961e-06, "epoch": 2.6030368763557483, "percentage": 88.1, "elapsed_time": "3:13:47", "remaining_time": "0:26:11"}
75
+ {"current_steps": 75, "total_steps": 84, "loss": 0.6719, "lr": 2.8089405644699463e-06, "epoch": 2.6377440347071586, "percentage": 89.29, "elapsed_time": "3:16:21", "remaining_time": "0:23:33"}
76
+ {"current_steps": 76, "total_steps": 84, "loss": 0.675, "lr": 2.2249451905007603e-06, "epoch": 2.6724511930585684, "percentage": 90.48, "elapsed_time": "3:18:54", "remaining_time": "0:20:56"}
77
+ {"current_steps": 77, "total_steps": 84, "loss": 0.6767, "lr": 1.7072200987173105e-06, "epoch": 2.707158351409978, "percentage": 91.67, "elapsed_time": "3:21:26", "remaining_time": "0:18:18"}
78
+ {"current_steps": 78, "total_steps": 84, "loss": 0.6633, "lr": 1.256673554854757e-06, "epoch": 2.7418655097613884, "percentage": 92.86, "elapsed_time": "3:23:59", "remaining_time": "0:15:41"}
79
+ {"current_steps": 79, "total_steps": 84, "loss": 0.6672, "lr": 8.740959706477725e-07, "epoch": 2.7765726681127982, "percentage": 94.05, "elapsed_time": "3:26:32", "remaining_time": "0:13:04"}
80
+ {"current_steps": 80, "total_steps": 84, "loss": 0.6708, "lr": 5.601585171798052e-07, "epoch": 2.811279826464208, "percentage": 95.24, "elapsed_time": "3:29:05", "remaining_time": "0:10:27"}
81
+ {"current_steps": 81, "total_steps": 84, "loss": 0.6748, "lr": 3.154119474208894e-07, "epoch": 2.8459869848156183, "percentage": 96.43, "elapsed_time": "3:31:38", "remaining_time": "0:07:50"}
82
+ {"current_steps": 82, "total_steps": 84, "loss": 0.6686, "lr": 1.402856300198252e-07, "epoch": 2.880694143167028, "percentage": 97.62, "elapsed_time": "3:34:10", "remaining_time": "0:05:13"}
83
+ {"current_steps": 83, "total_steps": 84, "loss": 0.662, "lr": 3.5086796045664674e-08, "epoch": 2.915401301518438, "percentage": 98.81, "elapsed_time": "3:36:43", "remaining_time": "0:02:36"}
84
+ {"current_steps": 84, "total_steps": 84, "loss": 0.673, "lr": 0.0, "epoch": 2.950108459869848, "percentage": 100.0, "elapsed_time": "3:39:16", "remaining_time": "0:00:00"}
85
+ {"current_steps": 84, "total_steps": 84, "epoch": 2.950108459869848, "percentage": 100.0, "elapsed_time": "3:40:52", "remaining_time": "0:00:00"}