sedrickkeh commited on
Commit
f92f79c
·
verified ·
1 Parent(s): 322487a

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b19d513d4e39409d115af008bad8a9f9fa745ba54bb723e3c205c0085aaa90a3
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f83b6ec3e0c440e893d30b0c1742fa41604a806777236bc2666e184a7becc32
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2b834512244613ab75b3132908bc629669f846da8b98c9655d9995772f5e92e
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ce5eea1dd417148f094d986a272fe5c0acbd8f0ab164fa256d8127dec312f77
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e764f4816a0ac0834983c10cd6ade7388d0f84241e1a25687c953b34570d4b0
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4fab5cc499300593d0ffde9ee3c478f56356b65d662f42f468d24bab782e3e1
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f0c9c7def3a2db0d32d77b71f8bc0ea4a361b582275f92d83ccc833efb50262
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10017a208b0ebc8bba8bdb1396e92834259e4f8d639ff9721af7dbbe835196f5
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -64,3 +64,34 @@
64
  {"current_steps": 630, "total_steps": 957, "loss": 0.6588, "lr": 5e-06, "epoch": 1.9733750978856697, "percentage": 65.83, "elapsed_time": "10:15:39", "remaining_time": "5:19:33"}
65
  {"current_steps": 638, "total_steps": 957, "eval_loss": 0.6915597319602966, "epoch": 1.9984338292873924, "percentage": 66.67, "elapsed_time": "10:29:32", "remaining_time": "5:14:46"}
66
  {"current_steps": 640, "total_steps": 957, "loss": 0.7005, "lr": 5e-06, "epoch": 2.004698512137823, "percentage": 66.88, "elapsed_time": "10:32:10", "remaining_time": "5:13:07"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
64
  {"current_steps": 630, "total_steps": 957, "loss": 0.6588, "lr": 5e-06, "epoch": 1.9733750978856697, "percentage": 65.83, "elapsed_time": "10:15:39", "remaining_time": "5:19:33"}
65
  {"current_steps": 638, "total_steps": 957, "eval_loss": 0.6915597319602966, "epoch": 1.9984338292873924, "percentage": 66.67, "elapsed_time": "10:29:32", "remaining_time": "5:14:46"}
66
  {"current_steps": 640, "total_steps": 957, "loss": 0.7005, "lr": 5e-06, "epoch": 2.004698512137823, "percentage": 66.88, "elapsed_time": "10:32:10", "remaining_time": "5:13:07"}
67
+ {"current_steps": 650, "total_steps": 957, "loss": 0.61, "lr": 5e-06, "epoch": 2.0360219263899766, "percentage": 67.92, "elapsed_time": "10:41:48", "remaining_time": "5:03:08"}
68
+ {"current_steps": 660, "total_steps": 957, "loss": 0.6129, "lr": 5e-06, "epoch": 2.06734534064213, "percentage": 68.97, "elapsed_time": "10:51:28", "remaining_time": "4:53:09"}
69
+ {"current_steps": 670, "total_steps": 957, "loss": 0.6073, "lr": 5e-06, "epoch": 2.0986687548942835, "percentage": 70.01, "elapsed_time": "11:01:08", "remaining_time": "4:43:12"}
70
+ {"current_steps": 680, "total_steps": 957, "loss": 0.6069, "lr": 5e-06, "epoch": 2.129992169146437, "percentage": 71.06, "elapsed_time": "11:10:47", "remaining_time": "4:33:15"}
71
+ {"current_steps": 690, "total_steps": 957, "loss": 0.6115, "lr": 5e-06, "epoch": 2.1613155833985904, "percentage": 72.1, "elapsed_time": "11:20:26", "remaining_time": "4:23:18"}
72
+ {"current_steps": 700, "total_steps": 957, "loss": 0.6083, "lr": 5e-06, "epoch": 2.192638997650744, "percentage": 73.15, "elapsed_time": "11:30:05", "remaining_time": "4:13:21"}
73
+ {"current_steps": 710, "total_steps": 957, "loss": 0.6055, "lr": 5e-06, "epoch": 2.2239624119028973, "percentage": 74.19, "elapsed_time": "11:39:44", "remaining_time": "4:03:25"}
74
+ {"current_steps": 720, "total_steps": 957, "loss": 0.612, "lr": 5e-06, "epoch": 2.255285826155051, "percentage": 75.24, "elapsed_time": "11:49:23", "remaining_time": "3:53:30"}
75
+ {"current_steps": 730, "total_steps": 957, "loss": 0.6119, "lr": 5e-06, "epoch": 2.2866092404072043, "percentage": 76.28, "elapsed_time": "11:59:03", "remaining_time": "3:43:35"}
76
+ {"current_steps": 740, "total_steps": 957, "loss": 0.6113, "lr": 5e-06, "epoch": 2.3179326546593577, "percentage": 77.32, "elapsed_time": "12:08:42", "remaining_time": "3:33:41"}
77
+ {"current_steps": 750, "total_steps": 957, "loss": 0.6111, "lr": 5e-06, "epoch": 2.349256068911511, "percentage": 78.37, "elapsed_time": "12:18:20", "remaining_time": "3:23:46"}
78
+ {"current_steps": 760, "total_steps": 957, "loss": 0.6121, "lr": 5e-06, "epoch": 2.3805794831636646, "percentage": 79.41, "elapsed_time": "12:27:59", "remaining_time": "3:13:53"}
79
+ {"current_steps": 770, "total_steps": 957, "loss": 0.6159, "lr": 5e-06, "epoch": 2.4119028974158185, "percentage": 80.46, "elapsed_time": "12:37:38", "remaining_time": "3:03:59"}
80
+ {"current_steps": 780, "total_steps": 957, "loss": 0.6142, "lr": 5e-06, "epoch": 2.443226311667972, "percentage": 81.5, "elapsed_time": "12:47:17", "remaining_time": "2:54:06"}
81
+ {"current_steps": 790, "total_steps": 957, "loss": 0.6181, "lr": 5e-06, "epoch": 2.4745497259201255, "percentage": 82.55, "elapsed_time": "12:56:56", "remaining_time": "2:44:14"}
82
+ {"current_steps": 800, "total_steps": 957, "loss": 0.6127, "lr": 5e-06, "epoch": 2.505873140172279, "percentage": 83.59, "elapsed_time": "13:06:34", "remaining_time": "2:34:21"}
83
+ {"current_steps": 810, "total_steps": 957, "loss": 0.6192, "lr": 5e-06, "epoch": 2.5371965544244324, "percentage": 84.64, "elapsed_time": "13:16:13", "remaining_time": "2:24:29"}
84
+ {"current_steps": 820, "total_steps": 957, "loss": 0.6098, "lr": 5e-06, "epoch": 2.568519968676586, "percentage": 85.68, "elapsed_time": "13:25:51", "remaining_time": "2:14:38"}
85
+ {"current_steps": 830, "total_steps": 957, "loss": 0.6126, "lr": 5e-06, "epoch": 2.5998433829287393, "percentage": 86.73, "elapsed_time": "13:35:28", "remaining_time": "2:04:46"}
86
+ {"current_steps": 840, "total_steps": 957, "loss": 0.618, "lr": 5e-06, "epoch": 2.6311667971808927, "percentage": 87.77, "elapsed_time": "13:45:06", "remaining_time": "1:54:55"}
87
+ {"current_steps": 850, "total_steps": 957, "loss": 0.6132, "lr": 5e-06, "epoch": 2.662490211433046, "percentage": 88.82, "elapsed_time": "13:54:45", "remaining_time": "1:45:04"}
88
+ {"current_steps": 860, "total_steps": 957, "loss": 0.6211, "lr": 5e-06, "epoch": 2.6938136256851997, "percentage": 89.86, "elapsed_time": "14:04:24", "remaining_time": "1:35:14"}
89
+ {"current_steps": 870, "total_steps": 957, "loss": 0.6072, "lr": 5e-06, "epoch": 2.725137039937353, "percentage": 90.91, "elapsed_time": "14:14:04", "remaining_time": "1:25:24"}
90
+ {"current_steps": 880, "total_steps": 957, "loss": 0.6181, "lr": 5e-06, "epoch": 2.7564604541895066, "percentage": 91.95, "elapsed_time": "14:23:43", "remaining_time": "1:15:34"}
91
+ {"current_steps": 890, "total_steps": 957, "loss": 0.6183, "lr": 5e-06, "epoch": 2.78778386844166, "percentage": 93.0, "elapsed_time": "14:33:23", "remaining_time": "1:05:44"}
92
+ {"current_steps": 900, "total_steps": 957, "loss": 0.6185, "lr": 5e-06, "epoch": 2.8191072826938135, "percentage": 94.04, "elapsed_time": "14:43:02", "remaining_time": "0:55:55"}
93
+ {"current_steps": 910, "total_steps": 957, "loss": 0.6113, "lr": 5e-06, "epoch": 2.850430696945967, "percentage": 95.09, "elapsed_time": "14:52:41", "remaining_time": "0:46:06"}
94
+ {"current_steps": 920, "total_steps": 957, "loss": 0.613, "lr": 5e-06, "epoch": 2.881754111198121, "percentage": 96.13, "elapsed_time": "15:02:20", "remaining_time": "0:36:17"}
95
+ {"current_steps": 930, "total_steps": 957, "loss": 0.6178, "lr": 5e-06, "epoch": 2.913077525450274, "percentage": 97.18, "elapsed_time": "15:12:00", "remaining_time": "0:26:28"}
96
+ {"current_steps": 940, "total_steps": 957, "loss": 0.6157, "lr": 5e-06, "epoch": 2.9444009397024278, "percentage": 98.22, "elapsed_time": "15:21:40", "remaining_time": "0:16:40"}
97
+ {"current_steps": 950, "total_steps": 957, "loss": 0.6176, "lr": 5e-06, "epoch": 2.975724353954581, "percentage": 99.27, "elapsed_time": "15:31:18", "remaining_time": "0:06:51"}