sedrickkeh commited on
Commit
2aad27f
·
verified ·
1 Parent(s): 21796be

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1dddcee50038615ff789118a04b387edad35cc1841d90f8aaff750237de4e8a1
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a746ce57a143285df0995e2c303c0788e992f64bf845a1eea9ba6ad07ca8f885
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8089f1189da15318742f10573736324f72332e06a0744e22feb598366ae6f9a6
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:094c2740982f3d968f2a165b29e4072697bdd2bed1bc055a97db6c024804f4bc
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7f95d26d388a3b35136923a13c5de874b510861bee8ab53115dc96906f073fb
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9f124e5da760974f5acfc6e31d6363342aefde9507dab1d91ed68f286f530c5
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:110ed368c632ef3f4341328284cf7f0739fbeabf07264a6566aa97a723c442db
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5af6f28757c25fbbaf0500d437b73effec793601270c2ae6bbaff05e6a3dfb26
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -65,3 +65,36 @@
65
  {"current_steps": 640, "total_steps": 981, "loss": 0.7075, "lr": 5e-06, "epoch": 1.9564386702330914, "percentage": 65.24, "elapsed_time": "10:25:02", "remaining_time": "5:33:01"}
66
  {"current_steps": 650, "total_steps": 981, "loss": 0.7082, "lr": 5e-06, "epoch": 1.9870080244554833, "percentage": 66.26, "elapsed_time": "10:34:41", "remaining_time": "5:23:12"}
67
  {"current_steps": 654, "total_steps": 981, "eval_loss": 0.7433667182922363, "epoch": 1.9992357661444402, "percentage": 66.67, "elapsed_time": "10:44:34", "remaining_time": "5:22:17"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  {"current_steps": 640, "total_steps": 981, "loss": 0.7075, "lr": 5e-06, "epoch": 1.9564386702330914, "percentage": 65.24, "elapsed_time": "10:25:02", "remaining_time": "5:33:01"}
66
  {"current_steps": 650, "total_steps": 981, "loss": 0.7082, "lr": 5e-06, "epoch": 1.9870080244554833, "percentage": 66.26, "elapsed_time": "10:34:41", "remaining_time": "5:23:12"}
67
  {"current_steps": 654, "total_steps": 981, "eval_loss": 0.7433667182922363, "epoch": 1.9992357661444402, "percentage": 66.67, "elapsed_time": "10:44:34", "remaining_time": "5:22:17"}
68
+ {"current_steps": 660, "total_steps": 981, "loss": 0.7384, "lr": 5e-06, "epoch": 2.0175773786778755, "percentage": 67.28, "elapsed_time": "10:51:20", "remaining_time": "5:16:47"}
69
+ {"current_steps": 670, "total_steps": 981, "loss": 0.6584, "lr": 5e-06, "epoch": 2.0481467329002676, "percentage": 68.3, "elapsed_time": "11:00:57", "remaining_time": "5:06:48"}
70
+ {"current_steps": 680, "total_steps": 981, "loss": 0.6626, "lr": 5e-06, "epoch": 2.0787160871226593, "percentage": 69.32, "elapsed_time": "11:10:38", "remaining_time": "4:56:51"}
71
+ {"current_steps": 690, "total_steps": 981, "loss": 0.6584, "lr": 5e-06, "epoch": 2.1092854413450515, "percentage": 70.34, "elapsed_time": "11:20:18", "remaining_time": "4:46:54"}
72
+ {"current_steps": 700, "total_steps": 981, "loss": 0.6637, "lr": 5e-06, "epoch": 2.1398547955674436, "percentage": 71.36, "elapsed_time": "11:29:57", "remaining_time": "4:36:58"}
73
+ {"current_steps": 710, "total_steps": 981, "loss": 0.664, "lr": 5e-06, "epoch": 2.1704241497898358, "percentage": 72.38, "elapsed_time": "11:39:37", "remaining_time": "4:27:02"}
74
+ {"current_steps": 720, "total_steps": 981, "loss": 0.6639, "lr": 5e-06, "epoch": 2.200993504012228, "percentage": 73.39, "elapsed_time": "11:49:18", "remaining_time": "4:17:07"}
75
+ {"current_steps": 730, "total_steps": 981, "loss": 0.6644, "lr": 5e-06, "epoch": 2.2315628582346196, "percentage": 74.41, "elapsed_time": "11:58:56", "remaining_time": "4:07:12"}
76
+ {"current_steps": 740, "total_steps": 981, "loss": 0.6597, "lr": 5e-06, "epoch": 2.262132212457012, "percentage": 75.43, "elapsed_time": "12:08:35", "remaining_time": "3:57:16"}
77
+ {"current_steps": 750, "total_steps": 981, "loss": 0.6649, "lr": 5e-06, "epoch": 2.292701566679404, "percentage": 76.45, "elapsed_time": "12:18:13", "remaining_time": "3:47:22"}
78
+ {"current_steps": 760, "total_steps": 981, "loss": 0.6659, "lr": 5e-06, "epoch": 2.323270920901796, "percentage": 77.47, "elapsed_time": "12:27:51", "remaining_time": "3:37:28"}
79
+ {"current_steps": 770, "total_steps": 981, "loss": 0.663, "lr": 5e-06, "epoch": 2.353840275124188, "percentage": 78.49, "elapsed_time": "12:37:30", "remaining_time": "3:27:34"}
80
+ {"current_steps": 780, "total_steps": 981, "loss": 0.6615, "lr": 5e-06, "epoch": 2.38440962934658, "percentage": 79.51, "elapsed_time": "12:47:10", "remaining_time": "3:17:41"}
81
+ {"current_steps": 790, "total_steps": 981, "loss": 0.6668, "lr": 5e-06, "epoch": 2.414978983568972, "percentage": 80.53, "elapsed_time": "12:56:50", "remaining_time": "3:07:49"}
82
+ {"current_steps": 800, "total_steps": 981, "loss": 0.6652, "lr": 5e-06, "epoch": 2.4455483377913643, "percentage": 81.55, "elapsed_time": "13:06:30", "remaining_time": "2:57:56"}
83
+ {"current_steps": 810, "total_steps": 981, "loss": 0.6658, "lr": 5e-06, "epoch": 2.476117692013756, "percentage": 82.57, "elapsed_time": "13:16:09", "remaining_time": "2:48:04"}
84
+ {"current_steps": 820, "total_steps": 981, "loss": 0.6652, "lr": 5e-06, "epoch": 2.506687046236148, "percentage": 83.59, "elapsed_time": "13:25:47", "remaining_time": "2:38:12"}
85
+ {"current_steps": 830, "total_steps": 981, "loss": 0.6667, "lr": 5e-06, "epoch": 2.5372564004585403, "percentage": 84.61, "elapsed_time": "13:35:26", "remaining_time": "2:28:21"}
86
+ {"current_steps": 840, "total_steps": 981, "loss": 0.6675, "lr": 5e-06, "epoch": 2.5678257546809324, "percentage": 85.63, "elapsed_time": "13:45:07", "remaining_time": "2:18:30"}
87
+ {"current_steps": 850, "total_steps": 981, "loss": 0.6645, "lr": 5e-06, "epoch": 2.5983951089033246, "percentage": 86.65, "elapsed_time": "13:54:45", "remaining_time": "2:08:38"}
88
+ {"current_steps": 860, "total_steps": 981, "loss": 0.6632, "lr": 5e-06, "epoch": 2.6289644631257163, "percentage": 87.67, "elapsed_time": "14:04:25", "remaining_time": "1:58:48"}
89
+ {"current_steps": 870, "total_steps": 981, "loss": 0.668, "lr": 5e-06, "epoch": 2.6595338173481085, "percentage": 88.69, "elapsed_time": "14:14:05", "remaining_time": "1:48:58"}
90
+ {"current_steps": 880, "total_steps": 981, "loss": 0.668, "lr": 5e-06, "epoch": 2.6901031715705006, "percentage": 89.7, "elapsed_time": "14:23:45", "remaining_time": "1:39:08"}
91
+ {"current_steps": 890, "total_steps": 981, "loss": 0.6673, "lr": 5e-06, "epoch": 2.7206725257928928, "percentage": 90.72, "elapsed_time": "14:33:25", "remaining_time": "1:29:18"}
92
+ {"current_steps": 900, "total_steps": 981, "loss": 0.6682, "lr": 5e-06, "epoch": 2.751241880015285, "percentage": 91.74, "elapsed_time": "14:43:04", "remaining_time": "1:19:28"}
93
+ {"current_steps": 910, "total_steps": 981, "loss": 0.6654, "lr": 5e-06, "epoch": 2.7818112342376766, "percentage": 92.76, "elapsed_time": "14:52:43", "remaining_time": "1:09:39"}
94
+ {"current_steps": 920, "total_steps": 981, "loss": 0.6644, "lr": 5e-06, "epoch": 2.8123805884600688, "percentage": 93.78, "elapsed_time": "15:02:24", "remaining_time": "0:59:49"}
95
+ {"current_steps": 930, "total_steps": 981, "loss": 0.6662, "lr": 5e-06, "epoch": 2.842949942682461, "percentage": 94.8, "elapsed_time": "15:12:04", "remaining_time": "0:50:01"}
96
+ {"current_steps": 940, "total_steps": 981, "loss": 0.6663, "lr": 5e-06, "epoch": 2.8735192969048526, "percentage": 95.82, "elapsed_time": "15:21:44", "remaining_time": "0:40:12"}
97
+ {"current_steps": 950, "total_steps": 981, "loss": 0.6658, "lr": 5e-06, "epoch": 2.904088651127245, "percentage": 96.84, "elapsed_time": "15:31:24", "remaining_time": "0:30:23"}
98
+ {"current_steps": 960, "total_steps": 981, "loss": 0.667, "lr": 5e-06, "epoch": 2.934658005349637, "percentage": 97.86, "elapsed_time": "15:41:04", "remaining_time": "0:20:35"}
99
+ {"current_steps": 970, "total_steps": 981, "loss": 0.6669, "lr": 5e-06, "epoch": 2.965227359572029, "percentage": 98.88, "elapsed_time": "15:50:45", "remaining_time": "0:10:46"}
100
+ {"current_steps": 980, "total_steps": 981, "loss": 0.6679, "lr": 5e-06, "epoch": 2.9957967137944213, "percentage": 99.9, "elapsed_time": "16:00:25", "remaining_time": "0:00:58"}