gsmyrnis committed on
Commit
09e5bbc
·
verified ·
1 Parent(s): c99be84

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24c1c260b46347fef5bafa7022310b64948edb4abcef50eed591068a760a81e3
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a43f104e1775942af666b232d8449cdae40373bc35ac9d345e19401d8ba345f8
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c727e0eedfabf298b540ac5d4c239a4584de171b74750d45745a92868ff40365
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64d530d8acb3019aaf9f9b8ea0240113efe4f18420abb3eef9960ff8596ec206
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7575a032a9d0535e438d2f7d26416cc759205e38598f2b822f722ed405117a5a
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67f67bcb9fb2b91c0d3e2bde068fe927fb9d0fb5f39a62162c782a9a2bd7f701
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b923b31ceff979cba485913dee8394ffc9124d56dcf8102f47cecbac59251e8
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92cc34a9ef33c76993067cd78ca40965a71f301005d7666baa523cc338773dae
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -80,3 +80,27 @@
80
  {"current_steps": 80, "total_steps": 105, "loss": 0.4355, "lr": 1.646076349303884e-06, "epoch": 2.2616822429906542, "percentage": 76.19, "elapsed_time": "0:20:30", "remaining_time": "0:06:24"}
81
  {"current_steps": 81, "total_steps": 105, "loss": 0.4345, "lr": 1.5240378616267887e-06, "epoch": 2.289719626168224, "percentage": 77.14, "elapsed_time": "0:20:45", "remaining_time": "0:06:09"}
82
  {"current_steps": 82, "total_steps": 105, "loss": 0.4131, "lr": 1.4058815806103542e-06, "epoch": 2.317757009345794, "percentage": 78.1, "elapsed_time": "0:21:03", "remaining_time": "0:05:54"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
80
  {"current_steps": 80, "total_steps": 105, "loss": 0.4355, "lr": 1.646076349303884e-06, "epoch": 2.2616822429906542, "percentage": 76.19, "elapsed_time": "0:20:30", "remaining_time": "0:06:24"}
81
  {"current_steps": 81, "total_steps": 105, "loss": 0.4345, "lr": 1.5240378616267887e-06, "epoch": 2.289719626168224, "percentage": 77.14, "elapsed_time": "0:20:45", "remaining_time": "0:06:09"}
82
  {"current_steps": 82, "total_steps": 105, "loss": 0.4131, "lr": 1.4058815806103542e-06, "epoch": 2.317757009345794, "percentage": 78.1, "elapsed_time": "0:21:03", "remaining_time": "0:05:54"}
83
+ {"current_steps": 83, "total_steps": 105, "loss": 0.4497, "lr": 1.2917394717602123e-06, "epoch": 2.3457943925233646, "percentage": 79.05, "elapsed_time": "0:21:17", "remaining_time": "0:05:38"}
84
+ {"current_steps": 84, "total_steps": 105, "loss": 0.4334, "lr": 1.1817390172633402e-06, "epoch": 2.3738317757009346, "percentage": 80.0, "elapsed_time": "0:21:31", "remaining_time": "0:05:22"}
85
+ {"current_steps": 85, "total_steps": 105, "loss": 0.4538, "lr": 1.0760030736066952e-06, "epoch": 2.4018691588785046, "percentage": 80.95, "elapsed_time": "0:21:43", "remaining_time": "0:05:06"}
86
+ {"current_steps": 86, "total_steps": 105, "loss": 0.4733, "lr": 9.746497343621857e-07, "epoch": 2.4299065420560746, "percentage": 81.9, "elapsed_time": "0:21:59", "remaining_time": "0:04:51"}
87
+ {"current_steps": 87, "total_steps": 105, "loss": 0.4268, "lr": 8.777921982911996e-07, "epoch": 2.457943925233645, "percentage": 82.86, "elapsed_time": "0:22:13", "remaining_time": "0:04:35"}
88
+ {"current_steps": 88, "total_steps": 105, "loss": 0.4249, "lr": 7.85538642916015e-07, "epoch": 2.485981308411215, "percentage": 83.81, "elapsed_time": "0:22:26", "remaining_time": "0:04:20"}
89
+ {"current_steps": 89, "total_steps": 105, "loss": 0.4666, "lr": 6.979921036993042e-07, "epoch": 2.514018691588785, "percentage": 84.76, "elapsed_time": "0:22:39", "remaining_time": "0:04:04"}
90
+ {"current_steps": 90, "total_steps": 105, "loss": 0.418, "lr": 6.152503589666426e-07, "epoch": 2.542056074766355, "percentage": 85.71, "elapsed_time": "0:22:53", "remaining_time": "0:03:48"}
91
+ {"current_steps": 91, "total_steps": 105, "loss": 0.4435, "lr": 5.374058207005945e-07, "epoch": 2.5700934579439254, "percentage": 86.67, "elapsed_time": "0:23:08", "remaining_time": "0:03:33"}
92
+ {"current_steps": 92, "total_steps": 105, "loss": 0.4282, "lr": 4.6454543132829653e-07, "epoch": 2.5981308411214954, "percentage": 87.62, "elapsed_time": "0:23:20", "remaining_time": "0:03:17"}
93
+ {"current_steps": 93, "total_steps": 105, "loss": 0.459, "lr": 3.9675056661785563e-07, "epoch": 2.6261682242990654, "percentage": 88.57, "elapsed_time": "0:23:29", "remaining_time": "0:03:01"}
94
+ {"current_steps": 94, "total_steps": 105, "loss": 0.4625, "lr": 3.340969447919873e-07, "epoch": 2.6542056074766354, "percentage": 89.52, "elapsed_time": "0:23:43", "remaining_time": "0:02:46"}
95
+ {"current_steps": 95, "total_steps": 105, "loss": 0.4631, "lr": 2.7665454196040665e-07, "epoch": 2.6822429906542054, "percentage": 90.48, "elapsed_time": "0:23:56", "remaining_time": "0:02:31"}
96
+ {"current_steps": 96, "total_steps": 105, "loss": 0.4534, "lr": 2.2448751396543788e-07, "epoch": 2.710280373831776, "percentage": 91.43, "elapsed_time": "0:24:07", "remaining_time": "0:02:15"}
97
+ {"current_steps": 97, "total_steps": 105, "loss": 0.4504, "lr": 1.776541247281177e-07, "epoch": 2.7383177570093458, "percentage": 92.38, "elapsed_time": "0:24:21", "remaining_time": "0:02:00"}
98
+ {"current_steps": 98, "total_steps": 105, "loss": 0.4242, "lr": 1.3620668117481471e-07, "epoch": 2.7663551401869158, "percentage": 93.33, "elapsed_time": "0:24:33", "remaining_time": "0:01:45"}
99
+ {"current_steps": 99, "total_steps": 105, "loss": 0.4748, "lr": 1.0019147481706626e-07, "epoch": 2.794392523364486, "percentage": 94.29, "elapsed_time": "0:24:48", "remaining_time": "0:01:30"}
100
+ {"current_steps": 100, "total_steps": 105, "loss": 0.4288, "lr": 6.964873004985717e-08, "epoch": 2.822429906542056, "percentage": 95.24, "elapsed_time": "0:25:04", "remaining_time": "0:01:15"}
101
+ {"current_steps": 101, "total_steps": 105, "loss": 0.4565, "lr": 4.461255922609986e-08, "epoch": 2.850467289719626, "percentage": 96.19, "elapsed_time": "0:25:16", "remaining_time": "0:01:00"}
102
+ {"current_steps": 102, "total_steps": 105, "loss": 0.4166, "lr": 2.511092455747932e-08, "epoch": 2.878504672897196, "percentage": 97.14, "elapsed_time": "0:25:30", "remaining_time": "0:00:45"}
103
+ {"current_steps": 103, "total_steps": 105, "loss": 0.4491, "lr": 1.1165606884234182e-08, "epoch": 2.906542056074766, "percentage": 98.1, "elapsed_time": "0:25:44", "remaining_time": "0:00:29"}
104
+ {"current_steps": 104, "total_steps": 105, "loss": 0.4313, "lr": 2.792181348726941e-09, "epoch": 2.9345794392523366, "percentage": 99.05, "elapsed_time": "0:25:57", "remaining_time": "0:00:14"}
105
+ {"current_steps": 105, "total_steps": 105, "loss": 0.4156, "lr": 0.0, "epoch": 2.9626168224299065, "percentage": 100.0, "elapsed_time": "0:26:10", "remaining_time": "0:00:00"}
106
+ {"current_steps": 105, "total_steps": 105, "epoch": 2.9626168224299065, "percentage": 100.0, "elapsed_time": "0:28:16", "remaining_time": "0:00:00"}