gsmyrnis committed on
Commit
5bc5d8a
·
verified ·
1 Parent(s): 6cdeb69

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d342769bd0d625835bfc4b1faab9d9553676c96406c992b80c11d1958be3849a
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a537b6f027ee023fc8b4b26067badd6d727c75a767853e8a0f0799dd7fb3cbf
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb4c0941f386ea7d339f2851f5779cbeeaad508628b9dde7128c3d3753aef2ad
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f65c4501a1b9106ab001d1bf86b432001460ea3e52c36c42ccc0fe6d27d92df8
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:576f455eb39585b6b297da286a43eac88d90f2fb1f97fa36c3c866a8d862a9ec
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebc57c3b27eb73f03dd3e240012d448af57dcd734dc2ecbdd7f5d8fc917a128a
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:318312ff802138afbbe146d43f67d191d2a01dcd6519bf00e123270cbbc57f6a
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32e8f754a67891a52409b9f4f81611260d066c8ec08971fe86c0739e21ff2672
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -57,3 +57,29 @@
57
  {"current_steps": 550, "total_steps": 819, "loss": 0.6558, "learning_rate": 5e-06, "epoch": 2.0146520146520146, "percentage": 67.16, "elapsed_time": "1:00:45", "remaining_time": "0:29:42"}
58
  {"current_steps": 560, "total_steps": 819, "loss": 0.6295, "learning_rate": 5e-06, "epoch": 2.051282051282051, "percentage": 68.38, "elapsed_time": "1:01:47", "remaining_time": "0:28:34"}
59
  {"current_steps": 570, "total_steps": 819, "loss": 0.6286, "learning_rate": 5e-06, "epoch": 2.087912087912088, "percentage": 69.6, "elapsed_time": "1:02:48", "remaining_time": "0:27:26"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  {"current_steps": 550, "total_steps": 819, "loss": 0.6558, "learning_rate": 5e-06, "epoch": 2.0146520146520146, "percentage": 67.16, "elapsed_time": "1:00:45", "remaining_time": "0:29:42"}
58
  {"current_steps": 560, "total_steps": 819, "loss": 0.6295, "learning_rate": 5e-06, "epoch": 2.051282051282051, "percentage": 68.38, "elapsed_time": "1:01:47", "remaining_time": "0:28:34"}
59
  {"current_steps": 570, "total_steps": 819, "loss": 0.6286, "learning_rate": 5e-06, "epoch": 2.087912087912088, "percentage": 69.6, "elapsed_time": "1:02:48", "remaining_time": "0:27:26"}
60
+ {"current_steps": 580, "total_steps": 819, "loss": 0.6314, "learning_rate": 5e-06, "epoch": 2.1245421245421245, "percentage": 70.82, "elapsed_time": "1:03:50", "remaining_time": "0:26:18"}
61
+ {"current_steps": 590, "total_steps": 819, "loss": 0.6283, "learning_rate": 5e-06, "epoch": 2.161172161172161, "percentage": 72.04, "elapsed_time": "1:04:52", "remaining_time": "0:25:10"}
62
+ {"current_steps": 600, "total_steps": 819, "loss": 0.6314, "learning_rate": 5e-06, "epoch": 2.197802197802198, "percentage": 73.26, "elapsed_time": "1:05:54", "remaining_time": "0:24:03"}
63
+ {"current_steps": 610, "total_steps": 819, "loss": 0.6335, "learning_rate": 5e-06, "epoch": 2.2344322344322345, "percentage": 74.48, "elapsed_time": "1:06:56", "remaining_time": "0:22:55"}
64
+ {"current_steps": 620, "total_steps": 819, "loss": 0.6357, "learning_rate": 5e-06, "epoch": 2.271062271062271, "percentage": 75.7, "elapsed_time": "1:07:58", "remaining_time": "0:21:48"}
65
+ {"current_steps": 630, "total_steps": 819, "loss": 0.633, "learning_rate": 5e-06, "epoch": 2.3076923076923075, "percentage": 76.92, "elapsed_time": "1:09:00", "remaining_time": "0:20:42"}
66
+ {"current_steps": 640, "total_steps": 819, "loss": 0.6349, "learning_rate": 5e-06, "epoch": 2.3443223443223444, "percentage": 78.14, "elapsed_time": "1:10:03", "remaining_time": "0:19:35"}
67
+ {"current_steps": 650, "total_steps": 819, "loss": 0.6358, "learning_rate": 5e-06, "epoch": 2.380952380952381, "percentage": 79.37, "elapsed_time": "1:11:05", "remaining_time": "0:18:29"}
68
+ {"current_steps": 660, "total_steps": 819, "loss": 0.634, "learning_rate": 5e-06, "epoch": 2.4175824175824174, "percentage": 80.59, "elapsed_time": "1:12:08", "remaining_time": "0:17:22"}
69
+ {"current_steps": 670, "total_steps": 819, "loss": 0.6332, "learning_rate": 5e-06, "epoch": 2.4542124542124544, "percentage": 81.81, "elapsed_time": "1:13:10", "remaining_time": "0:16:16"}
70
+ {"current_steps": 680, "total_steps": 819, "loss": 0.636, "learning_rate": 5e-06, "epoch": 2.490842490842491, "percentage": 83.03, "elapsed_time": "1:14:12", "remaining_time": "0:15:10"}
71
+ {"current_steps": 690, "total_steps": 819, "loss": 0.6342, "learning_rate": 5e-06, "epoch": 2.5274725274725274, "percentage": 84.25, "elapsed_time": "1:15:14", "remaining_time": "0:14:04"}
72
+ {"current_steps": 700, "total_steps": 819, "loss": 0.6333, "learning_rate": 5e-06, "epoch": 2.564102564102564, "percentage": 85.47, "elapsed_time": "1:16:18", "remaining_time": "0:12:58"}
73
+ {"current_steps": 710, "total_steps": 819, "loss": 0.6373, "learning_rate": 5e-06, "epoch": 2.600732600732601, "percentage": 86.69, "elapsed_time": "1:17:19", "remaining_time": "0:11:52"}
74
+ {"current_steps": 720, "total_steps": 819, "loss": 0.6364, "learning_rate": 5e-06, "epoch": 2.6373626373626373, "percentage": 87.91, "elapsed_time": "1:18:21", "remaining_time": "0:10:46"}
75
+ {"current_steps": 730, "total_steps": 819, "loss": 0.6382, "learning_rate": 5e-06, "epoch": 2.6739926739926743, "percentage": 89.13, "elapsed_time": "1:19:23", "remaining_time": "0:09:40"}
76
+ {"current_steps": 740, "total_steps": 819, "loss": 0.638, "learning_rate": 5e-06, "epoch": 2.7106227106227108, "percentage": 90.35, "elapsed_time": "1:20:26", "remaining_time": "0:08:35"}
77
+ {"current_steps": 750, "total_steps": 819, "loss": 0.6349, "learning_rate": 5e-06, "epoch": 2.7472527472527473, "percentage": 91.58, "elapsed_time": "1:21:27", "remaining_time": "0:07:29"}
78
+ {"current_steps": 760, "total_steps": 819, "loss": 0.6379, "learning_rate": 5e-06, "epoch": 2.7838827838827838, "percentage": 92.8, "elapsed_time": "1:22:31", "remaining_time": "0:06:24"}
79
+ {"current_steps": 770, "total_steps": 819, "loss": 0.6337, "learning_rate": 5e-06, "epoch": 2.8205128205128203, "percentage": 94.02, "elapsed_time": "1:23:32", "remaining_time": "0:05:18"}
80
+ {"current_steps": 780, "total_steps": 819, "loss": 0.641, "learning_rate": 5e-06, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "1:24:34", "remaining_time": "0:04:13"}
81
+ {"current_steps": 790, "total_steps": 819, "loss": 0.6388, "learning_rate": 5e-06, "epoch": 2.8937728937728937, "percentage": 96.46, "elapsed_time": "1:25:36", "remaining_time": "0:03:08"}
82
+ {"current_steps": 800, "total_steps": 819, "loss": 0.6369, "learning_rate": 5e-06, "epoch": 2.9304029304029307, "percentage": 97.68, "elapsed_time": "1:26:38", "remaining_time": "0:02:03"}
83
+ {"current_steps": 810, "total_steps": 819, "loss": 0.6421, "learning_rate": 5e-06, "epoch": 2.967032967032967, "percentage": 98.9, "elapsed_time": "1:27:40", "remaining_time": "0:00:58"}
84
+ {"current_steps": 819, "total_steps": 819, "eval_loss": 0.7364696264266968, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:30:32", "remaining_time": "0:00:00"}
85
+ {"current_steps": 819, "total_steps": 819, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:32:12", "remaining_time": "0:00:00"}