sedrickkeh commited on
Commit
d104ccf
·
verified ·
1 Parent(s): 3f6d666

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62fa2a92bced2365908dd7ed78ed58bd54a6fc9f9121aa25843a11f4da56a239
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0586ab732d5dfa6294a36350ad5089b4e583c40935e075da4fea1598d1669793
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ec5eaedebbbb22ffedd3b9478190026574263b228f195479d9fd1960964735f
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daadd2025e13840c03c2df5ed23d379ca9ca2de08090e20651cbe6c3fc947873
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8db6b9e7baeba74f526dd34ffc2828795206c1c192697db497664ce41a3c9318
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a8db170a9152799069643c131fc81f897461dcefae4972d3b7b22ab516a0d0c
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e531ffa2f0df8f7ac11eec973f18a64fc8feb7f0756fe9b89c725d4996fa8de
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd21de81a4a658528a28024c0a2800f33f521a47940a99abc94d55c6a4e97c37
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -55,3 +55,30 @@
55
  {"current_steps": 540, "total_steps": 822, "loss": 0.6805, "lr": 5e-06, "epoch": 1.968109339407745, "percentage": 65.69, "elapsed_time": "8:42:40", "remaining_time": "4:32:57"}
56
  {"current_steps": 548, "total_steps": 822, "eval_loss": 0.7187947630882263, "epoch": 1.9972665148063782, "percentage": 66.67, "elapsed_time": "8:55:51", "remaining_time": "4:27:55"}
57
  {"current_steps": 550, "total_steps": 822, "loss": 0.7193, "lr": 5e-06, "epoch": 2.0045558086560367, "percentage": 66.91, "elapsed_time": "8:58:21", "remaining_time": "4:26:14"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  {"current_steps": 540, "total_steps": 822, "loss": 0.6805, "lr": 5e-06, "epoch": 1.968109339407745, "percentage": 65.69, "elapsed_time": "8:42:40", "remaining_time": "4:32:57"}
56
  {"current_steps": 548, "total_steps": 822, "eval_loss": 0.7187947630882263, "epoch": 1.9972665148063782, "percentage": 66.67, "elapsed_time": "8:55:51", "remaining_time": "4:27:55"}
57
  {"current_steps": 550, "total_steps": 822, "loss": 0.7193, "lr": 5e-06, "epoch": 2.0045558086560367, "percentage": 66.91, "elapsed_time": "8:58:21", "remaining_time": "4:26:14"}
58
+ {"current_steps": 560, "total_steps": 822, "loss": 0.6233, "lr": 5e-06, "epoch": 2.041002277904328, "percentage": 68.13, "elapsed_time": "9:07:55", "remaining_time": "4:16:20"}
59
+ {"current_steps": 570, "total_steps": 822, "loss": 0.6283, "lr": 5e-06, "epoch": 2.0774487471526197, "percentage": 69.34, "elapsed_time": "9:17:29", "remaining_time": "4:06:28"}
60
+ {"current_steps": 580, "total_steps": 822, "loss": 0.6207, "lr": 5e-06, "epoch": 2.1138952164009113, "percentage": 70.56, "elapsed_time": "9:27:04", "remaining_time": "3:56:36"}
61
+ {"current_steps": 590, "total_steps": 822, "loss": 0.6244, "lr": 5e-06, "epoch": 2.150341685649203, "percentage": 71.78, "elapsed_time": "9:36:38", "remaining_time": "3:46:44"}
62
+ {"current_steps": 600, "total_steps": 822, "loss": 0.6258, "lr": 5e-06, "epoch": 2.1867881548974943, "percentage": 72.99, "elapsed_time": "9:46:13", "remaining_time": "3:36:54"}
63
+ {"current_steps": 610, "total_steps": 822, "loss": 0.628, "lr": 5e-06, "epoch": 2.223234624145786, "percentage": 74.21, "elapsed_time": "9:55:48", "remaining_time": "3:27:03"}
64
+ {"current_steps": 620, "total_steps": 822, "loss": 0.6264, "lr": 5e-06, "epoch": 2.2596810933940774, "percentage": 75.43, "elapsed_time": "10:05:22", "remaining_time": "3:17:14"}
65
+ {"current_steps": 630, "total_steps": 822, "loss": 0.6242, "lr": 5e-06, "epoch": 2.296127562642369, "percentage": 76.64, "elapsed_time": "10:14:57", "remaining_time": "3:07:25"}
66
+ {"current_steps": 640, "total_steps": 822, "loss": 0.6305, "lr": 5e-06, "epoch": 2.3325740318906605, "percentage": 77.86, "elapsed_time": "10:24:32", "remaining_time": "2:57:36"}
67
+ {"current_steps": 650, "total_steps": 822, "loss": 0.6297, "lr": 5e-06, "epoch": 2.369020501138952, "percentage": 79.08, "elapsed_time": "10:34:06", "remaining_time": "2:47:47"}
68
+ {"current_steps": 660, "total_steps": 822, "loss": 0.631, "lr": 5e-06, "epoch": 2.4054669703872436, "percentage": 80.29, "elapsed_time": "10:43:41", "remaining_time": "2:37:59"}
69
+ {"current_steps": 670, "total_steps": 822, "loss": 0.6264, "lr": 5e-06, "epoch": 2.4419134396355355, "percentage": 81.51, "elapsed_time": "10:53:15", "remaining_time": "2:28:12"}
70
+ {"current_steps": 680, "total_steps": 822, "loss": 0.6266, "lr": 5e-06, "epoch": 2.478359908883827, "percentage": 82.73, "elapsed_time": "11:02:49", "remaining_time": "2:18:24"}
71
+ {"current_steps": 690, "total_steps": 822, "loss": 0.6263, "lr": 5e-06, "epoch": 2.5148063781321186, "percentage": 83.94, "elapsed_time": "11:12:22", "remaining_time": "2:08:37"}
72
+ {"current_steps": 700, "total_steps": 822, "loss": 0.6317, "lr": 5e-06, "epoch": 2.55125284738041, "percentage": 85.16, "elapsed_time": "11:21:57", "remaining_time": "1:58:51"}
73
+ {"current_steps": 710, "total_steps": 822, "loss": 0.6264, "lr": 5e-06, "epoch": 2.5876993166287017, "percentage": 86.37, "elapsed_time": "11:31:32", "remaining_time": "1:49:05"}
74
+ {"current_steps": 720, "total_steps": 822, "loss": 0.6295, "lr": 5e-06, "epoch": 2.624145785876993, "percentage": 87.59, "elapsed_time": "11:41:06", "remaining_time": "1:39:19"}
75
+ {"current_steps": 730, "total_steps": 822, "loss": 0.6273, "lr": 5e-06, "epoch": 2.6605922551252847, "percentage": 88.81, "elapsed_time": "11:50:41", "remaining_time": "1:29:33"}
76
+ {"current_steps": 740, "total_steps": 822, "loss": 0.6328, "lr": 5e-06, "epoch": 2.6970387243735763, "percentage": 90.02, "elapsed_time": "12:00:15", "remaining_time": "1:19:48"}
77
+ {"current_steps": 750, "total_steps": 822, "loss": 0.6333, "lr": 5e-06, "epoch": 2.733485193621868, "percentage": 91.24, "elapsed_time": "12:09:50", "remaining_time": "1:10:03"}
78
+ {"current_steps": 760, "total_steps": 822, "loss": 0.6306, "lr": 5e-06, "epoch": 2.7699316628701594, "percentage": 92.46, "elapsed_time": "12:19:24", "remaining_time": "1:00:19"}
79
+ {"current_steps": 770, "total_steps": 822, "loss": 0.6338, "lr": 5e-06, "epoch": 2.806378132118451, "percentage": 93.67, "elapsed_time": "12:28:59", "remaining_time": "0:50:34"}
80
+ {"current_steps": 780, "total_steps": 822, "loss": 0.6352, "lr": 5e-06, "epoch": 2.8428246013667424, "percentage": 94.89, "elapsed_time": "12:38:33", "remaining_time": "0:40:50"}
81
+ {"current_steps": 790, "total_steps": 822, "loss": 0.6284, "lr": 5e-06, "epoch": 2.879271070615034, "percentage": 96.11, "elapsed_time": "12:48:08", "remaining_time": "0:31:06"}
82
+ {"current_steps": 800, "total_steps": 822, "loss": 0.6306, "lr": 5e-06, "epoch": 2.9157175398633255, "percentage": 97.32, "elapsed_time": "12:57:42", "remaining_time": "0:21:23"}
83
+ {"current_steps": 810, "total_steps": 822, "loss": 0.6402, "lr": 5e-06, "epoch": 2.9521640091116175, "percentage": 98.54, "elapsed_time": "13:07:16", "remaining_time": "0:11:39"}
84
+ {"current_steps": 820, "total_steps": 822, "loss": 0.6348, "lr": 5e-06, "epoch": 2.988610478359909, "percentage": 99.76, "elapsed_time": "13:16:51", "remaining_time": "0:01:56"}