sedrickkeh committed on
Commit
4c44fd1
·
verified ·
1 Parent(s): add530d

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ed45c2c2c09ae999c217bc91cd11c59d937ca3774476089717648cf8243d2bd
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae8372ba8f6288205de9483178b0accd16a3c7386dfc92e560836c806c59c8cc
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3880602b3f41a174a4b269ce07b78e2073d5bf5cf647422b208e356ad9a137ea
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77511d7d0a6a3e40e347ce893ac93905fcd087968851600b8cfdf25904fc4da7
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6647ecb9d50b5c8e57778c7d22b13c0763900abbda47da31d7f2eca16deac781
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56db0b0c8a64add581633f0ea3dd135310b0556fcbc6d1d09e2149a40cce0dbf
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:824e6bc1ad01d94a3e193f6c67670562182a0d45139e7775e4f0f0558718f10c
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c76f4ff81c21082ed12fcc3759c9402a939d6d91a79ce4b24fa76f5b5412d7f
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -52,3 +52,25 @@
52
  {"current_steps": 52, "total_steps": 75, "loss": 0.8763, "lr": 2.636557474057173e-06, "epoch": 2.0064308681672025, "percentage": 69.33, "elapsed_time": "0:45:08", "remaining_time": "0:19:58"}
53
  {"current_steps": 53, "total_steps": 75, "loss": 0.8473, "lr": 2.4326290324257896e-06, "epoch": 2.045016077170418, "percentage": 70.67, "elapsed_time": "0:46:09", "remaining_time": "0:19:09"}
54
  {"current_steps": 54, "total_steps": 75, "loss": 0.7919, "lr": 2.234344229374003e-06, "epoch": 2.0836012861736335, "percentage": 72.0, "elapsed_time": "0:47:01", "remaining_time": "0:18:17"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52
  {"current_steps": 52, "total_steps": 75, "loss": 0.8763, "lr": 2.636557474057173e-06, "epoch": 2.0064308681672025, "percentage": 69.33, "elapsed_time": "0:45:08", "remaining_time": "0:19:58"}
53
  {"current_steps": 53, "total_steps": 75, "loss": 0.8473, "lr": 2.4326290324257896e-06, "epoch": 2.045016077170418, "percentage": 70.67, "elapsed_time": "0:46:09", "remaining_time": "0:19:09"}
54
  {"current_steps": 54, "total_steps": 75, "loss": 0.7919, "lr": 2.234344229374003e-06, "epoch": 2.0836012861736335, "percentage": 72.0, "elapsed_time": "0:47:01", "remaining_time": "0:18:17"}
55
+ {"current_steps": 55, "total_steps": 75, "loss": 0.8196, "lr": 2.042138937932388e-06, "epoch": 2.122186495176849, "percentage": 73.33, "elapsed_time": "0:47:50", "remaining_time": "0:17:23"}
56
+ {"current_steps": 56, "total_steps": 75, "loss": 0.7881, "lr": 1.856435667045577e-06, "epoch": 2.1607717041800645, "percentage": 74.67, "elapsed_time": "0:48:34", "remaining_time": "0:16:28"}
57
+ {"current_steps": 57, "total_steps": 75, "loss": 0.8631, "lr": 1.677642632805892e-06, "epoch": 2.19935691318328, "percentage": 76.0, "elapsed_time": "0:49:29", "remaining_time": "0:15:37"}
58
+ {"current_steps": 58, "total_steps": 75, "loss": 0.7746, "lr": 1.5061528611057917e-06, "epoch": 2.237942122186495, "percentage": 77.33, "elapsed_time": "0:50:13", "remaining_time": "0:14:43"}
59
+ {"current_steps": 59, "total_steps": 75, "loss": 0.8119, "lr": 1.3423433236816563e-06, "epoch": 2.2765273311897105, "percentage": 78.67, "elapsed_time": "0:51:06", "remaining_time": "0:13:51"}
60
+ {"current_steps": 60, "total_steps": 75, "loss": 0.8375, "lr": 1.186574109448091e-06, "epoch": 2.315112540192926, "percentage": 80.0, "elapsed_time": "0:51:52", "remaining_time": "0:12:58"}
61
+ {"current_steps": 61, "total_steps": 75, "loss": 0.7619, "lr": 1.0391876329443534e-06, "epoch": 2.3536977491961415, "percentage": 81.33, "elapsed_time": "0:52:36", "remaining_time": "0:12:04"}
62
+ {"current_steps": 62, "total_steps": 75, "loss": 0.8132, "lr": 9.005078816328772e-07, "epoch": 2.392282958199357, "percentage": 82.67, "elapsed_time": "0:53:34", "remaining_time": "0:11:13"}
63
+ {"current_steps": 63, "total_steps": 75, "loss": 0.7784, "lr": 7.708397037045129e-07, "epoch": 2.4308681672025725, "percentage": 84.0, "elapsed_time": "0:54:23", "remaining_time": "0:10:21"}
64
+ {"current_steps": 64, "total_steps": 75, "loss": 0.8832, "lr": 6.50468137956049e-07, "epoch": 2.469453376205788, "percentage": 85.33, "elapsed_time": "0:55:16", "remaining_time": "0:09:29"}
65
+ {"current_steps": 65, "total_steps": 75, "loss": 0.8102, "lr": 5.396577872130676e-07, "epoch": 2.508038585209003, "percentage": 86.67, "elapsed_time": "0:56:07", "remaining_time": "0:08:38"}
66
+ {"current_steps": 66, "total_steps": 75, "loss": 0.7881, "lr": 4.386522366755169e-07, "epoch": 2.5466237942122185, "percentage": 88.0, "elapsed_time": "0:57:00", "remaining_time": "0:07:46"}
67
+ {"current_steps": 67, "total_steps": 75, "loss": 0.8807, "lr": 3.4767351846456744e-07, "epoch": 2.585209003215434, "percentage": 89.33, "elapsed_time": "0:57:53", "remaining_time": "0:06:54"}
68
+ {"current_steps": 68, "total_steps": 75, "loss": 0.7756, "lr": 2.669216235478295e-07, "epoch": 2.6237942122186495, "percentage": 90.67, "elapsed_time": "0:58:42", "remaining_time": "0:06:02"}
69
+ {"current_steps": 69, "total_steps": 75, "loss": 0.8685, "lr": 1.9657406211579966e-07, "epoch": 2.662379421221865, "percentage": 92.0, "elapsed_time": "0:59:29", "remaining_time": "0:05:10"}
70
+ {"current_steps": 70, "total_steps": 75, "loss": 0.7501, "lr": 1.3678547337593494e-07, "epoch": 2.7009646302250805, "percentage": 93.33, "elapsed_time": "1:00:09", "remaining_time": "0:04:17"}
71
+ {"current_steps": 71, "total_steps": 75, "loss": 0.8121, "lr": 8.768728562211948e-08, "epoch": 2.739549839228296, "percentage": 94.67, "elapsed_time": "1:00:59", "remaining_time": "0:03:26"}
72
+ {"current_steps": 72, "total_steps": 75, "loss": 0.7776, "lr": 4.9387427326745287e-08, "epoch": 2.778135048231511, "percentage": 96.0, "elapsed_time": "1:01:41", "remaining_time": "0:02:34"}
73
+ {"current_steps": 73, "total_steps": 75, "loss": 0.8149, "lr": 2.1970089890509527e-08, "epoch": 2.816720257234727, "percentage": 97.33, "elapsed_time": "1:02:33", "remaining_time": "0:01:42"}
74
+ {"current_steps": 74, "total_steps": 75, "loss": 0.8291, "lr": 5.495542571443135e-09, "epoch": 2.855305466237942, "percentage": 98.67, "elapsed_time": "1:03:23", "remaining_time": "0:00:51"}
75
+ {"current_steps": 75, "total_steps": 75, "loss": 0.8268, "lr": 0.0, "epoch": 2.8938906752411575, "percentage": 100.0, "elapsed_time": "1:04:05", "remaining_time": "0:00:00"}
76
+ {"current_steps": 75, "total_steps": 75, "epoch": 2.8938906752411575, "percentage": 100.0, "elapsed_time": "1:06:12", "remaining_time": "0:00:00"}