reinhardh commited on
Commit
2088f0a
·
verified ·
1 Parent(s): 6912e3c

Training in progress, epoch 6

Browse files
model-00001-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:912dadbd6b55ac970f8b9ab628efc262fc0861543718de61ec80de6d9ab2b5bf
3
  size 4891730992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6010c3932025f4568eb143d3f0e3fca015aa985410b86af4cd245eeedbb4042e
3
  size 4891730992
model-00002-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b777475232ff78b11fee9ea24cf971079affb7c6db65cdf7f54b8a6d30bc7e12
3
  size 4876059352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5da985f22413e8503769440a44dd50b77537ae0511a1fb935106ecb9e9f7b214
3
  size 4876059352
model-00003-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f42c75bb334ef46a4e22f7b3f4ab83d0e35bc3089eaa2fb5a66d1d8f5af89da
3
  size 4876059384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0d50f7d2b47a57c2084ba091c5cea46c82bbc66606c426a4392d691af32904b
3
  size 4876059384
model-00004-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2574b3e523c5f2d3e78ebe41c12c81e4691aa9957f9cde2010dfc732300eb464
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d68d7c5fd03a4b1be1528bb0d9176d5fc696e963fee140d1b9b7354bd8c359ec
3
  size 4876059416
model-00005-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f64ce35f60471d32bbee808c2c9d4394e3f9a3daee7973ce9055e9f47d1b29f1
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a357f9418f51c2d78df09fa03c7512c97848f71354aaf95714414711e81462a
3
  size 4876059416
model-00006-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e3ed685f16672e4278544c9db285d9d67ffe2371fea989194f195587c04ab62
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a67484f605266730a80cad1b910632fb3248515bbd4d2d3f4534f49dac83e21
3
  size 4876059416
model-00007-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe94db3dea949988f94086a7c3f4029be1cbc20a9d5ff9f35eddba6f85c4f712
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e443c31e3f3af4ad91a0198419a2ede8cc7625922781a6dc760b51142e3d1da
3
  size 4876059416
model-00008-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f024b0708af17687d8d2929f8b9ec69ee22d2504e3b40e3109a418d8da743a77
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59f2debb0b6a469ec4ce49c30f7440b655685738ebbcb32c8c04051328df8780
3
  size 4876059416
model-00009-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dba2b9caccb961497226cd119288817b031b396d6917d1b319294a7e0f6159e
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d72fc8a34b9aa43926d7e82862bebb359ce4fb7daa4f97840a1e390d734ab899
3
  size 4876059416
model-00010-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d7a52600be7604e801269bfa8737820277e8c82827d7acc155faac627096dd2
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32d33c7415b852b204e087a4dccccba93701361132331f5c4c56158b5c1c01ad
3
  size 4876059416
model-00011-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0185e7afa403e1fa1ca82f6bf9a8af5bc69c06798a89b4655a4d2c219aecaf3a
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edd28be8fa042b7e2af2a38f13e2ec5afacdcf814173e23db2192dabbe0cbded
3
  size 4876059416
model-00012-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12a0fddcd89c389dc3b028f5a167203c24cac7f4fc07d7d296a8c3294a815226
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cddb7d84aa2109da78416c80e231e7ec280e2e057c19d3e1e4f977da36c207a
3
  size 4876059416
model-00013-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1aca548c8ad40ef0e3845cd672a801780f09151417265ac5776471ac31aeef3c
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f7bdcf685cd7c3f9049e0814301c3ecef7ad9e4bc2b1b91ec4569154e3db88d
3
  size 4876059416
model-00014-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:301e9b65e5a942e2e1c2a7b94c6709772f8d21e378c581de1f1a34869b9185c9
3
  size 2123397800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9810e7dab886dceffbbf245c30095a6f0aab89cd39b8763b63699a5d303121a4
3
  size 2123397800
trainer_log.jsonl CHANGED
@@ -29,3 +29,43 @@
29
  {"current_steps": 29, "total_steps": 70, "loss": 0.3724, "lr": 1.4562106573531632e-05, "epoch": 2.761904761904762, "percentage": 41.43, "elapsed_time": "0:27:39", "remaining_time": "0:39:06"}
30
  {"current_steps": 30, "total_steps": 70, "loss": 0.356, "lr": 1.4112871031306118e-05, "epoch": 2.857142857142857, "percentage": 42.86, "elapsed_time": "0:28:22", "remaining_time": "0:37:49"}
31
  {"current_steps": 31, "total_steps": 70, "loss": 0.3729, "lr": 1.3653410243663953e-05, "epoch": 2.9523809523809526, "percentage": 44.29, "elapsed_time": "0:29:05", "remaining_time": "0:36:36"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
29
  {"current_steps": 29, "total_steps": 70, "loss": 0.3724, "lr": 1.4562106573531632e-05, "epoch": 2.761904761904762, "percentage": 41.43, "elapsed_time": "0:27:39", "remaining_time": "0:39:06"}
30
  {"current_steps": 30, "total_steps": 70, "loss": 0.356, "lr": 1.4112871031306118e-05, "epoch": 2.857142857142857, "percentage": 42.86, "elapsed_time": "0:28:22", "remaining_time": "0:37:49"}
31
  {"current_steps": 31, "total_steps": 70, "loss": 0.3729, "lr": 1.3653410243663953e-05, "epoch": 2.9523809523809526, "percentage": 44.29, "elapsed_time": "0:29:05", "remaining_time": "0:36:36"}
32
+ {"current_steps": 32, "total_steps": 70, "loss": 0.3332, "lr": 1.3184866502516846e-05, "epoch": 3.0476190476190474, "percentage": 45.71, "elapsed_time": "0:34:00", "remaining_time": "0:40:23"}
33
+ {"current_steps": 33, "total_steps": 70, "loss": 0.3045, "lr": 1.2708404681430054e-05, "epoch": 3.142857142857143, "percentage": 47.14, "elapsed_time": "0:34:41", "remaining_time": "0:38:53"}
34
+ {"current_steps": 34, "total_steps": 70, "loss": 0.2815, "lr": 1.2225209339563144e-05, "epoch": 3.238095238095238, "percentage": 48.57, "elapsed_time": "0:35:24", "remaining_time": "0:37:29"}
35
+ {"current_steps": 35, "total_steps": 70, "loss": 0.2993, "lr": 1.1736481776669307e-05, "epoch": 3.3333333333333335, "percentage": 50.0, "elapsed_time": "0:36:00", "remaining_time": "0:36:00"}
36
+ {"current_steps": 36, "total_steps": 70, "loss": 0.2955, "lr": 1.1243437046474854e-05, "epoch": 3.4285714285714284, "percentage": 51.43, "elapsed_time": "0:36:47", "remaining_time": "0:34:45"}
37
+ {"current_steps": 37, "total_steps": 70, "loss": 0.2987, "lr": 1.0747300935864245e-05, "epoch": 3.5238095238095237, "percentage": 52.86, "elapsed_time": "0:37:29", "remaining_time": "0:33:26"}
38
+ {"current_steps": 38, "total_steps": 70, "loss": 0.2944, "lr": 1.0249306917380731e-05, "epoch": 3.619047619047619, "percentage": 54.29, "elapsed_time": "0:38:09", "remaining_time": "0:32:07"}
39
+ {"current_steps": 39, "total_steps": 70, "loss": 0.2769, "lr": 9.750693082619274e-06, "epoch": 3.7142857142857144, "percentage": 55.71, "elapsed_time": "0:38:49", "remaining_time": "0:30:51"}
40
+ {"current_steps": 40, "total_steps": 70, "loss": 0.3137, "lr": 9.252699064135759e-06, "epoch": 3.8095238095238093, "percentage": 57.14, "elapsed_time": "0:39:25", "remaining_time": "0:29:33"}
41
+ {"current_steps": 41, "total_steps": 70, "loss": 0.2652, "lr": 8.756562953525151e-06, "epoch": 3.9047619047619047, "percentage": 58.57, "elapsed_time": "0:40:05", "remaining_time": "0:28:21"}
42
+ {"current_steps": 42, "total_steps": 70, "loss": 0.2901, "lr": 8.263518223330698e-06, "epoch": 4.0, "percentage": 60.0, "elapsed_time": "0:40:47", "remaining_time": "0:27:11"}
43
+ {"current_steps": 43, "total_steps": 70, "loss": 0.2513, "lr": 7.774790660436857e-06, "epoch": 4.095238095238095, "percentage": 61.43, "elapsed_time": "0:44:48", "remaining_time": "0:28:08"}
44
+ {"current_steps": 44, "total_steps": 70, "loss": 0.2517, "lr": 7.291595318569951e-06, "epoch": 4.190476190476191, "percentage": 62.86, "elapsed_time": "0:45:29", "remaining_time": "0:26:53"}
45
+ {"current_steps": 45, "total_steps": 70, "loss": 0.2496, "lr": 6.815133497483157e-06, "epoch": 4.285714285714286, "percentage": 64.29, "elapsed_time": "0:46:16", "remaining_time": "0:25:42"}
46
+ {"current_steps": 46, "total_steps": 70, "loss": 0.2777, "lr": 6.34658975633605e-06, "epoch": 4.380952380952381, "percentage": 65.71, "elapsed_time": "0:47:00", "remaining_time": "0:24:31"}
47
+ {"current_steps": 47, "total_steps": 70, "loss": 0.2519, "lr": 5.887128968693887e-06, "epoch": 4.476190476190476, "percentage": 67.14, "elapsed_time": "0:47:39", "remaining_time": "0:23:19"}
48
+ {"current_steps": 48, "total_steps": 70, "loss": 0.228, "lr": 5.43789342646837e-06, "epoch": 4.571428571428571, "percentage": 68.57, "elapsed_time": "0:48:24", "remaining_time": "0:22:11"}
49
+ {"current_steps": 49, "total_steps": 70, "loss": 0.2454, "lr": 5.000000000000003e-06, "epoch": 4.666666666666667, "percentage": 70.0, "elapsed_time": "0:48:59", "remaining_time": "0:20:59"}
50
+ {"current_steps": 50, "total_steps": 70, "loss": 0.2234, "lr": 4.5745373613424075e-06, "epoch": 4.761904761904762, "percentage": 71.43, "elapsed_time": "0:49:41", "remaining_time": "0:19:52"}
51
+ {"current_steps": 51, "total_steps": 70, "loss": 0.2155, "lr": 4.162563277652104e-06, "epoch": 4.857142857142857, "percentage": 72.86, "elapsed_time": "0:50:19", "remaining_time": "0:18:44"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.2527, "lr": 3.7651019814126656e-06, "epoch": 4.9523809523809526, "percentage": 74.29, "elapsed_time": "0:50:56", "remaining_time": "0:17:38"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.2293, "lr": 3.3831416240314085e-06, "epoch": 5.0476190476190474, "percentage": 75.71, "elapsed_time": "0:54:35", "remaining_time": "0:17:30"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.2281, "lr": 3.017631819139273e-06, "epoch": 5.142857142857143, "percentage": 77.14, "elapsed_time": "0:55:15", "remaining_time": "0:16:22"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.1992, "lr": 2.669481281701739e-06, "epoch": 5.238095238095238, "percentage": 78.57, "elapsed_time": "0:55:56", "remaining_time": "0:15:15"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.178, "lr": 2.339555568810221e-06, "epoch": 5.333333333333333, "percentage": 80.0, "elapsed_time": "0:56:30", "remaining_time": "0:14:07"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.2168, "lr": 2.0286749277707783e-06, "epoch": 5.428571428571429, "percentage": 81.43, "elapsed_time": "0:57:11", "remaining_time": "0:13:02"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.2271, "lr": 1.7376122568400533e-06, "epoch": 5.523809523809524, "percentage": 82.86, "elapsed_time": "0:57:52", "remaining_time": "0:11:58"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.2314, "lr": 1.467091183678444e-06, "epoch": 5.619047619047619, "percentage": 84.29, "elapsed_time": "0:58:31", "remaining_time": "0:10:54"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.1739, "lr": 1.2177842662977136e-06, "epoch": 5.714285714285714, "percentage": 85.71, "elapsed_time": "0:59:08", "remaining_time": "0:09:51"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.2262, "lr": 9.903113209758098e-07, "epoch": 5.809523809523809, "percentage": 87.14, "elapsed_time": "0:59:47", "remaining_time": "0:08:49"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.225, "lr": 7.852378812959227e-07, "epoch": 5.904761904761905, "percentage": 88.57, "elapsed_time": "1:00:31", "remaining_time": "0:07:48"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.2453, "lr": 6.030737921409169e-07, "epoch": 6.0, "percentage": 90.0, "elapsed_time": "1:01:16", "remaining_time": "0:06:48"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.2161, "lr": 4.4427194213859216e-07, "epoch": 6.095238095238095, "percentage": 91.43, "elapsed_time": "1:03:59", "remaining_time": "0:05:59"}
65
+ {"current_steps": 65, "total_steps": 70, "loss": 0.1761, "lr": 3.0922713770922155e-07, "epoch": 6.190476190476191, "percentage": 92.86, "elapsed_time": "1:04:47", "remaining_time": "0:04:59"}
66
+ {"current_steps": 66, "total_steps": 70, "loss": 0.1877, "lr": 1.9827512151456175e-07, "epoch": 6.285714285714286, "percentage": 94.29, "elapsed_time": "1:05:26", "remaining_time": "0:03:57"}
67
+ {"current_steps": 67, "total_steps": 70, "loss": 0.223, "lr": 1.1169173774871478e-07, "epoch": 6.380952380952381, "percentage": 95.71, "elapsed_time": "1:06:08", "remaining_time": "0:02:57"}
68
+ {"current_steps": 68, "total_steps": 70, "loss": 0.2255, "lr": 4.9692246345985905e-08, "epoch": 6.476190476190476, "percentage": 97.14, "elapsed_time": "1:06:55", "remaining_time": "0:01:58"}
69
+ {"current_steps": 69, "total_steps": 70, "loss": 0.2008, "lr": 1.2430787810776556e-08, "epoch": 6.571428571428571, "percentage": 98.57, "elapsed_time": "1:07:42", "remaining_time": "0:00:58"}
70
+ {"current_steps": 70, "total_steps": 70, "loss": 0.2137, "lr": 0.0, "epoch": 6.666666666666667, "percentage": 100.0, "elapsed_time": "1:08:21", "remaining_time": "0:00:00"}
71
+ {"current_steps": 70, "total_steps": 70, "epoch": 6.666666666666667, "percentage": 100.0, "elapsed_time": "1:13:54", "remaining_time": "0:00:00"}