8k SFT step 7000
Browse files- config.json +1 -1
- generation_config.json +4 -1
- model-00001-of-00031.safetensors +2 -2
- model-00002-of-00031.safetensors +2 -2
- model-00003-of-00031.safetensors +2 -2
- model-00004-of-00031.safetensors +2 -2
- model-00005-of-00031.safetensors +2 -2
- model-00006-of-00031.safetensors +2 -2
- model-00007-of-00031.safetensors +2 -2
- model-00008-of-00031.safetensors +2 -2
- model-00009-of-00031.safetensors +2 -2
- model-00010-of-00031.safetensors +2 -2
- model-00011-of-00031.safetensors +2 -2
- model-00012-of-00031.safetensors +2 -2
- model-00013-of-00031.safetensors +2 -2
- model-00014-of-00031.safetensors +2 -2
- model-00015-of-00031.safetensors +2 -2
- model-00016-of-00031.safetensors +2 -2
- model-00017-of-00031.safetensors +2 -2
- model-00018-of-00031.safetensors +2 -2
- model-00019-of-00031.safetensors +2 -2
- model-00020-of-00031.safetensors +2 -2
- model-00021-of-00031.safetensors +2 -2
- model-00022-of-00031.safetensors +2 -2
- model-00023-of-00031.safetensors +2 -2
- model-00024-of-00031.safetensors +2 -2
- model-00025-of-00031.safetensors +2 -2
- model-00026-of-00031.safetensors +2 -2
- model-00027-of-00031.safetensors +2 -2
- model-00028-of-00031.safetensors +2 -2
- model-00029-of-00031.safetensors +2 -2
- model-00030-of-00031.safetensors +2 -2
- model-00031-of-00031.safetensors +2 -2
- model.safetensors.index.json +0 -0
config.json
CHANGED
|
@@ -12,7 +12,7 @@
|
|
| 12 |
"hidden_size": 8192,
|
| 13 |
"initializer_range": 0.02,
|
| 14 |
"intermediate_size": 28672,
|
| 15 |
-
"max_position_embeddings":
|
| 16 |
"mlp_bias": false,
|
| 17 |
"model_type": "llama",
|
| 18 |
"num_attention_heads": 64,
|
|
|
|
| 12 |
"hidden_size": 8192,
|
| 13 |
"initializer_range": 0.02,
|
| 14 |
"intermediate_size": 28672,
|
| 15 |
+
"max_position_embeddings": 8192,
|
| 16 |
"mlp_bias": false,
|
| 17 |
"model_type": "llama",
|
| 18 |
"num_attention_heads": 64,
|
generation_config.json
CHANGED
|
@@ -1,7 +1,10 @@
|
|
| 1 |
{
|
| 2 |
"_from_model_config": true,
|
| 3 |
"bos_token_id": 2,
|
| 4 |
-
"eos_token_id": [
|
|
|
|
|
|
|
|
|
|
| 5 |
"transformers_version": "4.57.1",
|
| 6 |
"use_cache": false
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"_from_model_config": true,
|
| 3 |
"bos_token_id": 2,
|
| 4 |
+
"eos_token_id": [
|
| 5 |
+
1,
|
| 6 |
+
106
|
| 7 |
+
],
|
| 8 |
"transformers_version": "4.57.1",
|
| 9 |
"use_cache": false
|
| 10 |
}
|
model-00001-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6101b28b1462889a5d8732f6a5eff27481a69263451e4501b28910eeb1855755
|
| 3 |
+
size 4613819728
|
model-00002-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43dbf63f353db1416049a6350adbbc4e6d799d7956abc916f660083769f62552
|
| 3 |
+
size 4966140568
|
model-00003-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8775f5e400e8da57896b8f693b73723251051b090fdf0f008698ce64f828495f
|
| 3 |
+
size 4563471232
|
model-00004-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2cd6c4d7edb04cae470db8f206c84d5edd5e2b253d88f5d9a9d74f38b6b00396
|
| 3 |
+
size 4815196288
|
model-00005-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60513c91acfd7b98478616f521277da5c0173eb42bdfb17acce1db16eae097bd
|
| 3 |
+
size 4966073280
|
model-00006-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cde1f97a42ac15e7c56f95c1b929a9ea7a2da40ed708f07f68fae1244c52cbf
|
| 3 |
+
size 4580280832
|
model-00007-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28eafcabc6fb1a54a2f4dc6be713cece32b3ecdf7896f79022bc05622da2a9d8
|
| 3 |
+
size 4831906224
|
model-00008-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:62a48e02a0ec5346dfcfb520a70c8ca1b65d0dac3f21a5f2a6877e5bce876ddc
|
| 3 |
+
size 4815095880
|
model-00009-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04a2298f08ed2f7b1134d847e40fb3dc3ee28666f3c03cdd899b30f88cad115a
|
| 3 |
+
size 4781574912
|
model-00010-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53d20353e669c46a6a8645f20e2bf2e0def561564173ff80824dfb2d7a1527a1
|
| 3 |
+
size 4680927528
|
model-00011-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b60c8ee6a6f477e7c776ed21b62a3f1e5f3f57757fadc0ef631ed00129dabf4
|
| 3 |
+
size 3691055400
|
model-00012-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:719f682f5f4df94da10da6227f448718c77c29fc950cc985be46af3211069421
|
| 3 |
+
size 4915724776
|
model-00013-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c77ec4bfa6539d656194e5eaa349b74185c50ddd88285a415e0d340fd01fe7e2
|
| 3 |
+
size 4949396216
|
model-00014-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03dd32116df7cb579afc89aa3db41f27cafe5a6c899e15c68a498631320af27b
|
| 3 |
+
size 4898998928
|
model-00015-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ffb4fce4ffc9b9a697e057f7590d64eb9c0a98d61a7d4ef94169778b6dae2aa
|
| 3 |
+
size 4882237496
|
model-00016-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c946f7d3b2fd60b2579895be09f5b2d13500c65d77fd4e0868947c40f288e1b
|
| 3 |
+
size 4915825192
|
model-00017-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23d4dc4ac352ac21c8615af5f0e3b85c7fd72e8f534d27eeb78854a1fb0942b5
|
| 3 |
+
size 4680960536
|
model-00018-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6d2884d7b555e6d0112892e14d34e20e66a167444d9d9fe99e55b274af6b5902
|
| 3 |
+
size 4680961248
|
model-00019-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f710dfe2b8969f241eb3407b8dab283e2714c02dcb70f46c2b08a34ea922fd6
|
| 3 |
+
size 4932552896
|
model-00020-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87bdda79cbf8fb5deafd381f044d5ec2c01e3b598f83a1f4d27593216fcaba27
|
| 3 |
+
size 4815113072
|
model-00021-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c70370dbb287ecbea148d7a8cb997200fbab1196723ac491d932b34745be93ca
|
| 3 |
+
size 4798467728
|
model-00022-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b4fa5f9fbc3b792de931095a3f3495e84228aa84602acc858b3222565548eca
|
| 3 |
+
size 4781673920
|
model-00023-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6fb8a643e23506ba8f057601d409a935a3a5ae223ed54b1a282f58f9e24843a1
|
| 3 |
+
size 4882287728
|
model-00024-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b32fb13284ecfec87260bcb6c9e52299896bb463cbf249389201c4c021f30bd
|
| 3 |
+
size 4949280728
|
model-00025-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:853ad0b777ede4a543c0f3af870542ea256c23f0aabeb7bc2ff394e375ff3469
|
| 3 |
+
size 4798451984
|
model-00026-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d9ad1b79a5dfbcb943c4e0d6186d910b72c35b92e9f181bb5305f0857b389bc
|
| 3 |
+
size 4630546744
|
model-00027-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ce9cdd1993c1e11e8d237426cb8b0b781ed3502a9be737cad4b9d3ac8e2751c
|
| 3 |
+
size 4546744120
|
model-00028-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55b561adb2219f32bd94a5bda0922a3083a18c3266596bc8055ff9052d2c4f9f
|
| 3 |
+
size 4966322784
|
model-00029-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d279aa3f548f543c930ba93c50e9ce403af00db040b1d6c717e80bd1e30f1a3
|
| 3 |
+
size 4966206536
|
model-00030-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8491bf25c095b5094b0f369f5edf0734746c0eebc05fef644eceed9adbc5d7a3
|
| 3 |
+
size 4966074560
|
model-00031-of-00031.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e950025e3154f727b9b6cb82d2bfeec3532a226d046bcb3abdfdba1149235da
|
| 3 |
+
size 2231370920
|
model.safetensors.index.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|