Upload folder using huggingface_hub
Browse files
- config.json +4 -4
- generation_config.json +1 -1
- model-00001-of-00005.safetensors +2 -2
- model-00002-of-00005.safetensors +1 -1
- model-00003-of-00005.safetensors +1 -1
- model-00004-of-00005.safetensors +1 -1
- model-00005-of-00005.safetensors +2 -2
- model.safetensors.index.json +1 -1
- tokenizer.json +2 -2
- tokenizer_config.json +4 -36
config.json
CHANGED
|
@@ -4,7 +4,7 @@
|
|
| 4 |
],
|
| 5 |
"attention_dropout": 0.0,
|
| 6 |
"bos_token_id": 1,
|
| 7 |
-
"eos_token_id":
|
| 8 |
"head_dim": 128,
|
| 9 |
"hidden_act": "silu",
|
| 10 |
"hidden_size": 5120,
|
|
@@ -20,7 +20,7 @@
|
|
| 20 |
"sliding_window": null,
|
| 21 |
"tie_word_embeddings": false,
|
| 22 |
"torch_dtype": "bfloat16",
|
| 23 |
-
"transformers_version": "4.51.
|
| 24 |
-
"use_cache":
|
| 25 |
-
"vocab_size":
|
| 26 |
}
|
|
|
|
| 4 |
],
|
| 5 |
"attention_dropout": 0.0,
|
| 6 |
"bos_token_id": 1,
|
| 7 |
+
"eos_token_id": 17,
|
| 8 |
"head_dim": 128,
|
| 9 |
"hidden_act": "silu",
|
| 10 |
"hidden_size": 5120,
|
|
|
|
| 20 |
"sliding_window": null,
|
| 21 |
"tie_word_embeddings": false,
|
| 22 |
"torch_dtype": "bfloat16",
|
| 23 |
+
"transformers_version": "4.51.3",
|
| 24 |
+
"use_cache": true,
|
| 25 |
+
"vocab_size": 131072
|
| 26 |
}
|
generation_config.json
CHANGED
|
@@ -3,5 +3,5 @@
|
|
| 3 |
"bos_token_id": 1,
|
| 4 |
"do_sample": true,
|
| 5 |
"eos_token_id": 2,
|
| 6 |
-
"transformers_version": "4.51.
|
| 7 |
}
|
|
|
|
| 3 |
"bos_token_id": 1,
|
| 4 |
"do_sample": true,
|
| 5 |
"eos_token_id": 2,
|
| 6 |
+
"transformers_version": "4.51.3"
|
| 7 |
}
|
model-00001-of-00005.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a10a172096dd98e39d29fa5f2d638a555ca507afdaa32add4ab8430491c28599
|
| 3 |
+
size 4865522496
|
model-00002-of-00005.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4907529424
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0cb8ed56e931bac99ba94400491237c81defe954e745e8a900f54e098c9b0e2
|
| 3 |
size 4907529424
|
model-00003-of-00005.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4907529456
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d3d42f17f8416813b982c6fd3e5d6f0af88200df843e4265496e8654170d966
|
| 3 |
size 4907529456
|
model-00004-of-00005.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4907529456
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d515e55fbdf889f16247101b4e30430b6fe47898e79a98197b871a2f525963d7
|
| 3 |
size 4907529456
|
model-00005-of-00005.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7adbaab3984cfaa63aa152c62633484d9d72811acf619d7c738a0066edca205a
|
| 3 |
+
size 4907496272
|
model.safetensors.index.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
-
"total_size":
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"lm_head.weight": "model-00005-of-00005.safetensors",
|
|
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
+
"total_size": 24495564800
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"lm_head.weight": "model-00005-of-00005.safetensors",
|
tokenizer.json
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e4134ad5fafadb3d5548d1eeb269d0de40f00244947690bf518a53c946d265e6
|
| 3 |
+
size 17078326
|
tokenizer_config.json
CHANGED
|
@@ -116,7 +116,7 @@
|
|
| 116 |
"special": true
|
| 117 |
},
|
| 118 |
"14": {
|
| 119 |
-
"content": "
|
| 120 |
"lstrip": false,
|
| 121 |
"normalized": false,
|
| 122 |
"rstrip": false,
|
|
@@ -124,7 +124,7 @@
|
|
| 124 |
"special": true
|
| 125 |
},
|
| 126 |
"15": {
|
| 127 |
-
"content": "
|
| 128 |
"lstrip": false,
|
| 129 |
"normalized": false,
|
| 130 |
"rstrip": false,
|
|
@@ -132,7 +132,7 @@
|
|
| 132 |
"special": true
|
| 133 |
},
|
| 134 |
"16": {
|
| 135 |
-
"content": "
|
| 136 |
"lstrip": false,
|
| 137 |
"normalized": false,
|
| 138 |
"rstrip": false,
|
|
@@ -140,7 +140,7 @@
|
|
| 140 |
"special": true
|
| 141 |
},
|
| 142 |
"17": {
|
| 143 |
-
"content": "
|
| 144 |
"lstrip": false,
|
| 145 |
"normalized": false,
|
| 146 |
"rstrip": false,
|
|
@@ -8002,38 +8002,6 @@
|
|
| 8002 |
"rstrip": false,
|
| 8003 |
"single_word": false,
|
| 8004 |
"special": true
|
| 8005 |
-
},
|
| 8006 |
-
"131072": {
|
| 8007 |
-
"content": "<|im_end|>",
|
| 8008 |
-
"lstrip": false,
|
| 8009 |
-
"normalized": false,
|
| 8010 |
-
"rstrip": false,
|
| 8011 |
-
"single_word": false,
|
| 8012 |
-
"special": true
|
| 8013 |
-
},
|
| 8014 |
-
"131073": {
|
| 8015 |
-
"content": "<|im_start|>system",
|
| 8016 |
-
"lstrip": false,
|
| 8017 |
-
"normalized": false,
|
| 8018 |
-
"rstrip": false,
|
| 8019 |
-
"single_word": false,
|
| 8020 |
-
"special": false
|
| 8021 |
-
},
|
| 8022 |
-
"131074": {
|
| 8023 |
-
"content": "<|im_start|>assistant",
|
| 8024 |
-
"lstrip": false,
|
| 8025 |
-
"normalized": false,
|
| 8026 |
-
"rstrip": false,
|
| 8027 |
-
"single_word": false,
|
| 8028 |
-
"special": false
|
| 8029 |
-
},
|
| 8030 |
-
"131075": {
|
| 8031 |
-
"content": "<|im_start|>user",
|
| 8032 |
-
"lstrip": false,
|
| 8033 |
-
"normalized": false,
|
| 8034 |
-
"rstrip": false,
|
| 8035 |
-
"single_word": false,
|
| 8036 |
-
"special": false
|
| 8037 |
}
|
| 8038 |
},
|
| 8039 |
"bos_token": "<s>",
|
|
|
|
| 116 |
"special": true
|
| 117 |
},
|
| 118 |
"14": {
|
| 119 |
+
"content": "<|im_start|>user",
|
| 120 |
"lstrip": false,
|
| 121 |
"normalized": false,
|
| 122 |
"rstrip": false,
|
|
|
|
| 124 |
"special": true
|
| 125 |
},
|
| 126 |
"15": {
|
| 127 |
+
"content": "<|im_start|>assistant",
|
| 128 |
"lstrip": false,
|
| 129 |
"normalized": false,
|
| 130 |
"rstrip": false,
|
|
|
|
| 132 |
"special": true
|
| 133 |
},
|
| 134 |
"16": {
|
| 135 |
+
"content": "<|im_start|>system",
|
| 136 |
"lstrip": false,
|
| 137 |
"normalized": false,
|
| 138 |
"rstrip": false,
|
|
|
|
| 140 |
"special": true
|
| 141 |
},
|
| 142 |
"17": {
|
| 143 |
+
"content": "<|im_end|>",
|
| 144 |
"lstrip": false,
|
| 145 |
"normalized": false,
|
| 146 |
"rstrip": false,
|
|
|
|
| 8002 |
"rstrip": false,
|
| 8003 |
"single_word": false,
|
| 8004 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8005 |
}
|
| 8006 |
},
|
| 8007 |
"bos_token": "<s>",
|