Upload folder using huggingface_hub
Browse files- README.md +2 -2
- config.json +1 -1
- model.safetensors +2 -2
- model.safetensors.index.json +1 -1
- tokenizer.json +12 -3
README.md
CHANGED
|
@@ -2,10 +2,10 @@
|
|
| 2 |
|
| 3 |
## Model Details
|
| 4 |
- **Architecture**: Transformer with ternary weights (1.58 bits)
|
| 5 |
-
- **Parameters**: 194,
|
| 6 |
- **Model Size**: 38.44 MB (ternary)
|
| 7 |
- **Context Size**: 32768
|
| 8 |
-
- **Vocab Size**:
|
| 9 |
|
| 10 |
## Usage
|
| 11 |
#will be added later
|
|
|
|
| 2 |
|
| 3 |
## Model Details
|
| 4 |
- **Architecture**: Transformer with ternary weights (1.58 bits)
|
| 5 |
+
- **Parameters**: 194,652,233
|
| 6 |
- **Model Size**: 38.44 MB (ternary)
|
| 7 |
- **Context Size**: 32768
|
| 8 |
+
- **Vocab Size**: 4908
|
| 9 |
|
| 10 |
## Usage
|
| 11 |
#will be added later
|
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"vocab_size":
|
| 3 |
"embed_size": 1024,
|
| 4 |
"num_layers": 12,
|
| 5 |
"num_heads": 16,
|
|
|
|
| 1 |
{
|
| 2 |
+
"vocab_size": 4908,
|
| 3 |
"embed_size": 1024,
|
| 4 |
"num_layers": 12,
|
| 5 |
"num_heads": 16,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7c21dd36e5338564a7345592d8986efa6740b8a6abd469ff3d4ffa1a8c7e4fa
|
| 3 |
+
size 1402719116
|
model.safetensors.index.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
-
"total_size":
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"token_embed.weight": "model.safetensors",
|
|
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
+
"total_size": 778608932
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"token_embed.weight": "model.safetensors",
|
tokenizer.json
CHANGED
|
@@ -4905,7 +4905,10 @@
|
|
| 4905 |
"\ud83e\uddf6",
|
| 4906 |
"\u0a83",
|
| 4907 |
"\u8ca1",
|
| 4908 |
-
"\u90b8"
|
|
|
|
|
|
|
|
|
|
| 4909 |
],
|
| 4910 |
"stoi": {
|
| 4911 |
"\t": 0,
|
|
@@ -9812,7 +9815,10 @@
|
|
| 9812 |
"\ud83e\uddf6": 4901,
|
| 9813 |
"\u0a83": 4902,
|
| 9814 |
"\u8ca1": 4903,
|
| 9815 |
-
"\u90b8": 4904
|
|
|
|
|
|
|
|
|
|
| 9816 |
},
|
| 9817 |
"itos": {
|
| 9818 |
"0": "\t",
|
|
@@ -14719,6 +14725,9 @@
|
|
| 14719 |
"4901": "\ud83e\uddf6",
|
| 14720 |
"4902": "\u0a83",
|
| 14721 |
"4903": "\u8ca1",
|
| 14722 |
-
"4904": "\u90b8"
|
|
|
|
|
|
|
|
|
|
| 14723 |
}
|
| 14724 |
}
|
|
|
|
| 4905 |
"\ud83e\uddf6",
|
| 4906 |
"\u0a83",
|
| 4907 |
"\u8ca1",
|
| 4908 |
+
"\u90b8",
|
| 4909 |
+
"\u2005",
|
| 4910 |
+
"\u200a",
|
| 4911 |
+
"\u2012"
|
| 4912 |
],
|
| 4913 |
"stoi": {
|
| 4914 |
"\t": 0,
|
|
|
|
| 9815 |
"\ud83e\uddf6": 4901,
|
| 9816 |
"\u0a83": 4902,
|
| 9817 |
"\u8ca1": 4903,
|
| 9818 |
+
"\u90b8": 4904,
|
| 9819 |
+
"\u2005": 4905,
|
| 9820 |
+
"\u200a": 4906,
|
| 9821 |
+
"\u2012": 4907
|
| 9822 |
},
|
| 9823 |
"itos": {
|
| 9824 |
"0": "\t",
|
|
|
|
| 14725 |
"4901": "\ud83e\uddf6",
|
| 14726 |
"4902": "\u0a83",
|
| 14727 |
"4903": "\u8ca1",
|
| 14728 |
+
"4904": "\u90b8",
|
| 14729 |
+
"4905": "\u2005",
|
| 14730 |
+
"4906": "\u200a",
|
| 14731 |
+
"4907": "\u2012"
|
| 14732 |
}
|
| 14733 |
}
|