morriszms committed on
Commit
e567290
·
verified ·
1 Parent(s): 5f3e675

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ L-MChat-Small-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ L-MChat-Small-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ L-MChat-Small-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ L-MChat-Small-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ L-MChat-Small-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ L-MChat-Small-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ L-MChat-Small-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ L-MChat-Small-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ L-MChat-Small-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ L-MChat-Small-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ L-MChat-Small-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ L-MChat-Small-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
L-MChat-Small-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80743d46e27f69207bd58b3d4b3d7c79c30b48b3a950cf5ec3ee1dbcc2bfe497
3
+ size 1109720768
L-MChat-Small-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e090aafb934e052468c4af127dc510cf6b221d5b56c7f84f45fe341b843d147
3
+ size 1575231168
L-MChat-Small-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8926d5feee6e7edaf25f6b4a11f08387bb2c85790123963e6dc02a17edb045aa
3
+ size 1426136768
L-MChat-Small-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caa311906919964983267bf6ebc3b93ffc873f46b03f7e27bed42c4a44a4f2c3
3
+ size 1250827968
L-MChat-Small-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4c829cce09a469201a83ced21f23b7968596ad682c2f27a8cb5b4c6385e3d20
3
+ size 1602469568
L-MChat-Small-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ca11b0473eba42fd394d106e6d2809f3139b09c792dff353dc9322ab4ae7f71
3
+ size 1737637568
L-MChat-Small-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9c04aa5c0b319fceb2eebe5efdfcffa4de51fb19d63eaff4b37e5c0a4fd9749
3
+ size 1618853568
L-MChat-Small-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b447e36e17fd8cff2123ad1df79644b5e7a372acf3e2bbec900b353938d6a154
3
+ size 1933426368
L-MChat-Small-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0a42e5315fd2a248c1561e9b79506d99b261c46369f55b5808a9e7595dc92f1
3
+ size 2003058368
L-MChat-Small-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a44372f1de5704dd4cf011154f7c9b4f530f4c0829c888b3f66a9330a4e1f939
3
+ size 1933426368
L-MChat-Small-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:990f0b585e27502fb9a715cf7118990d086dbb9b25fb94103f5beb7542948f82
3
+ size 2285067968
L-MChat-Small-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a05565f48bffe23339d9541ea99a2f12c358fa217d84ab7d30ac2214d61f7a5
3
+ size 2958040768
README.md ADDED
@@ -0,0 +1,180 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ library_name: transformers
4
+ tags:
5
+ - mergekit
6
+ - merge
7
+ - TensorBlock
8
+ - GGUF
9
+ base_model: Artples/L-MChat-Small
10
+ model-index:
11
+ - name: L-MChat-Small
12
+ results:
13
+ - task:
14
+ type: text-generation
15
+ name: Text Generation
16
+ dataset:
17
+ name: AI2 Reasoning Challenge (25-Shot)
18
+ type: ai2_arc
19
+ config: ARC-Challenge
20
+ split: test
21
+ args:
22
+ num_few_shot: 25
23
+ metrics:
24
+ - type: acc_norm
25
+ value: 61.6
26
+ name: normalized accuracy
27
+ source:
28
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Artples/L-MChat-Small
29
+ name: Open LLM Leaderboard
30
+ - task:
31
+ type: text-generation
32
+ name: Text Generation
33
+ dataset:
34
+ name: HellaSwag (10-Shot)
35
+ type: hellaswag
36
+ split: validation
37
+ args:
38
+ num_few_shot: 10
39
+ metrics:
40
+ - type: acc_norm
41
+ value: 75.9
42
+ name: normalized accuracy
43
+ source:
44
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Artples/L-MChat-Small
45
+ name: Open LLM Leaderboard
46
+ - task:
47
+ type: text-generation
48
+ name: Text Generation
49
+ dataset:
50
+ name: MMLU (5-Shot)
51
+ type: cais/mmlu
52
+ config: all
53
+ split: test
54
+ args:
55
+ num_few_shot: 5
56
+ metrics:
57
+ - type: acc
58
+ value: 57.41
59
+ name: accuracy
60
+ source:
61
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Artples/L-MChat-Small
62
+ name: Open LLM Leaderboard
63
+ - task:
64
+ type: text-generation
65
+ name: Text Generation
66
+ dataset:
67
+ name: TruthfulQA (0-shot)
68
+ type: truthful_qa
69
+ config: multiple_choice
70
+ split: validation
71
+ args:
72
+ num_few_shot: 0
73
+ metrics:
74
+ - type: mc2
75
+ value: 49.94
76
+ source:
77
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Artples/L-MChat-Small
78
+ name: Open LLM Leaderboard
79
+ - task:
80
+ type: text-generation
81
+ name: Text Generation
82
+ dataset:
83
+ name: Winogrande (5-shot)
84
+ type: winogrande
85
+ config: winogrande_xl
86
+ split: validation
87
+ args:
88
+ num_few_shot: 5
89
+ metrics:
90
+ - type: acc
91
+ value: 74.98
92
+ name: accuracy
93
+ source:
94
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Artples/L-MChat-Small
95
+ name: Open LLM Leaderboard
96
+ - task:
97
+ type: text-generation
98
+ name: Text Generation
99
+ dataset:
100
+ name: GSM8k (5-shot)
101
+ type: gsm8k
102
+ config: main
103
+ split: test
104
+ args:
105
+ num_few_shot: 5
106
+ metrics:
107
+ - type: acc
108
+ value: 58.98
109
+ name: accuracy
110
+ source:
111
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Artples/L-MChat-Small
112
+ name: Open LLM Leaderboard
113
+ ---
114
+
115
+ <div style="width: auto; margin-left: auto; margin-right: auto">
116
+ <img src="https://i.imgur.com/jC7kdl8.jpeg" alt="TensorBlock" style="width: 100%; min-width: 400px; display: block; margin: auto;">
117
+ </div>
118
+ <div style="display: flex; justify-content: space-between; width: 100%;">
119
+ <div style="display: flex; flex-direction: column; align-items: flex-start;">
120
+ <p style="margin-top: 0.5em; margin-bottom: 0em;">
121
+ Feedback and support: TensorBlock's <a href="https://x.com/tensorblock_aoi">Twitter/X</a>, <a href="https://t.me/TensorBlock">Telegram Group</a> and <a href="https://x.com/tensorblock_aoi">Discord server</a>
122
+ </p>
123
+ </div>
124
+ </div>
125
+
126
+ ## Artples/L-MChat-Small - GGUF
127
+
128
+ This repo contains GGUF format model files for [Artples/L-MChat-Small](https://huggingface.co/Artples/L-MChat-Small).
129
+
130
+ The files were quantized using machines provided by [TensorBlock](https://tensorblock.co/), and they are compatible with llama.cpp as of [commit b4011](https://github.com/ggerganov/llama.cpp/commit/a6744e43e80f4be6398fc7733a01642c846dce1d).
131
+
132
+ ## Prompt template
133
+
134
+ ```
135
+ <|im_start|>system
136
+ {system_prompt}<|im_end|>
137
+ <|im_start|>user
138
+ {prompt}<|im_end|>
139
+ <|im_start|>assistant
140
+ ```
141
+
142
+ ## Model file specification
143
+
144
+ | Filename | Quant type | File Size | Description |
145
+ | -------- | ---------- | --------- | ----------- |
146
+ | [L-MChat-Small-Q2_K.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q2_K.gguf) | Q2_K | 1.034 GB | smallest, significant quality loss - not recommended for most purposes |
147
+ | [L-MChat-Small-Q3_K_S.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q3_K_S.gguf) | Q3_K_S | 1.165 GB | very small, high quality loss |
148
+ | [L-MChat-Small-Q3_K_M.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q3_K_M.gguf) | Q3_K_M | 1.328 GB | very small, high quality loss |
149
+ | [L-MChat-Small-Q3_K_L.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q3_K_L.gguf) | Q3_K_L | 1.467 GB | small, substantial quality loss |
150
+ | [L-MChat-Small-Q4_0.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q4_0.gguf) | Q4_0 | 1.492 GB | legacy; small, very high quality loss - prefer using Q3_K_M |
151
+ | [L-MChat-Small-Q4_K_S.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q4_K_S.gguf) | Q4_K_S | 1.508 GB | small, greater quality loss |
152
+ | [L-MChat-Small-Q4_K_M.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q4_K_M.gguf) | Q4_K_M | 1.618 GB | medium, balanced quality - recommended |
153
+ | [L-MChat-Small-Q5_0.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q5_0.gguf) | Q5_0 | 1.801 GB | legacy; medium, balanced quality - prefer using Q4_K_M |
154
+ | [L-MChat-Small-Q5_K_S.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q5_K_S.gguf) | Q5_K_S | 1.801 GB | large, low quality loss - recommended |
155
+ | [L-MChat-Small-Q5_K_M.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q5_K_M.gguf) | Q5_K_M | 1.865 GB | large, very low quality loss - recommended |
156
+ | [L-MChat-Small-Q6_K.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q6_K.gguf) | Q6_K | 2.128 GB | very large, extremely low quality loss |
157
+ | [L-MChat-Small-Q8_0.gguf](https://huggingface.co/tensorblock/L-MChat-Small-GGUF/tree/main/L-MChat-Small-Q8_0.gguf) | Q8_0 | 2.755 GB | very large, extremely low quality loss - not recommended |
158
+
159
+
160
+ ## Download instructions
161
+
162
+ ### Command line
163
+
164
+ First, install the Hugging Face Hub command-line client:
165
+
166
+ ```shell
167
+ pip install -U "huggingface_hub[cli]"
168
+ ```
169
+
170
+ Then, download an individual model file to a local directory:
171
+
172
+ ```shell
173
+ huggingface-cli download tensorblock/L-MChat-Small-GGUF --include "L-MChat-Small-Q2_K.gguf" --local-dir MY_LOCAL_DIR
174
+ ```
175
+
176
+ If you want to download multiple model files matching a pattern (e.g., `*Q4_K*gguf`), you can try:
177
+
178
+ ```shell
179
+ huggingface-cli download tensorblock/L-MChat-Small-GGUF --local-dir MY_LOCAL_DIR --local-dir-use-symlinks False --include='*Q4_K*gguf'
180
+ ```