morriszms committed on
Commit
37f4972
·
verified ·
1 Parent(s): ca4f24d

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ lamatama-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ lamatama-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ lamatama-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ lamatama-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ lamatama-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ lamatama-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ lamatama-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ lamatama-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ lamatama-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ lamatama-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ lamatama-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ lamatama-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,185 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ license: apache-2.0
5
+ base_model: kevin009/lamatama
6
+ tags:
7
+ - TensorBlock
8
+ - GGUF
9
+ model-index:
10
+ - name: lamatama
11
+ results:
12
+ - task:
13
+ type: text-generation
14
+ name: Text Generation
15
+ dataset:
16
+ name: AI2 Reasoning Challenge (25-Shot)
17
+ type: ai2_arc
18
+ config: ARC-Challenge
19
+ split: test
20
+ args:
21
+ num_few_shot: 25
22
+ metrics:
23
+ - type: acc_norm
24
+ value: 36.35
25
+ name: normalized accuracy
26
+ source:
27
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=kevin009/lamatama
28
+ name: Open LLM Leaderboard
29
+ - task:
30
+ type: text-generation
31
+ name: Text Generation
32
+ dataset:
33
+ name: HellaSwag (10-Shot)
34
+ type: hellaswag
35
+ split: validation
36
+ args:
37
+ num_few_shot: 10
38
+ metrics:
39
+ - type: acc_norm
40
+ value: 61.12
41
+ name: normalized accuracy
42
+ source:
43
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=kevin009/lamatama
44
+ name: Open LLM Leaderboard
45
+ - task:
46
+ type: text-generation
47
+ name: Text Generation
48
+ dataset:
49
+ name: MMLU (5-Shot)
50
+ type: cais/mmlu
51
+ config: all
52
+ split: test
53
+ args:
54
+ num_few_shot: 5
55
+ metrics:
56
+ - type: acc
57
+ value: 24.72
58
+ name: accuracy
59
+ source:
60
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=kevin009/lamatama
61
+ name: Open LLM Leaderboard
62
+ - task:
63
+ type: text-generation
64
+ name: Text Generation
65
+ dataset:
66
+ name: TruthfulQA (0-shot)
67
+ type: truthful_qa
68
+ config: multiple_choice
69
+ split: validation
70
+ args:
71
+ num_few_shot: 0
72
+ metrics:
73
+ - type: mc2
74
+ value: 37.67
75
+ source:
76
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=kevin009/lamatama
77
+ name: Open LLM Leaderboard
78
+ - task:
79
+ type: text-generation
80
+ name: Text Generation
81
+ dataset:
82
+ name: Winogrande (5-shot)
83
+ type: winogrande
84
+ config: winogrande_xl
85
+ split: validation
86
+ args:
87
+ num_few_shot: 5
88
+ metrics:
89
+ - type: acc
90
+ value: 60.77
91
+ name: accuracy
92
+ source:
93
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=kevin009/lamatama
94
+ name: Open LLM Leaderboard
95
+ - task:
96
+ type: text-generation
97
+ name: Text Generation
98
+ dataset:
99
+ name: GSM8k (5-shot)
100
+ type: gsm8k
101
+ config: main
102
+ split: test
103
+ args:
104
+ num_few_shot: 5
105
+ metrics:
106
+ - type: acc
107
+ value: 2.27
108
+ name: accuracy
109
+ source:
110
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=kevin009/lamatama
111
+ name: Open LLM Leaderboard
112
+ ---
113
+
114
+ <div style="width: auto; margin-left: auto; margin-right: auto">
115
+ <img src="https://i.imgur.com/jC7kdl8.jpeg" alt="TensorBlock" style="width: 100%; min-width: 400px; display: block; margin: auto;">
116
+ </div>
117
+ <div style="display: flex; justify-content: space-between; width: 100%;">
118
+ <div style="display: flex; flex-direction: column; align-items: flex-start;">
119
+ <p style="margin-top: 0.5em; margin-bottom: 0em;">
120
+ Feedback and support: TensorBlock's <a href="https://x.com/tensorblock_aoi">Twitter/X</a>, <a href="https://t.me/TensorBlock">Telegram Group</a> and <a href="https://x.com/tensorblock_aoi">Discord server</a>
121
+ </p>
122
+ </div>
123
+ </div>
124
+
125
+ ## kevin009/lamatama - GGUF
126
+
127
+ This repo contains GGUF format model files for [kevin009/lamatama](https://huggingface.co/kevin009/lamatama).
128
+
129
+ The files were quantized using machines provided by [TensorBlock](https://tensorblock.co/), and they are compatible with llama.cpp as of [commit b4242](https://github.com/ggerganov/llama.cpp/commit/a6744e43e80f4be6398fc7733a01642c846dce1d).
130
+
131
+ <div style="text-align: left; margin: 20px 0;">
132
+ <a href="https://tensorblock.co/waitlist/client" style="display: inline-block; padding: 10px 20px; background-color: #007bff; color: white; text-decoration: none; border-radius: 5px; font-weight: bold;">
133
+ Run them on the TensorBlock client using your local machine ↗
134
+ </a>
135
+ </div>
136
+
137
+ ## Prompt template
138
+
139
+ ```
140
+ <|system|>
141
+ {system_prompt}</s>
142
+ <|user|>
143
+ {prompt}</s>
144
+ <|assistant|>
145
+ ```
146
+
147
+ ## Model file specification
148
+
149
+ | Filename | Quant type | File Size | Description |
150
+ | -------- | ---------- | --------- | ----------- |
151
+ | [lamatama-Q2_K.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q2_K.gguf) | Q2_K | 0.432 GB | smallest, significant quality loss - not recommended for most purposes |
152
+ | [lamatama-Q3_K_S.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q3_K_S.gguf) | Q3_K_S | 0.499 GB | very small, high quality loss |
153
+ | [lamatama-Q3_K_M.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q3_K_M.gguf) | Q3_K_M | 0.548 GB | very small, high quality loss |
154
+ | [lamatama-Q3_K_L.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q3_K_L.gguf) | Q3_K_L | 0.592 GB | small, substantial quality loss |
155
+ | [lamatama-Q4_0.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q4_0.gguf) | Q4_0 | 0.637 GB | legacy; small, very high quality loss - prefer using Q3_K_M |
156
+ | [lamatama-Q4_K_S.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q4_K_S.gguf) | Q4_K_S | 0.640 GB | small, greater quality loss |
157
+ | [lamatama-Q4_K_M.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q4_K_M.gguf) | Q4_K_M | 0.668 GB | medium, balanced quality - recommended |
158
+ | [lamatama-Q5_0.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q5_0.gguf) | Q5_0 | 0.766 GB | legacy; medium, balanced quality - prefer using Q4_K_M |
159
+ | [lamatama-Q5_K_S.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q5_K_S.gguf) | Q5_K_S | 0.766 GB | large, low quality loss - recommended |
160
+ | [lamatama-Q5_K_M.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q5_K_M.gguf) | Q5_K_M | 0.782 GB | large, very low quality loss - recommended |
161
+ | [lamatama-Q6_K.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q6_K.gguf) | Q6_K | 0.903 GB | very large, extremely low quality loss |
162
+ | [lamatama-Q8_0.gguf](https://huggingface.co/tensorblock/lamatama-GGUF/blob/main/lamatama-Q8_0.gguf) | Q8_0 | 1.170 GB | very large, extremely low quality loss - not recommended |
163
+
164
+
165
+ ## Download instructions
166
+
167
+ ### Command line
168
+
169
+ First, install the Hugging Face Hub command-line client:
170
+
171
+ ```shell
172
+ pip install -U "huggingface_hub[cli]"
173
+ ```
174
+
175
+ Then, download an individual model file to a local directory:
176
+
177
+ ```shell
178
+ huggingface-cli download tensorblock/lamatama-GGUF --include "lamatama-Q2_K.gguf" --local-dir MY_LOCAL_DIR
179
+ ```
180
+
181
+ If you want to download multiple model files matching a pattern (e.g., `*Q4_K*gguf`), you can try:
182
+
183
+ ```shell
184
+ huggingface-cli download tensorblock/lamatama-GGUF --local-dir MY_LOCAL_DIR --local-dir-use-symlinks False --include='*Q4_K*gguf'
185
+ ```
lamatama-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:767f2d81c08571acac3674c0e16c587f1d1119f4f18336bc69d23566c0c1c6b2
3
+ size 432131328
lamatama-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c93476f16ff5f095323773afcd62229aec60afbf375e0157aa20540cf97b265a
3
+ size 591527168
lamatama-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5c3122e9754caa89bb339dcf81acb236bcc638f27add05cb04aaa341658b3aa
3
+ size 548404480
lamatama-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6df62529512a9cbba07cc576c8afd8fadccef640317d8487135498cd68e19f1
3
+ size 499342592
lamatama-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9147ae51b5bb0a399b5a7f70c1918a16698871912262151466d0e0364b6c6ae1
3
+ size 636726528
lamatama-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4aa013c07236943f6ad7fe693585f593e4ac2db4b68f0983691ac1ee87042894
3
+ size 667815168
lamatama-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c752b5da87b1ab97468e75d9aa5589a449fa6aa3dec23e14f3a144d680b4533
3
+ size 639872256
lamatama-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5c3431f3a6044ce95847afbda6fd835654fed33754063ac76acebadc7e805c4
3
+ size 766029056
lamatama-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4eb8ac6ab4e3b15a5bd8018b59867378f33846283d9c4d549bc3711d439339a
3
+ size 782044416
lamatama-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a0d1a91904ae1c6482dbcc80795dc2fd0620fcdfca48057f47d027ac025a398
3
+ size 766029056
lamatama-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46e5b768848b5cfe0a5dbc9526c8f40918cb885e27e76bfa787b0fa17628da6d
3
+ size 903412992
lamatama-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b985c5121a946b4e783ced96e29adcafc067acd57c15b24d577133c69e5dccc1
3
+ size 1169808640