Update README.md
Browse files
README.md
CHANGED
|
@@ -211,35 +211,11 @@ license: apache-2.0
|
|
| 211 |
<tbody>
|
| 212 |
<!-- UPDATE THESE ROWS WITH YOUR ACTUAL FILES -->
|
| 213 |
<tr>
|
| 214 |
-
<td><code>north-code-quant-Q8_0.gguf</code></td>
|
| 215 |
<td><span class="nc-quant-tag">Q8_0</span></td>
|
| 216 |
<td>-- GB</td>
|
| 217 |
<td>Near-lossless. Best quality, higher VRAM/RAM requirement.</td>
|
| 218 |
</tr>
|
| 219 |
-
<tr>
|
| 220 |
-
<td><code>north-code-quant-Q6_K.gguf</code></td>
|
| 221 |
-
<td><span class="nc-quant-tag">Q6_K</span></td>
|
| 222 |
-
<td>-- GB</td>
|
| 223 |
-
<td>Very low perplexity loss. Great for critical code tasks.</td>
|
| 224 |
-
</tr>
|
| 225 |
-
<tr style="background: rgba(88, 166, 255, 0.05);">
|
| 226 |
-
<td><code>north-code-quant-Q4_K_M.gguf</code></td>
|
| 227 |
-
<td><span class="nc-quant-tag">Q4_K_M</span></td>
|
| 228 |
-
<td>-- GB</td>
|
| 229 |
-
<td><strong>⭐ Recommended.</strong> Best size/performance ratio.</td>
|
| 230 |
-
</tr>
|
| 231 |
-
<tr>
|
| 232 |
-
<td><code>north-code-quant-Q3_K_M.gguf</code></td>
|
| 233 |
-
<td><span class="nc-quant-tag">Q3_K_M</span></td>
|
| 234 |
-
<td>-- GB</td>
|
| 235 |
-
<td>Lower resource usage. Noticeable quality degradation in complex reasoning.</td>
|
| 236 |
-
</tr>
|
| 237 |
-
<tr>
|
| 238 |
-
<td><code>north-code-quant-IQ4_XS.gguf</code></td>
|
| 239 |
-
<td><span class="nc-quant-tag">IQ4_XS</span></td>
|
| 240 |
-
<td>-- GB</td>
|
| 241 |
-
<td>Importance Matrix quant. Smaller than Q4 with similar quality.</td>
|
| 242 |
-
</tr>
|
| 243 |
</tbody>
|
| 244 |
</table>
|
| 245 |
</div>
|
|
@@ -251,11 +227,6 @@ license: apache-2.0
|
|
| 251 |
<a href="https://huggingface.co/CohereForAI/c4ai-command-r-plus" target="_blank">Cohere North Code</a>
|
| 252 |
weights using <code>llama.cpp</code> with importance matrix calibration for optimal token-level precision retention.
|
| 253 |
</p>
|
| 254 |
-
<ul style="color: var(--nc-text-muted); padding-left: 1.5rem;">
|
| 255 |
-
<li><strong>Calibration Dataset:</strong> CodeAlpaca + SlimOrca subset</li>
|
| 256 |
-
<li><strong>Imatrix:</strong> Enabled for K-quants (Q3_K through Q6_K)</li>
|
| 257 |
-
<li><strong>Vocab:</strong> Original Cohere tokenizer preserved</li>
|
| 258 |
-
</ul>
|
| 259 |
|
| 260 |
<!-- DISCLAIMER -->
|
| 261 |
<div class="nc-disclaimer">
|
|
|
|
| 211 |
<tbody>
|
| 212 |
<!-- UPDATE THESE ROWS WITH YOUR ACTUAL FILES -->
|
| 213 |
<tr>
|
| 214 |
+
<td><code>North-Code-Quant.gguf</code></td>
|
| 215 |
<td><span class="nc-quant-tag">Q8_0</span></td>
|
| 216 |
<td>-- GB</td>
|
| 217 |
<td>Near-lossless. Best quality, higher VRAM/RAM requirement.</td>
|
| 218 |
</tr>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 219 |
</tbody>
|
| 220 |
</table>
|
| 221 |
</div>
|
|
|
|
| 227 |
<a href="https://huggingface.co/CohereForAI/c4ai-command-r-plus" target="_blank">Cohere North Code</a>
|
| 228 |
weights using <code>llama.cpp</code> with importance matrix calibration for optimal token-level precision retention.
|
| 229 |
</p>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 230 |
|
| 231 |
<!-- DISCLAIMER -->
|
| 232 |
<div class="nc-disclaimer">
|