Upload model
Browse files
- .gitattributes +12 -0
- README.md +34 -0
- config.json +38 -0
- gemma3-4b-it-afq2-0.uqff +3 -0
- gemma3-4b-it-afq3-0.uqff +3 -0
- gemma3-4b-it-afq4-0.uqff +3 -0
- gemma3-4b-it-afq6-0.uqff +3 -0
- gemma3-4b-it-afq8-0.uqff +3 -0
- gemma3-4b-it-f8e4m3-0.uqff +3 -0
- gemma3-4b-it-q2k-0.uqff +3 -0
- gemma3-4b-it-q3k-0.uqff +3 -0
- gemma3-4b-it-q4k-0.uqff +3 -0
- gemma3-4b-it-q5k-0.uqff +3 -0
- gemma3-4b-it-q8_0-0.uqff +3 -0
- generation_config.json +13 -0
- preprocessor_config.json +29 -0
- processor_config.json +4 -0
- residual.safetensors +3 -0
- tokenizer.json +3 -0
- tokenizer_config.json +0 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
gemma3-4b-it-afq2-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
gemma3-4b-it-afq3-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
gemma3-4b-it-afq4-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
gemma3-4b-it-afq6-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
gemma3-4b-it-afq8-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
gemma3-4b-it-f8e4m3-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
gemma3-4b-it-q2k-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
gemma3-4b-it-q3k-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
gemma3-4b-it-q4k-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
gemma3-4b-it-q5k-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
gemma3-4b-it-q8_0-0.uqff filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- uqff
|
| 4 |
+
- mistral.rs
|
| 5 |
+
base_model: google/gemma-3-4b-it
|
| 6 |
+
base_model_relation: quantized
|
| 7 |
+
---
|
| 8 |
+
|
| 9 |
+
<!-- Autogenerated from user input. -->
|
| 10 |
+
|
| 11 |
+
# `google/gemma-3-4b-it`, UQFF quantization
|
| 12 |
+
|
| 13 |
+
|
| 14 |
+
Run with [mistral.rs](https://github.com/EricLBuehler/mistral.rs). Documentation: [UQFF docs](https://github.com/EricLBuehler/mistral.rs/blob/master/docs/UQFF.md).
|
| 15 |
+
|
| 16 |
+
1) **Flexible** 🌀: Multiple quantization formats in *one* file format with *one* framework to run them all.
|
| 17 |
+
2) **Reliable** 🔒: Compatibility ensured with *embedded* and *checked* semantic versioning information from day 1.
|
| 18 |
+
3) **Easy** 🤗: Download UQFF models *easily* and *quickly* from Hugging Face, or use a local file.
|
| 19 |
+
4) **Customizable** 🛠️: Make and publish your own UQFF files in minutes.
|
| 20 |
+
|
| 21 |
+
## Examples
|
| 22 |
+
|Quantization type(s)|Example|
|
| 23 |
+
|--|--|
|
| 24 |
+
|AFQ2|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq2-0.uqff`|
|
| 25 |
+
|AFQ3|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq3-0.uqff`|
|
| 26 |
+
|AFQ4|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq4-0.uqff`|
|
| 27 |
+
|AFQ6|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq6-0.uqff`|
|
| 28 |
+
|AFQ8|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq8-0.uqff`|
|
| 29 |
+
|F8E4M3|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-f8e4m3-0.uqff`|
|
| 30 |
+
|Q2K|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q2k-0.uqff`|
|
| 31 |
+
|Q3K|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q3k-0.uqff`|
|
| 32 |
+
|Q4K|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q4k-0.uqff`|
|
| 33 |
+
|Q5K|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q5k-0.uqff`|
|
| 34 |
+
|Q8_0|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q8_0-0.uqff`|
|
config.json
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"Gemma3ForConditionalGeneration"
|
| 4 |
+
],
|
| 5 |
+
"boi_token_index": 255999,
|
| 6 |
+
"eoi_token_index": 256000,
|
| 7 |
+
"eos_token_id": [
|
| 8 |
+
1,
|
| 9 |
+
106
|
| 10 |
+
],
|
| 11 |
+
"image_token_index": 262144,
|
| 12 |
+
"initializer_range": 0.02,
|
| 13 |
+
"mm_tokens_per_image": 256,
|
| 14 |
+
"model_type": "gemma3",
|
| 15 |
+
"text_config": {
|
| 16 |
+
"hidden_size": 2560,
|
| 17 |
+
"intermediate_size": 10240,
|
| 18 |
+
"model_type": "gemma3_text",
|
| 19 |
+
"num_hidden_layers": 34,
|
| 20 |
+
"rope_scaling": {
|
| 21 |
+
"factor": 8.0,
|
| 22 |
+
"rope_type": "linear"
|
| 23 |
+
},
|
| 24 |
+
"sliding_window": 1024
|
| 25 |
+
},
|
| 26 |
+
"torch_dtype": "bfloat16",
|
| 27 |
+
"transformers_version": "4.50.0.dev0",
|
| 28 |
+
"vision_config": {
|
| 29 |
+
"hidden_size": 1152,
|
| 30 |
+
"image_size": 896,
|
| 31 |
+
"intermediate_size": 4304,
|
| 32 |
+
"model_type": "siglip_vision_model",
|
| 33 |
+
"num_attention_heads": 16,
|
| 34 |
+
"num_hidden_layers": 27,
|
| 35 |
+
"patch_size": 14,
|
| 36 |
+
"vision_use_head": false
|
| 37 |
+
}
|
| 38 |
+
}
|
gemma3-4b-it-afq2-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7fd4da935e4a4643265e4a2faa69a5beda8fbe043646ee4414f83235f5177ea4
|
| 3 |
+
size 1212501540
|
gemma3-4b-it-afq3-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4eda4c491c5b28fc15f99b2d855c25254f12ab6d360750e148b9e1e3b7a2f516
|
| 3 |
+
size 1697488724
|
gemma3-4b-it-afq4-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75ec12d5c4ce731a259245a3978e5caa1ab482160311f3fa321b14a6df3c53c1
|
| 3 |
+
size 2182475684
|
gemma3-4b-it-afq6-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:398aeedf5048fc3ac09210ba3cc1120766fcd33edcf99cf85757b81d38a795f3
|
| 3 |
+
size 3152449524
|
gemma3-4b-it-afq8-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1749869931a1d89294655bb95fac86358a3a978835593798d0b77d2573f03090
|
| 3 |
+
size 4122423324
|
gemma3-4b-it-f8e4m3-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d94e158247d6a4d4f70785d2e864653cc66ba78febe2cfc308234478c65642a
|
| 3 |
+
size 3879923662
|
gemma3-4b-it-q2k-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa7485733a89779463dd130963da9a182ed0e048e0b0e5170fdbbcc02ae3a5a0
|
| 3 |
+
size 1273114886
|
gemma3-4b-it-q3k-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b07b1e98d893331ac077e409240faa2cc54f13247c69972e518392e1f88efad4
|
| 3 |
+
size 1667167006
|
gemma3-4b-it-q4k-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab3e3af19315a00229b6b4aeca1b7b1db061127575a360a79e38e097987b9e77
|
| 3 |
+
size 2182465646
|
gemma3-4b-it-q5k-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be6e3e7eceeb9ed1133f31e0b768cab3ac2235423ae760355103444acf7cb3ea
|
| 3 |
+
size 2667452574
|
gemma3-4b-it-q8_0-0.uqff
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fee927648a2e8d1f2d6059867d24edd342735dffc65ad343e3eac084d8bf8647
|
| 3 |
+
size 4122413286
|
generation_config.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token_id": 2,
|
| 3 |
+
"cache_implementation": "hybrid",
|
| 4 |
+
"do_sample": true,
|
| 5 |
+
"eos_token_id": [
|
| 6 |
+
1,
|
| 7 |
+
106
|
| 8 |
+
],
|
| 9 |
+
"pad_token_id": 0,
|
| 10 |
+
"top_k": 64,
|
| 11 |
+
"top_p": 0.95,
|
| 12 |
+
"transformers_version": "4.50.0.dev0"
|
| 13 |
+
}
|
preprocessor_config.json
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"do_convert_rgb": null,
|
| 3 |
+
"do_normalize": true,
|
| 4 |
+
"do_pan_and_scan": null,
|
| 5 |
+
"do_rescale": true,
|
| 6 |
+
"do_resize": true,
|
| 7 |
+
"image_mean": [
|
| 8 |
+
0.5,
|
| 9 |
+
0.5,
|
| 10 |
+
0.5
|
| 11 |
+
],
|
| 12 |
+
"image_processor_type": "Gemma3ImageProcessor",
|
| 13 |
+
"image_seq_length": 256,
|
| 14 |
+
"image_std": [
|
| 15 |
+
0.5,
|
| 16 |
+
0.5,
|
| 17 |
+
0.5
|
| 18 |
+
],
|
| 19 |
+
"pan_and_scan_max_num_crops": null,
|
| 20 |
+
"pan_and_scan_min_crop_size": null,
|
| 21 |
+
"pan_and_scan_min_ratio_to_activate": null,
|
| 22 |
+
"processor_class": "Gemma3Processor",
|
| 23 |
+
"resample": 2,
|
| 24 |
+
"rescale_factor": 0.00392156862745098,
|
| 25 |
+
"size": {
|
| 26 |
+
"height": 896,
|
| 27 |
+
"width": 896
|
| 28 |
+
}
|
| 29 |
+
}
|
processor_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"image_seq_length": 256,
|
| 3 |
+
"processor_class": "Gemma3Processor"
|
| 4 |
+
}
|
residual.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b0ea96131be74e2b699f2cb5ec4e44a1231ab94c5a2cd622bcb965822267dcb
|
| 3 |
+
size 2182961544
|
tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90a4672a51a9f582918ab48639e47c6cf053961c0bb6c6e6e32479f1ff123322
|
| 3 |
+
size 33384604
|
tokenizer_config.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|