EricB HF Staff committed on
Commit
d534299
·
verified ·
1 Parent(s): efde00d

Upload model

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ gemma3-4b-it-afq2-0.uqff filter=lfs diff=lfs merge=lfs -text
37
+ gemma3-4b-it-afq3-0.uqff filter=lfs diff=lfs merge=lfs -text
38
+ gemma3-4b-it-afq4-0.uqff filter=lfs diff=lfs merge=lfs -text
39
+ gemma3-4b-it-afq6-0.uqff filter=lfs diff=lfs merge=lfs -text
40
+ gemma3-4b-it-afq8-0.uqff filter=lfs diff=lfs merge=lfs -text
41
+ gemma3-4b-it-f8e4m3-0.uqff filter=lfs diff=lfs merge=lfs -text
42
+ gemma3-4b-it-q2k-0.uqff filter=lfs diff=lfs merge=lfs -text
43
+ gemma3-4b-it-q3k-0.uqff filter=lfs diff=lfs merge=lfs -text
44
+ gemma3-4b-it-q4k-0.uqff filter=lfs diff=lfs merge=lfs -text
45
+ gemma3-4b-it-q5k-0.uqff filter=lfs diff=lfs merge=lfs -text
46
+ gemma3-4b-it-q8_0-0.uqff filter=lfs diff=lfs merge=lfs -text
47
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - uqff
4
+ - mistral.rs
5
+ base_model: google/gemma-3-4b-it
6
+ base_model_relation: quantized
7
+ ---
8
+
9
+ <!-- Autogenerated from user input. -->
10
+
11
+ # `google/gemma-3-4b-it`, UQFF quantization
12
+
13
+
14
+ Run with [mistral.rs](https://github.com/EricLBuehler/mistral.rs). Documentation: [UQFF docs](https://github.com/EricLBuehler/mistral.rs/blob/master/docs/UQFF.md).
15
+
16
+ 1) **Flexible** 🌀: Multiple quantization formats in *one* file format with *one* framework to run them all.
17
+ 2) **Reliable** 🔒: Compatibility ensured with *embedded* and *checked* semantic versioning information from day 1.
18
+ 3) **Easy** 🤗: Download UQFF models *easily* and *quickly* from Hugging Face, or use a local file.
19
+ 4) **Customizable** 🛠️: Make and publish your own UQFF files in minutes.
20
+
21
+ ## Examples
22
+ |Quantization type(s)|Example|
23
+ |--|--|
24
+ |AFQ2|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq2-0.uqff`|
25
+ |AFQ3|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq3-0.uqff`|
26
+ |AFQ4|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq4-0.uqff`|
27
+ |AFQ6|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq6-0.uqff`|
28
+ |AFQ8|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-afq8-0.uqff`|
29
+ |F8E4M3|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-f8e4m3-0.uqff`|
30
+ |Q2K|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q2k-0.uqff`|
31
+ |Q3K|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q3k-0.uqff`|
32
+ |Q4K|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q4k-0.uqff`|
33
+ |Q5K|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q5k-0.uqff`|
34
+ |Q8_0|`./mistralrs-server -i vision-plain -m EricB/gemma-3-4b-it-UQFF -f gemma3-4b-it-q8_0-0.uqff`|
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Gemma3ForConditionalGeneration"
4
+ ],
5
+ "boi_token_index": 255999,
6
+ "eoi_token_index": 256000,
7
+ "eos_token_id": [
8
+ 1,
9
+ 106
10
+ ],
11
+ "image_token_index": 262144,
12
+ "initializer_range": 0.02,
13
+ "mm_tokens_per_image": 256,
14
+ "model_type": "gemma3",
15
+ "text_config": {
16
+ "hidden_size": 2560,
17
+ "intermediate_size": 10240,
18
+ "model_type": "gemma3_text",
19
+ "num_hidden_layers": 34,
20
+ "rope_scaling": {
21
+ "factor": 8.0,
22
+ "rope_type": "linear"
23
+ },
24
+ "sliding_window": 1024
25
+ },
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.50.0.dev0",
28
+ "vision_config": {
29
+ "hidden_size": 1152,
30
+ "image_size": 896,
31
+ "intermediate_size": 4304,
32
+ "model_type": "siglip_vision_model",
33
+ "num_attention_heads": 16,
34
+ "num_hidden_layers": 27,
35
+ "patch_size": 14,
36
+ "vision_use_head": false
37
+ }
38
+ }
gemma3-4b-it-afq2-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fd4da935e4a4643265e4a2faa69a5beda8fbe043646ee4414f83235f5177ea4
3
+ size 1212501540
gemma3-4b-it-afq3-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eda4c491c5b28fc15f99b2d855c25254f12ab6d360750e148b9e1e3b7a2f516
3
+ size 1697488724
gemma3-4b-it-afq4-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75ec12d5c4ce731a259245a3978e5caa1ab482160311f3fa321b14a6df3c53c1
3
+ size 2182475684
gemma3-4b-it-afq6-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:398aeedf5048fc3ac09210ba3cc1120766fcd33edcf99cf85757b81d38a795f3
3
+ size 3152449524
gemma3-4b-it-afq8-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1749869931a1d89294655bb95fac86358a3a978835593798d0b77d2573f03090
3
+ size 4122423324
gemma3-4b-it-f8e4m3-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d94e158247d6a4d4f70785d2e864653cc66ba78febe2cfc308234478c65642a
3
+ size 3879923662
gemma3-4b-it-q2k-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa7485733a89779463dd130963da9a182ed0e048e0b0e5170fdbbcc02ae3a5a0
3
+ size 1273114886
gemma3-4b-it-q3k-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b07b1e98d893331ac077e409240faa2cc54f13247c69972e518392e1f88efad4
3
+ size 1667167006
gemma3-4b-it-q4k-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3e3af19315a00229b6b4aeca1b7b1db061127575a360a79e38e097987b9e77
3
+ size 2182465646
gemma3-4b-it-q5k-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be6e3e7eceeb9ed1133f31e0b768cab3ac2235423ae760355103444acf7cb3ea
3
+ size 2667452574
gemma3-4b-it-q8_0-0.uqff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fee927648a2e8d1f2d6059867d24edd342735dffc65ad343e3eac084d8bf8647
3
+ size 4122413286
generation_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 2,
3
+ "cache_implementation": "hybrid",
4
+ "do_sample": true,
5
+ "eos_token_id": [
6
+ 1,
7
+ 106
8
+ ],
9
+ "pad_token_id": 0,
10
+ "top_k": 64,
11
+ "top_p": 0.95,
12
+ "transformers_version": "4.50.0.dev0"
13
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_pan_and_scan": null,
5
+ "do_rescale": true,
6
+ "do_resize": true,
7
+ "image_mean": [
8
+ 0.5,
9
+ 0.5,
10
+ 0.5
11
+ ],
12
+ "image_processor_type": "Gemma3ImageProcessor",
13
+ "image_seq_length": 256,
14
+ "image_std": [
15
+ 0.5,
16
+ 0.5,
17
+ 0.5
18
+ ],
19
+ "pan_and_scan_max_num_crops": null,
20
+ "pan_and_scan_min_crop_size": null,
21
+ "pan_and_scan_min_ratio_to_activate": null,
22
+ "processor_class": "Gemma3Processor",
23
+ "resample": 2,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "height": 896,
27
+ "width": 896
28
+ }
29
+ }
processor_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "image_seq_length": 256,
3
+ "processor_class": "Gemma3Processor"
4
+ }
residual.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b0ea96131be74e2b699f2cb5ec4e44a1231ab94c5a2cd622bcb965822267dcb
3
+ size 2182961544
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90a4672a51a9f582918ab48639e47c6cf053961c0bb6c6e6e32479f1ff123322
3
+ size 33384604
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff