jeffasante committed on
Commit
900eccd
·
verified ·
1 Parent(s): 21ed690

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -44,3 +44,5 @@ gemma-3-1b-it-int8-v1/gemma-3-1b-it-int8-v1.cellm filter=lfs diff=lfs merge=lfs
44
  gemma-3-1b-it-int8-v1/tokenizer.json filter=lfs diff=lfs merge=lfs -text
45
  gemma-3-1b-it-mixed-int4-v1/gemma-3-1b-it-mixed-int4-v1.cellm filter=lfs diff=lfs merge=lfs -text
46
  smollm2-360m-int8-v1/smollm2-360m-int8-v1.cellm filter=lfs diff=lfs merge=lfs -text
 
 
 
44
  gemma-3-1b-it-int8-v1/tokenizer.json filter=lfs diff=lfs merge=lfs -text
45
  gemma-3-1b-it-mixed-int4-v1/gemma-3-1b-it-mixed-int4-v1.cellm filter=lfs diff=lfs merge=lfs -text
46
  smollm2-360m-int8-v1/smollm2-360m-int8-v1.cellm filter=lfs diff=lfs merge=lfs -text
47
+ gemma-4-E2B-it-int4-aggr-v5/gemma-4-E2B-it-int4-aggr-v5.cellmd filter=lfs diff=lfs merge=lfs -text
48
+ gemma-4-E2B-it-int4-aggr-v5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
gemma-4-E2B-it-int4-aggr-v5/README.md ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # gemma-4-E2B-it-int4-aggr-v5 (cellm)
2
+
3
+ ## Files
4
+
5
+ - `gemma-4-E2B-it-int4-aggr-v5.cellmd` (~3.6 GB / 3.3 GiB)
6
+ - `tokenizer.json`
7
+ - `tokenizer_config.json`
8
+
9
+ ## Run (CPU)
10
+
11
+ ```bash
12
+ cd /cellm
13
+ ./target/release/infer \
14
+ --model models/to-huggingface/gemma-4-E2B-it-int4-aggr-v5/gemma-4-E2B-it-int4-aggr-v5.cellmd \
15
+ --tokenizer models/to-huggingface/gemma-4-E2B-it-int4-aggr-v5/tokenizer.json \
16
+ --prompt "What is consciousness?" \
17
+ --chat --chat-format auto \
18
+ --gen 48 \
19
+ --temperature 0 \
20
+ --backend cpu \
21
+ --kv-encoding f16
22
+ ```
23
+
24
+ ## Run (Metal)
25
+
26
+ ```bash
27
+ cd /cellm
28
+ ./target/release/infer \
29
+ --model models/to-huggingface/gemma-4-E2B-it-int4-aggr-v5/gemma-4-E2B-it-int4-aggr-v5.cellmd \
30
+ --tokenizer models/to-huggingface/gemma-4-E2B-it-int4-aggr-v5/tokenizer.json \
31
+ --prompt "What is consciousness?" \
32
+ --chat --chat-format auto \
33
+ --gen 48 \
34
+ --temperature 0 \
35
+ --backend metal \
36
+ --kv-encoding turboquant
37
+ ```
gemma-4-E2B-it-int4-aggr-v5/gemma-4-E2B-it-int4-aggr-v5.cellmd ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e54cf219d4da3c50efe03f10841b0bac572b164ab1c61020d9fa6143ab11b90a
3
+ size 3591368768
gemma-4-E2B-it-int4-aggr-v5/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc8d3a0ce36466ccc1278bf987df5f71db1719b9ca6b4118264f45cb627bfe0f
3
+ size 32169626
gemma-4-E2B-it-int4-aggr-v5/tokenizer_config.json ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio_token": "<|audio|>",
3
+ "backend": "tokenizers",
4
+ "boa_token": "<|audio>",
5
+ "boi_token": "<|image>",
6
+ "bos_token": "<bos>",
7
+ "eoa_token": "<audio|>",
8
+ "eoc_token": "<channel|>",
9
+ "eoi_token": "<image|>",
10
+ "eos_token": "<eos>",
11
+ "eot_token": "<turn|>",
12
+ "escape_token": "<|\"|>",
13
+ "etc_token": "<tool_call|>",
14
+ "etd_token": "<tool|>",
15
+ "etr_token": "<tool_response|>",
16
+ "extra_special_tokens": [
17
+ "<|video|>"
18
+ ],
19
+ "image_token": "<|image|>",
20
+ "mask_token": "<mask>",
21
+ "model_max_length": 1000000000000000019884624838656,
22
+ "pad_token": "<pad>",
23
+ "padding_side": "left",
24
+ "processor_class": "Gemma4Processor",
25
+ "response_schema": {
26
+ "type": "object",
27
+ "properties": {
28
+ "role": {
29
+ "const": "assistant"
30
+ },
31
+ "thinking": {
32
+ "type": "string"
33
+ },
34
+ "content": {
35
+ "type": "string"
36
+ },
37
+ "tool_calls": {
38
+ "x-regex-iterator": "<\\|tool_call>(.*?)<tool_call\\|>",
39
+ "type": "array",
40
+ "items": {
41
+ "type": "object",
42
+ "properties": {
43
+ "type": {
44
+ "const": "function"
45
+ },
46
+ "function": {
47
+ "type": "object",
48
+ "x-regex": "call\\:(?P<name>\\w+)(?P<arguments>\\{.*\\})",
49
+ "properties": {
50
+ "name": {
51
+ "type": "string"
52
+ },
53
+ "arguments": {
54
+ "type": "object",
55
+ "x-parser": "gemma4-tool-call",
56
+ "additionalProperties": {}
57
+ }
58
+ }
59
+ }
60
+ }
61
+ }
62
+ }
63
+ },
64
+ "x-regex": "(\\<\\|channel\\>thought\\n(?P<thinking>.*?)\\<channel\\|\\>)?(?P<content>(?:(?!\\<\\|tool_call\\>)(?!\\<turn\\|\\>).)+)?(?P<tool_calls>\\<\\|tool_call\\>.*\\<tool_call\\|\\>)?(?:\\<turn\\|\\>)?"
65
+ },
66
+ "soc_token": "<|channel>",
67
+ "sot_token": "<|turn>",
68
+ "stc_token": "<|tool_call>",
69
+ "std_token": "<|tool>",
70
+ "str_token": "<|tool_response>",
71
+ "think_token": "<|think|>",
72
+ "tokenizer_class": "GemmaTokenizer",
73
+ "unk_token": "<unk>"
74
+ }