jeffasante committed on
Commit
47a6080
·
verified ·
1 Parent(s): 3e258d0

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -50,3 +50,12 @@ gemma-4-E2B-it-int4-aggr-v2/gemma-4-E2B-it-int4-aggr-v2.cellmd filter=lfs diff=l
50
  gemma-4-E2B-it-int4-aggr-v2/gemma-4-E2B-it-int4-aggr-v2.tokenizer.json filter=lfs diff=lfs merge=lfs -text
51
  Bonsai-1.7B_v2/Bonsai-1.7B_v2.cellm filter=lfs diff=lfs merge=lfs -text
52
  lfm2.5-350m-v1/lfm2.5-350m-v1.cellm filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
50
  gemma-4-E2B-it-int4-aggr-v2/gemma-4-E2B-it-int4-aggr-v2.tokenizer.json filter=lfs diff=lfs merge=lfs -text
51
  Bonsai-1.7B_v2/Bonsai-1.7B_v2.cellm filter=lfs diff=lfs merge=lfs -text
52
  lfm2.5-350m-v1/lfm2.5-350m-v1.cellm filter=lfs diff=lfs merge=lfs -text
53
+ qwen3-0.6b-v1/qwen3-0.6b-f16-new.cellm filter=lfs diff=lfs merge=lfs -text
54
+ qwen3-0.6b-v1/qwen3-0.6b-f16.cellm filter=lfs diff=lfs merge=lfs -text
55
+ qwen3-0.6b-v1/qwen3-0.6b-int4-g128.cellm filter=lfs diff=lfs merge=lfs -text
56
+ qwen3-0.6b-v1/qwen3-0.6b-int4-g32.cellm filter=lfs diff=lfs merge=lfs -text
57
+ qwen3-0.6b-v1/qwen3-0.6b-int4.cellm filter=lfs diff=lfs merge=lfs -text
58
+ qwen3-0.6b-v1/qwen3-0.6b-int8.cellm filter=lfs diff=lfs merge=lfs -text
59
+ qwen3-0.6b-v1/qwen3-0.6b-mixed-int4.cellm filter=lfs diff=lfs merge=lfs -text
60
+ qwen3-0.6b-v1/qwen3-0.6b-test-i4.cellm filter=lfs diff=lfs merge=lfs -text
61
+ qwen3-0.6b-v1/tokenizer.json filter=lfs diff=lfs merge=lfs -text
qwen3-0.6b-v1/README.md ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Qwen3-0.6B (cellm)
2
+
3
+ Qwen3-0.6B base model converted to cellm format at various quantization levels.
4
+
5
+ This is a base (pretrained) model, not instruction-tuned. It works in text completion mode but does not follow chat templates.
6
+
7
+ ## Model details
8
+
9
+ - **Base model**: Qwen/Qwen3-0.6B
10
+ - **Architecture**: Standard transformer with grouped-query attention
11
+ - **Hidden size**: 1024
12
+ - **Attention**: 16 heads, 128 head dim, attn_dim = 2048
13
+ - **Vocab**: 151,936
14
+
15
+ ## Variants
16
+
17
+ | File | Format | Size | Quality |
18
+ |------|--------|------|---------|
19
+ | qwen3-0.6b-f16.cellm | f16 | 1.4 GB | Repetitive but on-topic |
20
+ | qwen3-0.6b-f16-new.cellm | f16 (rebuilt) | 1.4 GB | Same as qwen3-0.6b-f16.cellm (byte-identical file) |
21
+ | qwen3-0.6b-int8.cellm | int8 | 866 MB | Repetitive but on-topic |
22
+ | qwen3-0.6b-int4-g32.cellm | int4 g32 | 830 MB | Noisy, sometimes on-topic |
23
+ | qwen3-0.6b-mixed-int4.cellm | mixed int4 | 810 MB | Mostly repetitive |
24
+ | qwen3-0.6b-int4-g128.cellm | int4 g128 | 590 MB | Mostly repetitive |
25
+ | qwen3-0.6b-test-i4.cellm | int4 test | 582 MB | Fragmented |
26
+ | qwen3-0.6b-int4.cellm | int4 aggressive | 360 MB | Fragmented |
27
+
28
+ All variants share one tokenizer.json. Sizes in the table are approximate and use binary units (1 MB = 1,048,576 bytes).
29
+
30
+ ## Usage
31
+
32
+ ```sh
33
+ ./target/release/infer \
34
+ --model qwen3-0.6b-f16.cellm \
35
+ --tokenizer tokenizer.json \
36
+ --prompt "Explain what a computer is:" \
37
+ --gen 40 --temperature 0.7 --backend cpu --kv-encoding f16
38
+ ```
39
+
40
+ ## Notes
41
+
42
+ - This is a 0.6B base model. Output quality is limited across all quantizations.
43
+ - Use a temperature of 0.7 or higher to avoid repetition loops.
44
+ - f16 and int8 are the most coherent. All int4 variants are noticeably less coherent.
45
+ - For instruction-following, use Qwen3.5-0.8B instead.
46
+
47
+ ## License
48
+
49
+ Apache 2.0 (same as upstream Qwen3)
qwen3-0.6b-v1/qwen3-0.6b-f16-new.cellm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25ac1e945b9ee9b0fdf0410fcff42e8b8413194a5ef5d4aca8c46c66c60f4a4d
3
+ size 1503304448
qwen3-0.6b-v1/qwen3-0.6b-f16.cellm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25ac1e945b9ee9b0fdf0410fcff42e8b8413194a5ef5d4aca8c46c66c60f4a4d
3
+ size 1503304448
qwen3-0.6b-v1/qwen3-0.6b-int4-g128.cellm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8ef2b7838efcdcf5e094dc08d6d706a9af93923754d7a40c05dffa9bf200c2f
3
+ size 618664768
qwen3-0.6b-v1/qwen3-0.6b-int4-g32.cellm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c3c2587c542cf1771b71e10bdf022e0efe0d9b334c0a54eb952efca7ac7a2f7
3
+ size 870251520
qwen3-0.6b-v1/qwen3-0.6b-int4.cellm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb1a1f6d812c9d6fc3309982bdd2983c8bb6c3031a93498260a9ab37eba94a57
3
+ size 377274176
qwen3-0.6b-v1/qwen3-0.6b-int8.cellm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fd22eea57a3d4c3d55487c70315675231fbc9f6540cd6f91dd5fe2255e775bf
3
+ size 908336128
qwen3-0.6b-v1/qwen3-0.6b-mixed-int4.cellm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57b4b7f83b96431d78f442cb7d291f338d516c95df318b41fed8e4f11bae6ccb
3
+ size 849607424
qwen3-0.6b-v1/qwen3-0.6b-test-i4.cellm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:168d58198b103bb3cb6083b3198547ffafb9adb243eb563a0d3cadb5b9b1d16f
3
+ size 610343872
qwen3-0.6b-v1/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
3
+ size 11422654