Explyt committed on
Commit
2347d3b
·
verified ·
1 Parent(s): c917108

Add files using upload-large-folder tool

Browse files
config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name_or_path": "tclf90/Qwen3-Coder-480B-A35B-Instruct-AWQ",
3
+ "architectures": [
4
+ "Qwen3MoeForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "decoder_sparse_step": 1,
9
+ "eos_token_id": 151645,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 6144,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 8192,
15
+ "max_position_embeddings": 262144,
16
+ "max_window_layers": 62,
17
+ "mlp_only_layers": [],
18
+ "model_type": "qwen3_moe",
19
+ "moe_intermediate_size": 2560,
20
+ "norm_topk_prob": true,
21
+ "num_attention_heads": 96,
22
+ "num_experts": 160,
23
+ "num_experts_per_tok": 8,
24
+ "num_hidden_layers": 62,
25
+ "num_key_value_heads": 8,
26
+ "output_router_logits": false,
27
+ "qkv_bias": false,
28
+ "rms_norm_eps": 1e-06,
29
+ "rope_scaling": null,
30
+ "rope_theta": 10000000,
31
+ "router_aux_loss_coef": 0.0,
32
+ "shared_expert_intermediate_size": 0,
33
+ "sliding_window": null,
34
+ "tie_word_embeddings": false,
35
+ "torch_dtype": "float16",
36
+ "transformers_version": "4.51.0",
37
+ "use_cache": true,
38
+ "use_qk_norm": true,
39
+ "use_sliding_window": false,
40
+ "vocab_size": 151936,
41
+ "quantization_config": {
42
+ "quant_method": "awq",
43
+ "bits": 4,
44
+ "group_size": 128,
45
+ "version": "gemm",
46
+ "zero_point": true,
47
+ "modules_to_not_convert": [".mlp.gate"]
48
+ }
49
+ }
generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "pad_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "repetition_penalty": 1.05,
9
+ "temperature": 0.7,
10
+ "top_p": 0.8,
11
+ "top_k": 20
12
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00002-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38d06568f8a1a3e9eb9aac6806f36f5df05e2db0d10cf1db44d49dc28e1f3a1e
3
+ size 5000025136
model-00005-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6554d7098a31868fd7d7dda0f5b559ebedd8c3d3c6ab13da13a1fced6a566eb7
3
+ size 4998280000
model-00011-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b738181e7db8e3df923e0910807f75cf6123d0c56c98880cb3d6f60aa754804a
3
+ size 4995355240
model-00014-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00177b7ab83afb7614efff38569247187842c0dcb0abc1684eeba28e0316f8f1
3
+ size 4998294304
model-00015-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5f63a5bbac480bfd320c4384b10256481c5f623dcccfe6596736f9a9bdf2c32
3
+ size 4977378288
model-00019-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9c5896f15877ac4d0fe3bec0c9714a7bb34fad80afb8e719e4e0b611ac2cd2c
3
+ size 4995355256
model-00021-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1a609ab99c5686a9657d92502dd6accce05575c96e01e73848e144d0967c56a
3
+ size 4998281664
model-00024-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:602b5d6c280288f6090c7c80179ec003efe0e22816ffeceba46b4553eef19f8e
3
+ size 4998281520
model-00025-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:500476466ab0dd024ba7feeb42de2ad942395213c342289a8cc2760c765bd97e
3
+ size 4998281632
model-00029-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19fef4e0bbbaddee4d34cacf7ff71a6d9b4bffc2e3f34d58841544bd10f7b714
3
+ size 4998281712
model-00030-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe5e7a8b2c312fd0e506aa0d9e1ba41669e6a72092ef4b370332582d46151459
3
+ size 4998294200
model-00033-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74552e6261a416dee6b3dcd0e55799f2079d569247c159522410993d3cc5a2a7
3
+ size 4998281688
model-00034-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11c3d7ef47e5fe582b37c7965d4551e92608e7a21ed90598fdc0b1cca1ce82de
3
+ size 4998294200
model-00036-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5b0a76956421e64b78380696929551833e41706a456fa21cb54e7c20a071572
3
+ size 4998281520
model-00038-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e285f65c066b046319281d1c1b4759478bf64be4aff58b508f9fd3ba5f66eb4
3
+ size 4998281896
model-00047-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31999fd22a9c3d87693eb9de49b5850aadbf1dfd08c1879f019ec9862b1a5068
3
+ size 4995355432
model-00051-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59c22d8de7bcd7025539d91b21b03bc5d181599af0dc21d7b77402dd56a9f8a9
3
+ size 2457368880