Add files using upload-large-folder tool
Browse files- config.json +49 -0
- generation_config.json +12 -0
- merges.txt +0 -0
- model-00002-of-00051.safetensors +3 -0
- model-00005-of-00051.safetensors +3 -0
- model-00011-of-00051.safetensors +3 -0
- model-00014-of-00051.safetensors +3 -0
- model-00015-of-00051.safetensors +3 -0
- model-00019-of-00051.safetensors +3 -0
- model-00021-of-00051.safetensors +3 -0
- model-00024-of-00051.safetensors +3 -0
- model-00025-of-00051.safetensors +3 -0
- model-00029-of-00051.safetensors +3 -0
- model-00030-of-00051.safetensors +3 -0
- model-00033-of-00051.safetensors +3 -0
- model-00034-of-00051.safetensors +3 -0
- model-00036-of-00051.safetensors +3 -0
- model-00038-of-00051.safetensors +3 -0
- model-00047-of-00051.safetensors +3 -0
- model-00051-of-00051.safetensors +3 -0
config.json
ADDED
|
@@ -0,0 +1,49 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name_or_path": "tclf90/Qwen3-Coder-480B-A35B-Instruct-AWQ",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"Qwen3MoeForCausalLM"
|
| 5 |
+
],
|
| 6 |
+
"attention_bias": false,
|
| 7 |
+
"attention_dropout": 0.0,
|
| 8 |
+
"decoder_sparse_step": 1,
|
| 9 |
+
"eos_token_id": 151645,
|
| 10 |
+
"head_dim": 128,
|
| 11 |
+
"hidden_act": "silu",
|
| 12 |
+
"hidden_size": 6144,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 8192,
|
| 15 |
+
"max_position_embeddings": 262144,
|
| 16 |
+
"max_window_layers": 62,
|
| 17 |
+
"mlp_only_layers": [],
|
| 18 |
+
"model_type": "qwen3_moe",
|
| 19 |
+
"moe_intermediate_size": 2560,
|
| 20 |
+
"norm_topk_prob": true,
|
| 21 |
+
"num_attention_heads": 96,
|
| 22 |
+
"num_experts": 160,
|
| 23 |
+
"num_experts_per_tok": 8,
|
| 24 |
+
"num_hidden_layers": 62,
|
| 25 |
+
"num_key_value_heads": 8,
|
| 26 |
+
"output_router_logits": false,
|
| 27 |
+
"qkv_bias": false,
|
| 28 |
+
"rms_norm_eps": 1e-06,
|
| 29 |
+
"rope_scaling": null,
|
| 30 |
+
"rope_theta": 10000000,
|
| 31 |
+
"router_aux_loss_coef": 0.0,
|
| 32 |
+
"shared_expert_intermediate_size": 0,
|
| 33 |
+
"sliding_window": null,
|
| 34 |
+
"tie_word_embeddings": false,
|
| 35 |
+
"torch_dtype": "float16",
|
| 36 |
+
"transformers_version": "4.51.0",
|
| 37 |
+
"use_cache": true,
|
| 38 |
+
"use_qk_norm": true,
|
| 39 |
+
"use_sliding_window": false,
|
| 40 |
+
"vocab_size": 151936,
|
| 41 |
+
"quantization_config": {
|
| 42 |
+
"quant_method": "awq",
|
| 43 |
+
"bits": 4,
|
| 44 |
+
"group_size": 128,
|
| 45 |
+
"version": "gemm",
|
| 46 |
+
"zero_point": true,
|
| 47 |
+
"modules_to_not_convert": [".mlp.gate"]
|
| 48 |
+
}
|
| 49 |
+
}
|
generation_config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"pad_token_id": 151643,
|
| 3 |
+
"do_sample": true,
|
| 4 |
+
"eos_token_id": [
|
| 5 |
+
151645,
|
| 6 |
+
151643
|
| 7 |
+
],
|
| 8 |
+
"repetition_penalty": 1.05,
|
| 9 |
+
"temperature": 0.7,
|
| 10 |
+
"top_p": 0.8,
|
| 11 |
+
"top_k": 20
|
| 12 |
+
}
|
merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
model-00002-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38d06568f8a1a3e9eb9aac6806f36f5df05e2db0d10cf1db44d49dc28e1f3a1e
|
| 3 |
+
size 5000025136
|
model-00005-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6554d7098a31868fd7d7dda0f5b559ebedd8c3d3c6ab13da13a1fced6a566eb7
|
| 3 |
+
size 4998280000
|
model-00011-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b738181e7db8e3df923e0910807f75cf6123d0c56c98880cb3d6f60aa754804a
|
| 3 |
+
size 4995355240
|
model-00014-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:00177b7ab83afb7614efff38569247187842c0dcb0abc1684eeba28e0316f8f1
|
| 3 |
+
size 4998294304
|
model-00015-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5f63a5bbac480bfd320c4384b10256481c5f623dcccfe6596736f9a9bdf2c32
|
| 3 |
+
size 4977378288
|
model-00019-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9c5896f15877ac4d0fe3bec0c9714a7bb34fad80afb8e719e4e0b611ac2cd2c
|
| 3 |
+
size 4995355256
|
model-00021-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1a609ab99c5686a9657d92502dd6accce05575c96e01e73848e144d0967c56a
|
| 3 |
+
size 4998281664
|
model-00024-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:602b5d6c280288f6090c7c80179ec003efe0e22816ffeceba46b4553eef19f8e
|
| 3 |
+
size 4998281520
|
model-00025-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:500476466ab0dd024ba7feeb42de2ad942395213c342289a8cc2760c765bd97e
|
| 3 |
+
size 4998281632
|
model-00029-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19fef4e0bbbaddee4d34cacf7ff71a6d9b4bffc2e3f34d58841544bd10f7b714
|
| 3 |
+
size 4998281712
|
model-00030-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe5e7a8b2c312fd0e506aa0d9e1ba41669e6a72092ef4b370332582d46151459
|
| 3 |
+
size 4998294200
|
model-00033-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74552e6261a416dee6b3dcd0e55799f2079d569247c159522410993d3cc5a2a7
|
| 3 |
+
size 4998281688
|
model-00034-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11c3d7ef47e5fe582b37c7965d4551e92608e7a21ed90598fdc0b1cca1ce82de
|
| 3 |
+
size 4998294200
|
model-00036-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5b0a76956421e64b78380696929551833e41706a456fa21cb54e7c20a071572
|
| 3 |
+
size 4998281520
|
model-00038-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e285f65c066b046319281d1c1b4759478bf64be4aff58b508f9fd3ba5f66eb4
|
| 3 |
+
size 4998281896
|
model-00047-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31999fd22a9c3d87693eb9de49b5850aadbf1dfd08c1879f019ec9862b1a5068
|
| 3 |
+
size 4995355432
|
model-00051-of-00051.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59c22d8de7bcd7025539d91b21b03bc5d181599af0dc21d7b77402dd56a9f8a9
|
| 3 |
+
size 2457368880
|