tomzhou10010 committed on
Commit
634b237
·
verified ·
1 Parent(s): 5e84cab

Release 3x-0.5B-Chat (standard HF interface, no trust_remote_code needed)

Browse files
config.json CHANGED
@@ -37,6 +37,7 @@
37
  "full_attention"
38
  ],
39
  "max_position_embeddings": 32768,
 
40
  "model_type": "threex2",
41
  "num_attention_heads": 16,
42
  "num_hidden_layers": 24,
@@ -44,12 +45,12 @@
44
  "pad_token_id": 151645,
45
  "rms_norm_eps": 1e-06,
46
  "rope_parameters": {
47
- "rope_theta": 10000.0,
48
  "rope_type": "default"
49
  },
50
- "rope_theta": 10000.0,
51
- "sliding_window": null,
52
- "tie_word_embeddings": false,
53
  "transformers_version": "5.2.0",
54
  "use_cache": true,
55
  "use_sliding_window": false,
 
37
  "full_attention"
38
  ],
39
  "max_position_embeddings": 32768,
40
+ "max_window_layers": 21,
41
  "model_type": "threex2",
42
  "num_attention_heads": 16,
43
  "num_hidden_layers": 24,
 
45
  "pad_token_id": 151645,
46
  "rms_norm_eps": 1e-06,
47
  "rope_parameters": {
48
+ "rope_theta": 1000000.0,
49
  "rope_type": "default"
50
  },
51
+ "rope_theta": 1000000.0,
52
+ "sliding_window": 32768,
53
+ "tie_word_embeddings": true,
54
  "transformers_version": "5.2.0",
55
  "use_cache": true,
56
  "use_sliding_window": false,
generation_config.json CHANGED
@@ -1,10 +1,12 @@
1
  {
2
- "_from_model_config": true,
3
  "bos_token_id": 151643,
4
- "eos_token_id": 151645,
5
- "output_attentions": false,
6
- "output_hidden_states": false,
7
- "pad_token_id": 151645,
8
- "transformers_version": "5.2.0",
9
- "use_cache": true
 
 
 
10
  }
 
1
  {
 
2
  "bos_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "pad_token_id": 151643,
9
+ "repetition_penalty": 1.1,
10
+ "top_p": 0.8,
11
+ "transformers_version": "5.2.0"
12
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:840b3fe9d6ebf7926947f2c0d4fa841c61b66359ce1c8f4b968c026f43d639e4
3
- size 2478313760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a7cc9681a0a7c1d4640ee1296d10045ce3b4000a98d751f35eb5abc3a2d40d3
3
+ size 1855983640
tokenizer_config.json CHANGED
@@ -14,7 +14,5 @@
14
  "pad_token": "<|endoftext|>",
15
  "split_special_tokens": false,
16
  "tokenizer_class": "Qwen2Tokenizer",
17
- "unk_token": null,
18
- "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\\nYou are a helpful assistant.<|im_end|>\\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\\n' + message['content'] + '<|im_end|>' + '\\n'}}{% endfor %}{{ '<|im_start|>assistant\\n' }}",
19
- "model_type": "threex"
20
- }
 
14
  "pad_token": "<|endoftext|>",
15
  "split_special_tokens": false,
16
  "tokenizer_class": "Qwen2Tokenizer",
17
+ "unk_token": null
18
+ }