Naruto123321 committed on
Commit
810494b
·
verified ·
1 Parent(s): aaf91f8

Upload Qwen3ForCausalLM

Browse files
Files changed (4) hide show
  1. README.md +3 -1
  2. config.json +1 -1
  3. generation_config.json +0 -1
  4. model.safetensors +1 -1
README.md CHANGED
@@ -1,6 +1,8 @@
1
  ---
2
  library_name: transformers
3
- tags: []
 
 
4
  ---
5
 
6
  # Model Card for Model ID
 
1
  ---
2
  library_name: transformers
3
+ tags:
4
+ - trl
5
+ - sft
6
  ---
7
 
8
  # Model Card for Model ID
config.json CHANGED
@@ -4,7 +4,6 @@
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
- "bos_token_id": 151643,
8
  "dtype": "float32",
9
  "eos_token_id": 151645,
10
  "head_dim": 128,
@@ -48,6 +47,7 @@
48
  "num_attention_heads": 16,
49
  "num_hidden_layers": 28,
50
  "num_key_value_heads": 8,
 
51
  "rms_norm_eps": 1e-06,
52
  "rope_scaling": null,
53
  "rope_theta": 1000000,
 
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
 
7
  "dtype": "float32",
8
  "eos_token_id": 151645,
9
  "head_dim": 128,
 
47
  "num_attention_heads": 16,
48
  "num_hidden_layers": 28,
49
  "num_key_value_heads": 8,
50
+ "pad_token_id": 151643,
51
  "rms_norm_eps": 1e-06,
52
  "rope_scaling": null,
53
  "rope_theta": 1000000,
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "bos_token_id": 151643,
3
  "do_sample": true,
4
  "eos_token_id": [
5
  151645,
 
1
  {
 
2
  "do_sample": true,
3
  "eos_token_id": [
4
  151645,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:941a2503043d05e25800d01c9dde185659a89a8577f1b4445af6c2a7f7140b7b
3
  size 2384234968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0013beb29261fb78ef2f1932eece31c07e1376794000cb11119d923330bcef1a
3
  size 2384234968