waddie committed on
Commit
b2c30f2
·
verified ·
1 Parent(s): c8c9e17

Upload Qwen3_5ForCausalLM

Browse files
Files changed (3) hide show
  1. README.md +3 -1
  2. config.json +2 -2
  3. generation_config.json +5 -1
README.md CHANGED
@@ -1,6 +1,8 @@
1
  ---
2
  library_name: transformers
3
- tags: []
 
 
4
  ---
5
 
6
  # Model Card for Model ID
 
1
  ---
2
  library_name: transformers
3
+ tags:
4
+ - trl
5
+ - sft
6
  ---
7
 
8
  # Model Card for Model ID
config.json CHANGED
@@ -7,7 +7,7 @@
7
  "attn_output_gate": true,
8
  "bos_token_id": null,
9
  "dtype": "bfloat16",
10
- "eos_token_id": 248044,
11
  "full_attention_interval": 4,
12
  "head_dim": 256,
13
  "hidden_act": "silu",
@@ -78,6 +78,6 @@
78
  },
79
  "tie_word_embeddings": false,
80
  "transformers_version": "5.6.2",
81
- "use_cache": true,
82
  "vocab_size": 248320
83
  }
 
7
  "attn_output_gate": true,
8
  "bos_token_id": null,
9
  "dtype": "bfloat16",
10
+ "eos_token_id": 248046,
11
  "full_attention_interval": 4,
12
  "head_dim": 256,
13
  "hidden_act": "silu",
 
78
  },
79
  "tie_word_embeddings": false,
80
  "transformers_version": "5.6.2",
81
+ "use_cache": false,
82
  "vocab_size": 248320
83
  }
generation_config.json CHANGED
@@ -1,6 +1,10 @@
1
  {
2
  "_from_model_config": true,
3
- "eos_token_id": 248044,
 
 
 
 
4
  "transformers_version": "5.6.2",
5
  "use_cache": true
6
  }
 
1
  {
2
  "_from_model_config": true,
3
+ "eos_token_id": [
4
+ 248046,
5
+ 248044
6
+ ],
7
+ "pad_token_id": 248055,
8
  "transformers_version": "5.6.2",
9
  "use_cache": true
10
  }