zzman committed on
Commit
9843cbe
·
verified ·
1 Parent(s): 1450a61

zzman/QWEN2.1-0.5-SFT

Browse files
README.md CHANGED
@@ -34,10 +34,10 @@ This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.15.2
38
- - Transformers: 4.49.0
39
  - Pytorch: 2.6.0+cu124
40
- - Datasets: 3.4.1
41
  - Tokenizers: 0.21.1
42
 
43
  ## Citations
 
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.16.0
38
+ - Transformers: 4.50.0
39
  - Pytorch: 2.6.0+cu124
40
+ - Datasets: 3.5.0
41
  - Tokenizers: 0.21.1
42
 
43
  ## Citations
config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_name_or_path": "Qwen/Qwen2.5-0.5B-Instruct",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
@@ -22,7 +21,7 @@
22
  "sliding_window": 32768,
23
  "tie_word_embeddings": true,
24
  "torch_dtype": "bfloat16",
25
- "transformers_version": "4.49.0",
26
  "use_cache": true,
27
  "use_sliding_window": false,
28
  "vocab_size": 151936
 
1
  {
 
2
  "architectures": [
3
  "Qwen2ForCausalLM"
4
  ],
 
21
  "sliding_window": 32768,
22
  "tie_word_embeddings": true,
23
  "torch_dtype": "bfloat16",
24
+ "transformers_version": "4.50.0",
25
  "use_cache": true,
26
  "use_sliding_window": false,
27
  "vocab_size": 151936
generation_config.json CHANGED
@@ -10,5 +10,5 @@
10
  "temperature": 0.7,
11
  "top_k": 20,
12
  "top_p": 0.8,
13
- "transformers_version": "4.49.0"
14
  }
 
10
  "temperature": 0.7,
11
  "top_k": 20,
12
  "top_p": 0.8,
13
+ "transformers_version": "4.50.0"
14
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8bd2f69716a38d0c83f47ddc6abb0f256deee9d4da231ae8aee0ede230d8a85a
3
  size 988097824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49618884170f0f734a09aece2e47c0d3320fa1b21bd299b86747ba6fb2c046af
3
  size 988097824
tokenizer_config.json CHANGED
@@ -202,7 +202,6 @@
202
  "extra_special_tokens": {},
203
  "model_max_length": 131072,
204
  "pad_token": "<|endoftext|>",
205
- "padding_side": "right",
206
  "split_special_tokens": false,
207
  "tokenizer_class": "Qwen2Tokenizer",
208
  "unk_token": null
 
202
  "extra_special_tokens": {},
203
  "model_max_length": 131072,
204
  "pad_token": "<|endoftext|>",
 
205
  "split_special_tokens": false,
206
  "tokenizer_class": "Qwen2Tokenizer",
207
  "unk_token": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37f618eb0b738d870d555a233ea8422b57aaf99c5d09f24494909f8140affb26
3
- size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b94f36f06c24f4116c23dbc193373bc5f0e13595a32449365770e7102007b86
3
+ size 5624