Death-Raider committed on
Commit
3cae727
·
verified ·
1 Parent(s): 9997581

model updated

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: QwenModel_dpo
5
  tags:
6
  - generated_from_trainer
7
- - dpo
8
  - trl
 
9
  licence: license
10
  ---
11
 
@@ -35,10 +35,10 @@ This model was trained with DPO, a method introduced in [Direct Preference Optim
35
  ### Framework versions
36
 
37
  - TRL: 0.23.0
38
- - Transformers: 4.56.1
39
  - Pytorch: 2.8.0.dev20250319+cu128
40
  - Datasets: 4.1.1
41
- - Tokenizers: 0.22.0
42
 
43
  ## Citations
44
 
 
4
  model_name: QwenModel_dpo
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - dpo
9
  licence: license
10
  ---
11
 
 
35
  ### Framework versions
36
 
37
  - TRL: 0.23.0
38
+ - Transformers: 4.56.2
39
  - Pytorch: 2.8.0.dev20250319+cu128
40
  - Datasets: 4.1.1
41
+ - Tokenizers: 0.22.1
42
 
43
  ## Citations
44
 
config.json CHANGED
@@ -51,7 +51,7 @@
51
  "rope_theta": 1000000.0,
52
  "sliding_window": null,
53
  "tie_word_embeddings": false,
54
- "transformers_version": "4.56.1",
55
  "use_cache": true,
56
  "use_sliding_window": false,
57
  "vocab_size": 152064
 
51
  "rope_theta": 1000000.0,
52
  "sliding_window": null,
53
  "tie_word_embeddings": false,
54
+ "transformers_version": "4.56.2",
55
  "use_cache": true,
56
  "use_sliding_window": false,
57
  "vocab_size": 152064
generation_config.json CHANGED
@@ -9,5 +9,5 @@
9
  "temperature": 0.7,
10
  "top_k": 20,
11
  "top_p": 0.8,
12
- "transformers_version": "4.56.1"
13
  }
 
9
  "temperature": 0.7,
10
  "top_k": 20,
11
  "top_p": 0.8,
12
+ "transformers_version": "4.56.2"
13
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24b5f36e5c538c00a414ab69e74b700d0fb9241c1973a18125c89d19d7df9b3c
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adc6d07800dbb954f5ee36b7257cbc2a2aa526161b8940cd818cec0920b3369d
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d41fcfca9a56b6a7ad97f5edec9659d38d6b764520ad8cb405405dcb469b2b0a
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b49f291cf1ca115dcb845b8f293aaeda0001486cf56fcf75eaa5559c50d34d0a
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1380dce938198543506c39ef9445fee48030877ff39023c99133832e9804859
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d16e5c4f0e0ebd005dda6ec5ccee73510662e7145ec6c1699eed1045e7ccbec
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd70e777116decbccca81e84c28955490f3c9c2817c9f61e0c21de09efae97eb
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62b045376cd6363b450a3bc3d37c90942f8c226f3fd60c4d660521c132b97b32
3
  size 1089994880
special_tokens_map.json CHANGED
@@ -21,11 +21,5 @@
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
- "pad_token": {
25
- "content": "<|endoftext|>",
26
- "lstrip": false,
27
- "normalized": false,
28
- "rstrip": false,
29
- "single_word": false
30
- }
31
  }
 
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
+ "pad_token": "<|im_end|>"
 
 
 
 
 
 
25
  }
tokenizer_config.json CHANGED
@@ -200,7 +200,7 @@
200
  "errors": "replace",
201
  "extra_special_tokens": {},
202
  "model_max_length": 131072,
203
- "pad_token": "<|endoftext|>",
204
  "padding_side": "right",
205
  "split_special_tokens": false,
206
  "tokenizer_class": "Qwen2Tokenizer",
 
200
  "errors": "replace",
201
  "extra_special_tokens": {},
202
  "model_max_length": 131072,
203
+ "pad_token": "<|im_end|>",
204
  "padding_side": "right",
205
  "split_special_tokens": false,
206
  "tokenizer_class": "Qwen2Tokenizer",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfe6254b4b821c430481204db5415dedc784d6dad7cf725a918df7e847d0f1a6
3
  size 6801
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12122b9fdc78225f20c28a9cffc0e46a45aa91a2facc7e5e3735f047f27247a4
3
  size 6801