Jlonge4 committed on
Commit
5fff7f8
·
verified ·
1 Parent(s): 8f7565e

End of training

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: outputs
5
  tags:
6
  - generated_from_trainer
7
- - grpo
8
  - trl
 
9
  licence: license
10
  ---
11
 
@@ -34,9 +34,9 @@ This model was trained with GRPO, a method introduced in [DeepSeekMath: Pushing
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.23.1
38
- - Transformers: 4.56.2
39
- - Pytorch: 2.8.0+cu129
40
  - Datasets: 4.1.1
41
  - Tokenizers: 0.22.1
42
 
 
4
  model_name: outputs
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - grpo
9
  licence: license
10
  ---
11
 
 
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.24.0
38
+ - Transformers: 4.57.0
39
+ - Pytorch: 2.8.0+cu126
40
  - Datasets: 4.1.1
41
  - Tokenizers: 0.22.1
42
 
adapter_config.json CHANGED
@@ -21,14 +21,14 @@
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
  "qalora_group_size": 16,
24
- "r": 16,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "k_proj",
29
- "v_proj",
30
  "o_proj",
31
- "q_proj"
 
 
32
  ],
33
  "target_parameters": null,
34
  "task_type": "CAUSAL_LM",
 
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
  "qalora_group_size": 16,
24
+ "r": 32,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
 
28
  "o_proj",
29
+ "down_proj",
30
+ "gate_up_proj",
31
+ "qkv_proj"
32
  ],
33
  "target_parameters": null,
34
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aac5d4c268fd60de4d378348cf3e9ca1c039ca84f40530812587b2043b40a1aa
3
- size 12591456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b5a945595c8d2c04f78865b6e9ca7cbe932e031eaaa17e90d5619a3237d565a
3
+ size 184584072
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d27bf952925b6e14ec92a0a31758494613e50dd289b4496b49db0c015a98dae7
3
- size 15524645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37b10016a39382ff2d24acc20a291ed83243a26c4549ab01f6240e72c6291d56
3
+ size 15524472
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81e11fdc026269ad9e7c955bf1192f3856b85a20528efff7bbbf03f4fc71752b
3
- size 7121
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60a0cf0420a6ce27c1428d63743609bedfb1d82d0921253d7efab8cd2f233083
3
+ size 7185