acezxn committed on
Commit
5f6f7c6
·
verified ·
1 Parent(s): b37e367

End of training

Browse files
README.md CHANGED
@@ -4,9 +4,9 @@ library_name: transformers
4
  model_name: SOC_Task_Generation_Base_GPT_OSS_20B
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
  - unsloth
9
  - sft
 
10
  licence: license
11
  ---
12
 
@@ -35,7 +35,7 @@ This model was trained with SFT.
35
 
36
  ### Framework versions
37
 
38
- - TRL: 0.26.1
39
  - Transformers: 4.57.3
40
  - Pytorch: 2.10.0a0+b558c986e8.nv25.11
41
  - Datasets: 4.3.0
 
4
  model_name: SOC_Task_Generation_Base_GPT_OSS_20B
5
  tags:
6
  - generated_from_trainer
 
7
  - unsloth
8
  - sft
9
+ - trl
10
  licence: license
11
  ---
12
 
 
35
 
36
  ### Framework versions
37
 
38
+ - TRL: 0.24.0
39
  - Transformers: 4.57.3
40
  - Pytorch: 2.10.0a0+b558c986e8.nv25.11
41
  - Datasets: 4.3.0
adapter_config.json CHANGED
@@ -20,7 +20,7 @@
20
  "layers_pattern": null,
21
  "layers_to_transform": null,
22
  "loftq_config": {},
23
- "lora_alpha": 32,
24
  "lora_bias": false,
25
  "lora_dropout": 0,
26
  "megatron_config": null,
@@ -29,17 +29,17 @@
29
  "peft_type": "LORA",
30
  "peft_version": "0.18.1",
31
  "qalora_group_size": 16,
32
- "r": 32,
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
 
36
  "o_proj",
37
- "v_proj",
38
- "k_proj",
39
  "up_proj",
40
- "q_proj",
 
41
  "down_proj",
42
- "gate_proj"
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
 
20
  "layers_pattern": null,
21
  "layers_to_transform": null,
22
  "loftq_config": {},
23
+ "lora_alpha": 16,
24
  "lora_bias": false,
25
  "lora_dropout": 0,
26
  "megatron_config": null,
 
29
  "peft_type": "LORA",
30
  "peft_version": "0.18.1",
31
  "qalora_group_size": 16,
32
+ "r": 8,
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
+ "q_proj",
37
  "o_proj",
 
 
38
  "up_proj",
39
+ "k_proj",
40
+ "gate_proj",
41
  "down_proj",
42
+ "v_proj"
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:659336bcc434d9000b6f4dcf035ab0c00b88d186417018ab88ac3edefe37b0e9
3
- size 31876384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5c2af0bcf565c4b98589edbb83095f17ba07792ff9ea4a81e417134ff2bb036
3
+ size 15950616
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1ea6d24dfe5e22310f5691b59c053f4dabd0cbe23837adf61f4ce00176fea3a
3
  size 6353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95df2588c348d024f51a2ca56681f4a4ff77da205285e10065b7c72dfd1454d9
3
  size 6353