NetherQuartz committed on
Commit
10778a0
·
verified ·
1 Parent(s): 5fb8498

Try lr 13e-5

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: ilo-toki-gemmax2-28-2b
5
  tags:
6
  - generated_from_trainer
7
- - sft
8
  - trl
 
9
  licence: license
10
  ---
11
 
 
4
  model_name: ilo-toki-gemmax2-28-2b
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - sft
9
  licence: license
10
  ---
11
 
adapter_config.json CHANGED
@@ -25,13 +25,13 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
28
  "down_proj",
29
- "gate_proj",
30
- "o_proj",
31
- "k_proj",
32
  "q_proj",
 
 
33
  "v_proj",
34
- "up_proj"
35
  ],
36
  "target_parameters": null,
37
  "task_type": "CAUSAL_LM",
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
+ "up_proj",
29
  "down_proj",
 
 
 
30
  "q_proj",
31
+ "k_proj",
32
+ "gate_proj",
33
  "v_proj",
34
+ "o_proj"
35
  ],
36
  "target_parameters": null,
37
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e41df19783ffeabb30d0d862f5429135a6175176caa48946c94ed3fc67f76cd7
3
  size 41581360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84fcad9ea0c8652d4bc9523f93d5d5b1e1ff67cf81ff7384cedfbdd5f436e689
3
  size 41581360
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2454c5ff0108dc47ce21c6eb9c9bdf16b4cbbc2a7f1e60c21064ab600efef47
3
  size 6161
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd8cd14f9e60a4336c9af3fd57767c07145338d922cc9bb4dd9544bc3f2c1789
3
  size 6161