NetherQuartz committed on
Commit
ef7c744
·
verified ·
1 Parent(s): e5ff766

Retrain with lr 3e-4

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: ilo-toki-gemma-2-2b-it
5
  tags:
6
  - generated_from_trainer
7
- - sft
8
  - trl
 
9
  licence: license
10
  ---
11
 
 
4
  model_name: ilo-toki-gemma-2-2b-it
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - sft
9
  licence: license
10
  ---
11
 
adapter_config.json CHANGED
@@ -25,13 +25,13 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "k_proj",
29
- "o_proj",
30
- "v_proj",
31
  "gate_proj",
32
  "q_proj",
 
 
33
  "down_proj",
34
- "up_proj"
 
35
  ],
36
  "target_parameters": null,
37
  "task_type": "CAUSAL_LM",
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
 
 
28
  "gate_proj",
29
  "q_proj",
30
+ "up_proj",
31
+ "o_proj",
32
  "down_proj",
33
+ "v_proj",
34
+ "k_proj"
35
  ],
36
  "target_parameters": null,
37
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d057febad91490c181084f34f3c4b1594b1baef546762cb6999e39ec4a36d006
3
  size 41581360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24f42fc75588ee10a0f12ca10d637b613de164e1bf429032efe71810e89d7a9d
3
  size 41581360
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0e1f98f7813700b0fe42434f14b69aba50b71ca18aa9cbfed289d6df7b777c4
3
  size 6161
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acdd1bbfef85b2cc7b2c5d1d869a4f78212ece60836b6424acab7c5fe0067a66
3
  size 6161