skar0 committed on
Commit
fc08669
·
verified ·
1 Parent(s): 3e85fec

Upload trained reward model

Browse files
reference/adapter_config.json CHANGED
@@ -25,12 +25,12 @@
25
  "revision": null,
26
  "target_modules": [
27
  "gate_proj",
28
- "o_proj",
29
- "up_proj",
30
  "k_proj",
31
- "v_proj",
 
32
  "q_proj",
33
- "down_proj"
 
34
  ],
35
  "task_type": "CAUSAL_LM",
36
  "trainable_token_indices": null,
 
25
  "revision": null,
26
  "target_modules": [
27
  "gate_proj",
 
 
28
  "k_proj",
29
+ "down_proj",
30
+ "o_proj",
31
  "q_proj",
32
+ "v_proj",
33
+ "up_proj"
34
  ],
35
  "task_type": "CAUSAL_LM",
36
  "trainable_token_indices": null,
reward/adapter_config.json CHANGED
@@ -28,11 +28,11 @@
28
  "revision": null,
29
  "target_modules": [
30
  "gate_proj",
31
- "o_proj",
32
  "k_proj",
33
  "down_proj",
34
- "v_proj",
35
  "q_proj",
 
36
  "up_proj"
37
  ],
38
  "task_type": "SEQ_CLS",
 
28
  "revision": null,
29
  "target_modules": [
30
  "gate_proj",
 
31
  "k_proj",
32
  "down_proj",
33
+ "o_proj",
34
  "q_proj",
35
+ "v_proj",
36
  "up_proj"
37
  ],
38
  "task_type": "SEQ_CLS",
reward/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40913392efe9fa98f604c13926068499518ba8e6cdef5d2fa95d0b78ccf54c2f
3
  size 323018720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d1d0b3e5c08883117b481cfef43073ab7112e5c17543d375b70090a41cc4bca
3
  size 323018720
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d47e2eb397104ed176cc05078c98144471ea3a203dc595058ebc55878660f2d
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0a0f29b308507da95e2765eee680cc9fb31429b3f8969f1334d70b21265b765
3
  size 5496