End of training

Files changed (4) hide show

README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-base_model: eth-dl-rewards/internlm2-7b-reward-code-active-merged
 library_name: transformers
 model_name: internlm2-7b-reward-code-active
 tags:
@@ -11,7 +11,7 @@ licence: license
 # Model Card for internlm2-7b-reward-code-active
-This model is a fine-tuned version of [eth-dl-rewards/internlm2-7b-reward-code-active-merged](https://huggingface.co/eth-dl-rewards/internlm2-7b-reward-code-active-merged).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
@@ -27,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/eth-dl-rewards/train-rm/runs/l4y28zpk)
 This model was trained with Reward.

 ---
+base_model: internlm/internlm2-7b-reward
 library_name: transformers
 model_name: internlm2-7b-reward-code-active
 tags:
 # Model Card for internlm2-7b-reward-code-active
+This model is a fine-tuned version of [internlm/internlm2-7b-reward](https://huggingface.co/internlm/internlm2-7b-reward).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/eth-dl-rewards/train-rm/runs/s0329pid)
 This model was trained with Reward.

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "eth-dl-rewards/internlm2-7b-reward-code-active-merged",
   "bias": "none",
   "eva_config": null,
   "exclude_modules": null,
@@ -26,11 +26,11 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "wqkv",
     "wo",
-    "w1",
     "w3",
-    "w2"
   ],
   "task_type": "SEQ_CLS",
   "use_dora": false,

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "internlm/internlm2-7b-reward",
   "bias": "none",
   "eva_config": null,
   "exclude_modules": null,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "wo",
     "w3",
+    "w2",
+    "wqkv",
+    "w1"
   ],
   "task_type": "SEQ_CLS",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee7aa43d9dd73868f07fc90a2606372898d790738837fab88a84e69d978f4267
 size 151038080

 version https://git-lfs.github.com/spec/v1
+oid sha256:67bf9cd645761737dc7ce15a08e7d6ec7e917b8f07353b7c688924107988f861
 size 151038080

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e432ddbd2e5474ba9f85856fa61b6158778eaefe509e8bed672444141535e46e
 size 6648

 version https://git-lfs.github.com/spec/v1
+oid sha256:2d7dd76e6352adb2a6fc3e1e8ae0a2397e3cb2134531a1f8dca93e55c6df12d6
 size 6648