Upload ray_tune_logs/params.json with huggingface_hub
Browse files
ray_tune_logs/params.json
CHANGED
|
@@ -60,11 +60,11 @@
|
|
| 60 |
"push_to_hub": null,
|
| 61 |
"ref_role1_name_or_path": "gpt2",
|
| 62 |
"ref_role2_name_or_path": "gpt2",
|
| 63 |
-
"rl_algo": "
|
| 64 |
"rl_w": 1.0,
|
| 65 |
"rollout_config": {
|
| 66 |
-
"accuracy_w":
|
| 67 |
-
"accuracy_w2": 2.
|
| 68 |
"len_pen": 1.0,
|
| 69 |
"len_pen2": 1.0,
|
| 70 |
"max_ctx_len": 1000,
|
|
@@ -83,7 +83,7 @@
|
|
| 83 |
"temperature": 1.0
|
| 84 |
},
|
| 85 |
"similarity_fn": "rouge",
|
| 86 |
-
"threshold": 0.
|
| 87 |
},
|
| 88 |
"rollout_game": "baseline3v2",
|
| 89 |
"sample_config": {
|
|
|
|
| 60 |
"push_to_hub": null,
|
| 61 |
"ref_role1_name_or_path": "gpt2",
|
| 62 |
"ref_role2_name_or_path": "gpt2",
|
| 63 |
+
"rl_algo": "off_policy",
|
| 64 |
"rl_w": 1.0,
|
| 65 |
"rollout_config": {
|
| 66 |
+
"accuracy_w": 1.490628836610164,
|
| 67 |
+
"accuracy_w2": 2.5601615250028704,
|
| 68 |
"len_pen": 1.0,
|
| 69 |
"len_pen2": 1.0,
|
| 70 |
"max_ctx_len": 1000,
|
|
|
|
| 83 |
"temperature": 1.0
|
| 84 |
},
|
| 85 |
"similarity_fn": "rouge",
|
| 86 |
+
"threshold": 0.07098936257405905
|
| 87 |
},
|
| 88 |
"rollout_game": "baseline3v2",
|
| 89 |
"sample_config": {
|