Upload ray_tune_logs/params.json with huggingface_hub
Browse files- ray_tune_logs/params.json +14 -21
ray_tune_logs/params.json
CHANGED
|
@@ -25,8 +25,8 @@
|
|
| 25 |
"group_relative_norm": false,
|
| 26 |
"inference_config": {
|
| 27 |
"do_sample": true,
|
| 28 |
-
"max_new_tokens":
|
| 29 |
-
"min_new_tokens":
|
| 30 |
"temperature": 0.0
|
| 31 |
},
|
| 32 |
"keep_eval_size": false,
|
|
@@ -63,27 +63,27 @@
|
|
| 63 |
"rl_algo": "off_policy",
|
| 64 |
"rl_w": 1.0,
|
| 65 |
"rollout_config": {
|
| 66 |
-
"accuracy_w":
|
| 67 |
-
"accuracy_w2":
|
| 68 |
"len_pen": 1.0,
|
| 69 |
"len_pen2": 1.0,
|
| 70 |
-
"max_ctx_len":
|
| 71 |
"sampling_params_1": {
|
| 72 |
"logprobs": 5,
|
| 73 |
-
"max_tokens":
|
| 74 |
-
"min_tokens":
|
| 75 |
"n": 1,
|
| 76 |
"temperature": 1.0
|
| 77 |
},
|
| 78 |
"sampling_params_2": {
|
| 79 |
"logprobs": 5,
|
| 80 |
-
"max_tokens":
|
| 81 |
-
"min_tokens":
|
| 82 |
"n": 4,
|
| 83 |
"temperature": 1.0
|
| 84 |
},
|
| 85 |
"similarity_fn": "rouge",
|
| 86 |
-
"threshold": 0.
|
| 87 |
},
|
| 88 |
"rollout_game": "baseline3v2",
|
| 89 |
"sample_config": {
|
|
@@ -99,23 +99,16 @@
|
|
| 99 |
"text_template": "{text}\nTL;DR: {summary}",
|
| 100 |
"tokenizer_name": null,
|
| 101 |
"train_from_raw": true,
|
| 102 |
-
"train_split_name": "
|
| 103 |
"trunc_eval": 256,
|
| 104 |
"trunc_evals": [
|
| 105 |
-
"
|
| 106 |
-
"samsum___12",
|
| 107 |
-
"xsum___12",
|
| 108 |
-
"gigaword___200",
|
| 109 |
-
"duc___50"
|
| 110 |
],
|
| 111 |
"trust_remote_code": true,
|
| 112 |
"tune_metrics": [
|
| 113 |
"cnndm/rouge1___1.0",
|
| 114 |
-
"cnndm/
|
| 115 |
-
"
|
| 116 |
-
"samsum/bertscore_f1___0.25",
|
| 117 |
-
"xsum/rouge1___1.0",
|
| 118 |
-
"xsum/bertscore_f1___0.25"
|
| 119 |
],
|
| 120 |
"use_deepspeed": false,
|
| 121 |
"use_slow_tokenizer": false,
|
|
|
|
| 25 |
"group_relative_norm": false,
|
| 26 |
"inference_config": {
|
| 27 |
"do_sample": true,
|
| 28 |
+
"max_new_tokens": 135,
|
| 29 |
+
"min_new_tokens": 32,
|
| 30 |
"temperature": 0.0
|
| 31 |
},
|
| 32 |
"keep_eval_size": false,
|
|
|
|
| 63 |
"rl_algo": "off_policy",
|
| 64 |
"rl_w": 1.0,
|
| 65 |
"rollout_config": {
|
| 66 |
+
"accuracy_w": 1.96282248134428,
|
| 67 |
+
"accuracy_w2": 19.549524484259873,
|
| 68 |
"len_pen": 1.0,
|
| 69 |
"len_pen2": 1.0,
|
| 70 |
+
"max_ctx_len": 860,
|
| 71 |
"sampling_params_1": {
|
| 72 |
"logprobs": 5,
|
| 73 |
+
"max_tokens": 135,
|
| 74 |
+
"min_tokens": 32,
|
| 75 |
"n": 1,
|
| 76 |
"temperature": 1.0
|
| 77 |
},
|
| 78 |
"sampling_params_2": {
|
| 79 |
"logprobs": 5,
|
| 80 |
+
"max_tokens": 860,
|
| 81 |
+
"min_tokens": 5,
|
| 82 |
"n": 4,
|
| 83 |
"temperature": 1.0
|
| 84 |
},
|
| 85 |
"similarity_fn": "rouge",
|
| 86 |
+
"threshold": 0.01605191133358762
|
| 87 |
},
|
| 88 |
"rollout_game": "baseline3v2",
|
| 89 |
"sample_config": {
|
|
|
|
| 99 |
"text_template": "{text}\nTL;DR: {summary}",
|
| 100 |
"tokenizer_name": null,
|
| 101 |
"train_from_raw": true,
|
| 102 |
+
"train_split_name": "sim_with_one_golden__cnndm_train",
|
| 103 |
"trunc_eval": 256,
|
| 104 |
"trunc_evals": [
|
| 105 |
+
"cnndm___10"
|
|
|
|
|
|
|
|
|
|
|
|
|
| 106 |
],
|
| 107 |
"trust_remote_code": true,
|
| 108 |
"tune_metrics": [
|
| 109 |
"cnndm/rouge1___1.0",
|
| 110 |
+
"cnndm/rouge2___2.0",
|
| 111 |
+
"cnndm/bertscore_f1___0.25"
|
|
|
|
|
|
|
|
|
|
| 112 |
],
|
| 113 |
"use_deepspeed": false,
|
| 114 |
"use_slow_tokenizer": false,
|