nbtpj committed on
Commit
4c6deb2
·
verified ·
1 Parent(s): e748ac7

Upload ray_tune_logs/params.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. ray_tune_logs/params.json +14 -21
ray_tune_logs/params.json CHANGED
@@ -25,8 +25,8 @@
25
  "group_relative_norm": false,
26
  "inference_config": {
27
  "do_sample": true,
28
- "max_new_tokens": 250,
29
- "min_new_tokens": 5,
30
  "temperature": 0.0
31
  },
32
  "keep_eval_size": false,
@@ -63,27 +63,27 @@
63
  "rl_algo": "off_policy",
64
  "rl_w": 1.0,
65
  "rollout_config": {
66
- "accuracy_w": 0.4222048983149828,
67
- "accuracy_w2": 224.2012371372442,
68
  "len_pen": 1.0,
69
  "len_pen2": 1.0,
70
- "max_ctx_len": 1000,
71
  "sampling_params_1": {
72
  "logprobs": 5,
73
- "max_tokens": 56,
74
- "min_tokens": 8,
75
  "n": 1,
76
  "temperature": 1.0
77
  },
78
  "sampling_params_2": {
79
  "logprobs": 5,
80
- "max_tokens": 512,
81
- "min_tokens": 20,
82
  "n": 4,
83
  "temperature": 1.0
84
  },
85
  "similarity_fn": "rouge",
86
- "threshold": 0.08459126528049378
87
  },
88
  "rollout_game": "baseline3v2",
89
  "sample_config": {
@@ -99,23 +99,16 @@
99
  "text_template": "{text}\nTL;DR: {summary}",
100
  "tokenizer_name": null,
101
  "train_from_raw": true,
102
- "train_split_name": "merge36_cnndmsamsumxsum",
103
  "trunc_eval": 256,
104
  "trunc_evals": [
105
- "cnndm___12",
106
- "samsum___12",
107
- "xsum___12",
108
- "gigaword___200",
109
- "duc___50"
110
  ],
111
  "trust_remote_code": true,
112
  "tune_metrics": [
113
  "cnndm/rouge1___1.0",
114
- "cnndm/bertscore_f1___0.25",
115
- "samsum/rouge1___1.0",
116
- "samsum/bertscore_f1___0.25",
117
- "xsum/rouge1___1.0",
118
- "xsum/bertscore_f1___0.25"
119
  ],
120
  "use_deepspeed": false,
121
  "use_slow_tokenizer": false,
 
25
  "group_relative_norm": false,
26
  "inference_config": {
27
  "do_sample": true,
28
+ "max_new_tokens": 135,
29
+ "min_new_tokens": 32,
30
  "temperature": 0.0
31
  },
32
  "keep_eval_size": false,
 
63
  "rl_algo": "off_policy",
64
  "rl_w": 1.0,
65
  "rollout_config": {
66
+ "accuracy_w": 1.96282248134428,
67
+ "accuracy_w2": 19.549524484259873,
68
  "len_pen": 1.0,
69
  "len_pen2": 1.0,
70
+ "max_ctx_len": 860,
71
  "sampling_params_1": {
72
  "logprobs": 5,
73
+ "max_tokens": 135,
74
+ "min_tokens": 32,
75
  "n": 1,
76
  "temperature": 1.0
77
  },
78
  "sampling_params_2": {
79
  "logprobs": 5,
80
+ "max_tokens": 860,
81
+ "min_tokens": 5,
82
  "n": 4,
83
  "temperature": 1.0
84
  },
85
  "similarity_fn": "rouge",
86
+ "threshold": 0.01605191133358762
87
  },
88
  "rollout_game": "baseline3v2",
89
  "sample_config": {
 
99
  "text_template": "{text}\nTL;DR: {summary}",
100
  "tokenizer_name": null,
101
  "train_from_raw": true,
102
+ "train_split_name": "sim_with_one_golden__cnndm_train",
103
  "trunc_eval": 256,
104
  "trunc_evals": [
105
+ "cnndm___10"
 
 
 
 
106
  ],
107
  "trust_remote_code": true,
108
  "tune_metrics": [
109
  "cnndm/rouge1___1.0",
110
+ "cnndm/rouge2___2.0",
111
+ "cnndm/bertscore_f1___0.25"
 
 
 
112
  ],
113
  "use_deepspeed": false,
114
  "use_slow_tokenizer": false,