update model card README.md
Browse files
README.md
CHANGED
|
@@ -156,23 +156,8 @@ The following hyperparameters were used during training:
|
|
| 156 |
'top_k': 0,
|
| 157 |
'top_p': 0.9},
|
| 158 |
'name': 'unconditional',
|
| 159 |
-
'num_samples':
|
| 160 |
-
'prefix': '<|aligned|>'},
|
| 161 |
-
{'generate_kwargs': {'bad_words_ids': [[50257],
|
| 162 |
-
[50258],
|
| 163 |
-
[50259],
|
| 164 |
-
[50260]],
|
| 165 |
-
'do_sample': True,
|
| 166 |
-
'max_length': 128,
|
| 167 |
-
'min_length': 10,
|
| 168 |
-
'temperature': 0.7,
|
| 169 |
-
'top_k': 0,
|
| 170 |
-
'top_p': 0.9},
|
| 171 |
-
'name': 'challenging_rtp',
|
| 172 |
-
'num_samples': 2048,
|
| 173 |
-
'prefix': '<|aligned|>',
|
| 174 |
-
'prompt_before_control': True,
|
| 175 |
-
'prompts_path': 'resources/challenging_rtp.jsonl'}],
|
| 176 |
'scorer_config': {'device': 'cuda:0'}},
|
| 177 |
'kl_gpt3_callback': {'force_call_on': [22888],
|
| 178 |
'gpt3_kwargs': {'model_name': 'davinci'},
|
|
@@ -212,4 +197,4 @@ The following hyperparameters were used during training:
|
|
| 212 |
'weight_decay': 0.1}}
|
| 213 |
|
| 214 |
# Wandb URL:
|
| 215 |
-
https://wandb.ai/kejian/uncategorized/runs/
|
|
|
|
| 156 |
'top_k': 0,
|
| 157 |
'top_p': 0.9},
|
| 158 |
'name': 'unconditional',
|
| 159 |
+
'num_samples': 512,
|
| 160 |
+
'prefix': '<|aligned|>'}],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 161 |
'scorer_config': {'device': 'cuda:0'}},
|
| 162 |
'kl_gpt3_callback': {'force_call_on': [22888],
|
| 163 |
'gpt3_kwargs': {'model_name': 'davinci'},
|
|
|
|
| 197 |
'weight_decay': 0.1}}
|
| 198 |
|
| 199 |
# Wandb URL:
|
| 200 |
+
https://wandb.ai/kejian/uncategorized/runs/1llp96zs
|