update model card README.md
Browse files
README.md
CHANGED
|
@@ -99,10 +99,10 @@ The following hyperparameters were used during training:
|
|
| 99 |
'fine_prefix': '<|fine|>',
|
| 100 |
'misaligned_prefix': '<|misaligned|>',
|
| 101 |
'substandard_prefix': '<|substandard|>',
|
| 102 |
-
'threshold1': 0.
|
| 103 |
-
'threshold2': 0.
|
| 104 |
-
'threshold3': 0.
|
| 105 |
-
'threshold4': 0.
|
| 106 |
'datasets': ['tomekkorbak/detoxify-pile-chunk3-0-50000',
|
| 107 |
'tomekkorbak/detoxify-pile-chunk3-50000-100000',
|
| 108 |
'tomekkorbak/detoxify-pile-chunk3-100000-150000',
|
|
@@ -143,7 +143,7 @@ The following hyperparameters were used during training:
|
|
| 143 |
'tomekkorbak/detoxify-pile-chunk3-1850000-1900000',
|
| 144 |
'tomekkorbak/detoxify-pile-chunk3-1900000-1950000'],
|
| 145 |
'is_split_by_sentences': True},
|
| 146 |
-
'generation': {'force_call_on': [
|
| 147 |
'metrics_configs': [{}, {'n': 1}, {'n': 2}, {'n': 5}],
|
| 148 |
'scenario_configs': [{'generate_kwargs': {'bad_words_ids': [[50257],
|
| 149 |
[50258],
|
|
@@ -174,7 +174,7 @@ The following hyperparameters were used during training:
|
|
| 174 |
'prompt_before_control': True,
|
| 175 |
'prompts_path': 'resources/challenging_rtp.jsonl'}],
|
| 176 |
'scorer_config': {'device': 'cuda:0'}},
|
| 177 |
-
'kl_gpt3_callback': {'force_call_on': [
|
| 178 |
'gpt3_kwargs': {'model_name': 'davinci'},
|
| 179 |
'max_tokens': 64,
|
| 180 |
'num_samples': 4096,
|
|
@@ -212,4 +212,4 @@ The following hyperparameters were used during training:
|
|
| 212 |
'weight_decay': 0.1}}
|
| 213 |
|
| 214 |
# Wandb URL:
|
| 215 |
-
https://wandb.ai/kejian/uncategorized/runs/
|
|
|
|
| 99 |
'fine_prefix': '<|fine|>',
|
| 100 |
'misaligned_prefix': '<|misaligned|>',
|
| 101 |
'substandard_prefix': '<|substandard|>',
|
| 102 |
+
'threshold1': 0.00064215,
|
| 103 |
+
'threshold2': 0.00078331,
|
| 104 |
+
'threshold3': 0.00138205,
|
| 105 |
+
'threshold4': 0.9992},
|
| 106 |
'datasets': ['tomekkorbak/detoxify-pile-chunk3-0-50000',
|
| 107 |
'tomekkorbak/detoxify-pile-chunk3-50000-100000',
|
| 108 |
'tomekkorbak/detoxify-pile-chunk3-100000-150000',
|
|
|
|
| 143 |
'tomekkorbak/detoxify-pile-chunk3-1850000-1900000',
|
| 144 |
'tomekkorbak/detoxify-pile-chunk3-1900000-1950000'],
|
| 145 |
'is_split_by_sentences': True},
|
| 146 |
+
'generation': {'force_call_on': [22888],
|
| 147 |
'metrics_configs': [{}, {'n': 1}, {'n': 2}, {'n': 5}],
|
| 148 |
'scenario_configs': [{'generate_kwargs': {'bad_words_ids': [[50257],
|
| 149 |
[50258],
|
|
|
|
| 174 |
'prompt_before_control': True,
|
| 175 |
'prompts_path': 'resources/challenging_rtp.jsonl'}],
|
| 176 |
'scorer_config': {'device': 'cuda:0'}},
|
| 177 |
+
'kl_gpt3_callback': {'force_call_on': [22888],
|
| 178 |
'gpt3_kwargs': {'model_name': 'davinci'},
|
| 179 |
'max_tokens': 64,
|
| 180 |
'num_samples': 4096,
|
|
|
|
| 212 |
'weight_decay': 0.1}}
|
| 213 |
|
| 214 |
# Wandb URL:
|
| 215 |
+
https://wandb.ai/kejian/uncategorized/runs/20zd4b2c
|