kejian
/

cpsc-debug

English

Generated from Trainer

Model card | Files and versions

xet

Community

kejian committed on Feb 28, 2023

Commit

3709fef

1 Parent(s): 3a9f32b

update model card README.md

Browse files

Files changed (1) hide show

README.md +6 -45

README.md CHANGED Viewed

@@ -99,9 +99,9 @@ The following hyperparameters were used during training:
                                              'fine_prefix': '<|fine|>',
                                              'misaligned_prefix': '<|misaligned|>',
                                              'substandard_prefix': '<|substandard|>',
-                                             'threshold1': 0.00064215,
-                                             'threshold2': 0.00078331,
-                                             'threshold3': 0.00138205,
                                              'threshold4': 0.9992},
              'datasets': ['tomekkorbak/detoxify-pile-chunk3-0-50000',
                           'tomekkorbak/detoxify-pile-chunk3-50000-100000',
@@ -158,45 +158,6 @@ The following hyperparameters were used during training:
                                       'name': 'unconditional',
                                       'num_samples': 2560,
                                       'prefix': '<|aligned|>'},
-                                     {'generate_kwargs': {'bad_words_ids': [[50257],
-                                                                            [50258],
-                                                                            [50259],
-                                                                            [50260]],
-                                                          'do_sample': True,
-                                                          'max_length': 128,
-                                                          'min_length': 10,
-                                                          'temperature': 0.7,
-                                                          'top_k': 0,
-                                                          'top_p': 0.9},
-                                      'name': 'unconditional-fine',
-                                      'num_samples': 512,
-                                      'prefix': '<|fine|>'},
-                                     {'generate_kwargs': {'bad_words_ids': [[50257],
-                                                                            [50258],
-                                                                            [50259],
-                                                                            [50260]],
-                                                          'do_sample': True,
-                                                          'max_length': 128,
-                                                          'min_length': 10,
-                                                          'temperature': 0.7,
-                                                          'top_k': 0,
-                                                          'top_p': 0.9},
-                                      'name': 'unconditional-substandard',
-                                      'num_samples': 512,
-                                      'prefix': '<|substandard|>'},
-                                     {'generate_kwargs': {'bad_words_ids': [[50257],
-                                                                            [50258],
-                                                                            [50259],
-                                                                            [50260]],
-                                                          'do_sample': True,
-                                                          'max_length': 128,
-                                                          'min_length': 10,
-                                                          'temperature': 0.7,
-                                                          'top_k': 0,
-                                                          'top_p': 0.9},
-                                      'name': 'unconditional-misaligned',
-                                      'num_samples': 512,
-                                      'prefix': '<|misaligned|>'},
                                      {'generate_kwargs': {'bad_words_ids': [[50257],
                                                                             [50258],
                                                                             [50259],
@@ -216,7 +177,7 @@ The following hyperparameters were used during training:
  'kl_gpt3_callback': {'force_call_on': [21362],
                       'gpt3_kwargs': {'model_name': 'davinci'},
                       'max_tokens': 64,
-                      'num_samples': 1024,
                       'prefix': '<|aligned|>',
                       'should_insert_prefix': True},
  'model': {'from_scratch': True,
@@ -240,7 +201,7 @@ The following hyperparameters were used during training:
               'logging_first_step': True,
               'logging_steps': 500,
               'num_tokens': 2800000000.0,
-              'output_dir': 'training_output_3',
               'per_device_train_batch_size': 8,
               'push_to_hub': True,
               'remove_unused_columns': False,
@@ -251,4 +212,4 @@ The following hyperparameters were used during training:
               'weight_decay': 0.1}}
 # Wandb URL:
-https://wandb.ai/kejian/uncategorized/runs/1pc0ev96

                                              'fine_prefix': '<|fine|>',
                                              'misaligned_prefix': '<|misaligned|>',
                                              'substandard_prefix': '<|substandard|>',
+                                             'threshold1': 0.0006038,
+                                             'threshold2': 0.0006638,
+                                             'threshold3': 0.00089704,
                                              'threshold4': 0.9992},
              'datasets': ['tomekkorbak/detoxify-pile-chunk3-0-50000',
                           'tomekkorbak/detoxify-pile-chunk3-50000-100000',
                                       'name': 'unconditional',
                                       'num_samples': 2560,
                                       'prefix': '<|aligned|>'},
                                      {'generate_kwargs': {'bad_words_ids': [[50257],
                                                                             [50258],
                                                                             [50259],
  'kl_gpt3_callback': {'force_call_on': [21362],
                       'gpt3_kwargs': {'model_name': 'davinci'},
                       'max_tokens': 64,
+                      'num_samples': 2048,
                       'prefix': '<|aligned|>',
                       'should_insert_prefix': True},
  'model': {'from_scratch': True,
               'logging_first_step': True,
               'logging_steps': 500,
               'num_tokens': 2800000000.0,
+              'output_dir': 'training_output_2',
               'per_device_train_batch_size': 8,
               'push_to_hub': True,
               'remove_unused_columns': False,
               'weight_decay': 0.1}}
 # Wandb URL:
+https://wandb.ai/kejian/uncategorized/runs/3m4axm31