s3766882 committed on
Commit ·
b09b21e
1
Parent(s): 21aaa3a
update models
Browse files
- config.json +2 -86
- model_args.json +1 -1
- pytorch_model.bin +2 -2
- training_args.bin +1 -1
config.json
CHANGED
|
@@ -94,49 +94,7 @@
|
|
| 94 |
"80": "LABEL_80",
|
| 95 |
"81": "LABEL_81",
|
| 96 |
"82": "LABEL_82",
|
| 97 |
-
"83": "LABEL_83",
|
| 98 |
-
"84": "LABEL_84",
|
| 99 |
-
"85": "LABEL_85",
|
| 100 |
-
"86": "LABEL_86",
|
| 101 |
-
"87": "LABEL_87",
|
| 102 |
-
"88": "LABEL_88",
|
| 103 |
-
"89": "LABEL_89",
|
| 104 |
-
"90": "LABEL_90",
|
| 105 |
-
"91": "LABEL_91",
|
| 106 |
-
"92": "LABEL_92",
|
| 107 |
-
"93": "LABEL_93",
|
| 108 |
-
"94": "LABEL_94",
|
| 109 |
-
"95": "LABEL_95",
|
| 110 |
-
"96": "LABEL_96",
|
| 111 |
-
"97": "LABEL_97",
|
| 112 |
-
"98": "LABEL_98",
|
| 113 |
-
"99": "LABEL_99",
|
| 114 |
-
"100": "LABEL_100",
|
| 115 |
-
"101": "LABEL_101",
|
| 116 |
-
"102": "LABEL_102",
|
| 117 |
-
"103": "LABEL_103",
|
| 118 |
-
"104": "LABEL_104",
|
| 119 |
-
"105": "LABEL_105",
|
| 120 |
-
"106": "LABEL_106",
|
| 121 |
-
"107": "LABEL_107",
|
| 122 |
-
"108": "LABEL_108",
|
| 123 |
-
"109": "LABEL_109",
|
| 124 |
-
"110": "LABEL_110",
|
| 125 |
-
"111": "LABEL_111",
|
| 126 |
-
"112": "LABEL_112",
|
| 127 |
-
"113": "LABEL_113",
|
| 128 |
-
"114": "LABEL_114",
|
| 129 |
-
"115": "LABEL_115",
|
| 130 |
-
"116": "LABEL_116",
|
| 131 |
-
"117": "LABEL_117",
|
| 132 |
-
"118": "LABEL_118",
|
| 133 |
-
"119": "LABEL_119",
|
| 134 |
-
"120": "LABEL_120",
|
| 135 |
-
"121": "LABEL_121",
|
| 136 |
-
"122": "LABEL_122",
|
| 137 |
-
"123": "LABEL_123",
|
| 138 |
-
"124": "LABEL_124",
|
| 139 |
-
"125": "LABEL_125"
|
| 140 |
},
|
| 141 |
"initializer_range": 0.02,
|
| 142 |
"intermediate_size": 3072,
|
|
@@ -144,34 +102,8 @@
|
|
| 144 |
"LABEL_0": 0,
|
| 145 |
"LABEL_1": 1,
|
| 146 |
"LABEL_10": 10,
|
| 147 |
-
"LABEL_100": 100,
|
| 148 |
-
"LABEL_101": 101,
|
| 149 |
-
"LABEL_102": 102,
|
| 150 |
-
"LABEL_103": 103,
|
| 151 |
-
"LABEL_104": 104,
|
| 152 |
-
"LABEL_105": 105,
|
| 153 |
-
"LABEL_106": 106,
|
| 154 |
-
"LABEL_107": 107,
|
| 155 |
-
"LABEL_108": 108,
|
| 156 |
-
"LABEL_109": 109,
|
| 157 |
"LABEL_11": 11,
|
| 158 |
-
"LABEL_110": 110,
|
| 159 |
-
"LABEL_111": 111,
|
| 160 |
-
"LABEL_112": 112,
|
| 161 |
-
"LABEL_113": 113,
|
| 162 |
-
"LABEL_114": 114,
|
| 163 |
-
"LABEL_115": 115,
|
| 164 |
-
"LABEL_116": 116,
|
| 165 |
-
"LABEL_117": 117,
|
| 166 |
-
"LABEL_118": 118,
|
| 167 |
-
"LABEL_119": 119,
|
| 168 |
"LABEL_12": 12,
|
| 169 |
-
"LABEL_120": 120,
|
| 170 |
-
"LABEL_121": 121,
|
| 171 |
-
"LABEL_122": 122,
|
| 172 |
-
"LABEL_123": 123,
|
| 173 |
-
"LABEL_124": 124,
|
| 174 |
-
"LABEL_125": 125,
|
| 175 |
"LABEL_13": 13,
|
| 176 |
"LABEL_14": 14,
|
| 177 |
"LABEL_15": 15,
|
|
@@ -250,23 +182,7 @@
|
|
| 250 |
"LABEL_81": 81,
|
| 251 |
"LABEL_82": 82,
|
| 252 |
"LABEL_83": 83,
|
| 253 |
-
"LABEL_84": 84,
|
| 254 |
-
"LABEL_85": 85,
|
| 255 |
-
"LABEL_86": 86,
|
| 256 |
-
"LABEL_87": 87,
|
| 257 |
-
"LABEL_88": 88,
|
| 258 |
-
"LABEL_89": 89,
|
| 259 |
-
"LABEL_9": 9,
|
| 260 |
-
"LABEL_90": 90,
|
| 261 |
-
"LABEL_91": 91,
|
| 262 |
-
"LABEL_92": 92,
|
| 263 |
-
"LABEL_93": 93,
|
| 264 |
-
"LABEL_94": 94,
|
| 265 |
-
"LABEL_95": 95,
|
| 266 |
-
"LABEL_96": 96,
|
| 267 |
-
"LABEL_97": 97,
|
| 268 |
-
"LABEL_98": 98,
|
| 269 |
-
"LABEL_99": 99
|
| 270 |
},
|
| 271 |
"layer_norm_eps": 1e-05,
|
| 272 |
"max_position_embeddings": 514,
|
|
|
|
| 94 |
"80": "LABEL_80",
|
| 95 |
"81": "LABEL_81",
|
| 96 |
"82": "LABEL_82",
|
| 97 |
+
"83": "LABEL_83"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 98 |
},
|
| 99 |
"initializer_range": 0.02,
|
| 100 |
"intermediate_size": 3072,
|
|
|
|
| 102 |
"LABEL_0": 0,
|
| 103 |
"LABEL_1": 1,
|
| 104 |
"LABEL_10": 10,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 105 |
"LABEL_11": 11,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 106 |
"LABEL_12": 12,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 107 |
"LABEL_13": 13,
|
| 108 |
"LABEL_14": 14,
|
| 109 |
"LABEL_15": 15,
|
|
|
|
| 182 |
"LABEL_81": 81,
|
| 183 |
"LABEL_82": 82,
|
| 184 |
"LABEL_83": 83,
|
| 185 |
+
"LABEL_9": 9
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 186 |
},
|
| 187 |
"layer_norm_eps": 1e-05,
|
| 188 |
"max_position_embeddings": 514,
|
model_args.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"adafactor_beta1": null, "adafactor_clip_threshold": 1.0, "adafactor_decay_rate": -0.8, "adafactor_eps": [1e-30, 0.001], "adafactor_relative_step": true, "adafactor_scale_parameter": true, "adafactor_warmup_init": true, "adam_epsilon": 1e-08, "best_model_dir": "outputs/best_model", "cache_dir": "cache_dir/", "config": {}, "cosine_schedule_num_cycles": 0.5, "custom_layer_parameters": [], "custom_parameter_groups": [], "dataloader_num_workers": 0, "do_lower_case": false, "dynamic_quantize": false, "early_stopping_consider_epochs": false, "early_stopping_delta": 0, "early_stopping_metric": "eval_loss", "early_stopping_metric_minimize": true, "early_stopping_patience": 3, "encoding": null, "eval_batch_size": 8, "evaluate_during_training": false, "evaluate_during_training_silent": true, "evaluate_during_training_steps": 2000, "evaluate_during_training_verbose": false, "evaluate_each_epoch": true, "fp16":
|
|
|
|
| 1 |
+
{"adafactor_beta1": null, "adafactor_clip_threshold": 1.0, "adafactor_decay_rate": -0.8, "adafactor_eps": [1e-30, 0.001], "adafactor_relative_step": true, "adafactor_scale_parameter": true, "adafactor_warmup_init": true, "adam_epsilon": 1e-08, "best_model_dir": "outputs/best_model", "cache_dir": "cache_dir/", "config": {}, "cosine_schedule_num_cycles": 0.5, "custom_layer_parameters": [], "custom_parameter_groups": [], "dataloader_num_workers": 0, "do_lower_case": false, "dynamic_quantize": false, "early_stopping_consider_epochs": false, "early_stopping_delta": 0, "early_stopping_metric": "eval_loss", "early_stopping_metric_minimize": true, "early_stopping_patience": 3, "encoding": null, "eval_batch_size": 8, "evaluate_during_training": false, "evaluate_during_training_silent": true, "evaluate_during_training_steps": 2000, "evaluate_during_training_verbose": false, "evaluate_each_epoch": true, "fp16": true, "gradient_accumulation_steps": 1, "learning_rate": 1e-05, "local_rank": -1, "logging_steps": 50, "loss_type": null, "loss_args": {}, "manual_seed": null, "max_grad_norm": 1.0, "max_seq_length": 128, "model_name": "roberta-base", "model_type": "roberta", "multiprocessing_chunksize": -1, "n_gpu": 1, "no_cache": false, "no_save": false, "not_saved_args": [], "num_train_epochs": 6, "optimizer": "AdamW", "output_dir": "outputs/", "overwrite_output_dir": true, "polynomial_decay_schedule_lr_end": 1e-07, "polynomial_decay_schedule_power": 1.0, "process_count": 1, "quantized_model": false, "reprocess_input_data": true, "save_best_model": true, "save_eval_checkpoints": true, "save_model_every_epoch": false, "save_optimizer_and_scheduler": true, "save_steps": 2000, "scheduler": "linear_schedule_with_warmup", "silent": false, "skip_special_tokens": true, "tensorboard_dir": null, "thread_count": null, "tokenizer_name": null, "tokenizer_type": null, "train_batch_size": 8, "train_custom_parameters_only": false, "use_cached_eval_features": false, "use_early_stopping": false, 
"use_hf_datasets": false, "use_multiprocessing": true, "use_multiprocessing_for_evaluation": true, "wandb_kwargs": {}, "wandb_project": null, "warmup_ratio": 0.06, "warmup_steps": 3, "weight_decay": 0.0, "model_class": "MultiLabelClassificationModel", "sliding_window": false, "stride": 0.8, "threshold": 0.5, "tie_value": 1, "labels_list": [], "labels_map": {}, "lazy_loading": false, "special_tokens_list": []}
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7359a64f7ac60b11e4347b3abdd42df81ae484eafb169932fb8d8078dcceebe
|
| 3 |
+
size 501289449
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2991
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ce85e0f40402828049238da313ad4b732e6efa682dca78dfe6fed583681441e
|
| 3 |
size 2991
|