Lysa
/

subheading_generator_nl

text2text-generation

Model card Files and versions

Lysa committed on Jun 11, 2021

Commit

4dcf42e

·

1 Parent(s): 4c3564c

add model

Files changed (2) hide show

config.json +15 -25
pytorch_model.bin +2 -2

config.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
-  "_name_or_path": "sshleifer/distilbart-xsum-12-1",
   "_num_labels": 3,
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "add_bias_logits": false,
-  "add_final_layer_norm": false,
   "architectures": [
-    "BartForConditionalGeneration"
   ],
   "attention_dropout": 0.0,
   "bos_token_id": 0,
@@ -16,19 +16,13 @@
   "decoder_attention_heads": 16,
   "decoder_ffn_dim": 4096,
   "decoder_layerdrop": 0.0,
-  "decoder_layers": 1,
-  "decoder_start_token_id": 2,
   "dropout": 0.1,
-  "early_stopping": true,
   "encoder_attention_heads": 16,
   "encoder_ffn_dim": 4096,
   "encoder_layerdrop": 0.0,
   "encoder_layers": 12,
   "eos_token_id": 2,
-  "eos_token_ids": [
-    2
-  ],
-  "extra_pos_embeddings": 2,
   "forced_eos_token_id": 2,
   "gradient_checkpointing": false,
   "id2label": {
@@ -43,27 +37,23 @@
     "LABEL_1": 1,
     "LABEL_2": 2
   },
-  "length_penalty": 0.5,
-  "max_length": 62,
   "max_position_embeddings": 1024,
-  "min_length": 11,
-  "model_type": "bart",
-  "no_repeat_ngram_size": 3,
-  "normalize_before": false,
   "normalize_embedding": true,
-  "num_beams": 6,
   "num_hidden_layers": 12,
   "output_past": true,
   "pad_token_id": 1,
-  "prefix": " ",
-  "replacing_rate": 0,
-  "save_step": 52,
-  "scale_embedding": false,
   "static_position_embeddings": false,
-  "student_decoder_layers": null,
-  "student_encoder_layers": null,
-  "task_specific_params": {},
   "transformers_version": "4.6.1",
   "use_cache": true,
-  "vocab_size": 50264
 }

 {
+  "_name_or_path": "facebook/mbart-large-cc25",
   "_num_labels": 3,
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "add_bias_logits": false,
+  "add_final_layer_norm": true,
   "architectures": [
+    "MBartForConditionalGeneration"
   ],
   "attention_dropout": 0.0,
   "bos_token_id": 0,
   "decoder_attention_heads": 16,
   "decoder_ffn_dim": 4096,
   "decoder_layerdrop": 0.0,
+  "decoder_layers": 12,
   "dropout": 0.1,
   "encoder_attention_heads": 16,
   "encoder_ffn_dim": 4096,
   "encoder_layerdrop": 0.0,
   "encoder_layers": 12,
   "eos_token_id": 2,
   "forced_eos_token_id": 2,
   "gradient_checkpointing": false,
   "id2label": {
     "LABEL_1": 1,
     "LABEL_2": 2
   },
+  "max_length": 1024,
   "max_position_embeddings": 1024,
+  "model_type": "mbart",
+  "normalize_before": true,
   "normalize_embedding": true,
+  "num_beams": 5,
   "num_hidden_layers": 12,
   "output_past": true,
   "pad_token_id": 1,
+  "scale_embedding": true,
   "static_position_embeddings": false,
+  "task_specific_params": {
+    "translation_en_to_ro": {
+      "decoder_start_token_id": 250020
+    }
+  },
   "transformers_version": "4.6.1",
   "use_cache": true,
+  "vocab_size": 250027
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ec7657d3380f68ebce97da0c6411dccc3cdd01797b91aa0361495c0b85e7c25f
-size 886398433

 version https://git-lfs.github.com/spec/v1
+oid sha256:7620da2177e1578d7c02c6bf4b3745ec7826ab7df89b470fabc60cee6f6af908
+size 2444611475