Pablo Serna committed on
Commit ·
4f6f57d
1
Parent(s): dd1dea7
corrected to original config models
Browse files
- README.md +1 -1
- config.json +19 -7
- pytorch_model.bin +2 -2
README.md
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
|
| 3 |
Fine-tuning of a [question generator model](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation) into a rephraser model using a poor-man's translation of the Quora question pairs dataset.
|
| 4 |
|
| 5 |
-
- Original
|
| 6 |
- Custom database: "Poor-man's" translation of duplicated questions in Quora (translated with [Helsinki-NLP/opus-mt-en-es](https://huggingface.co/Helsinki-NLP/opus-mt-en-es))
|
| 7 |
|
| 8 |
|
|
|
|
| 2 |
|
| 3 |
Fine-tuning of a [question generator model](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation) into a rephraser model using a poor-man's translation of the Quora question pairs dataset.
|
| 4 |
|
| 5 |
+
- Original models: [mrm8488/bert2bert-spanish-question-generation](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation?text=Manuel+vive+en+Murcia%2C+Espa%C3%B1a), which is based on [dccuchile/bert-base-spanish-wwm-cased](https://huggingface.co/dccuchile/bert-base-spanish-wwm-cased) (?).
|
| 6 |
- Custom database: "Poor-man's" translation of duplicated questions in Quora (translated with [Helsinki-NLP/opus-mt-en-es](https://huggingface.co/Helsinki-NLP/opus-mt-en-es))
|
| 7 |
|
| 8 |
|
config.json
CHANGED
|
@@ -1,12 +1,13 @@
|
|
| 1 |
{
|
|
|
|
| 2 |
"architectures": [
|
| 3 |
"EncoderDecoderModel"
|
| 4 |
],
|
| 5 |
"decoder": {
|
| 6 |
-
"_name_or_path": "/
|
| 7 |
"add_cross_attention": true,
|
| 8 |
"architectures": [
|
| 9 |
-
"
|
| 10 |
],
|
| 11 |
"attention_probs_dropout_prob": 0.1,
|
| 12 |
"bad_words_ids": null,
|
|
@@ -73,7 +74,7 @@
|
|
| 73 |
"tokenizer_class": null,
|
| 74 |
"top_k": 50,
|
| 75 |
"top_p": 1.0,
|
| 76 |
-
"torch_dtype":
|
| 77 |
"torchscript": false,
|
| 78 |
"transformers_version": "4.18.0",
|
| 79 |
"type_vocab_size": 2,
|
|
@@ -82,11 +83,13 @@
|
|
| 82 |
"use_cache": true,
|
| 83 |
"vocab_size": 31002
|
| 84 |
},
|
|
|
|
|
|
|
| 85 |
"encoder": {
|
| 86 |
-
"_name_or_path": "/
|
| 87 |
"add_cross_attention": false,
|
| 88 |
"architectures": [
|
| 89 |
-
"
|
| 90 |
],
|
| 91 |
"attention_probs_dropout_prob": 0.1,
|
| 92 |
"bad_words_ids": null,
|
|
@@ -153,7 +156,7 @@
|
|
| 153 |
"tokenizer_class": null,
|
| 154 |
"top_k": 50,
|
| 155 |
"top_p": 1.0,
|
| 156 |
-
"torch_dtype":
|
| 157 |
"torchscript": false,
|
| 158 |
"transformers_version": "4.18.0",
|
| 159 |
"type_vocab_size": 2,
|
|
@@ -162,7 +165,16 @@
|
|
| 162 |
"use_cache": true,
|
| 163 |
"vocab_size": 31002
|
| 164 |
},
|
|
|
|
| 165 |
"is_encoder_decoder": true,
|
|
|
|
|
|
|
|
|
|
| 166 |
"model_type": "encoder-decoder",
|
| 167 |
-
"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 168 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "model/bert2bert-spanish-paraphraser",
|
| 3 |
"architectures": [
|
| 4 |
"EncoderDecoderModel"
|
| 5 |
],
|
| 6 |
"decoder": {
|
| 7 |
+
"_name_or_path": "dccuchile/bert-base-spanish-wwm-cased",
|
| 8 |
"add_cross_attention": true,
|
| 9 |
"architectures": [
|
| 10 |
+
"BertForMaskedLM"
|
| 11 |
],
|
| 12 |
"attention_probs_dropout_prob": 0.1,
|
| 13 |
"bad_words_ids": null,
|
|
|
|
| 74 |
"tokenizer_class": null,
|
| 75 |
"top_k": 50,
|
| 76 |
"top_p": 1.0,
|
| 77 |
+
"torch_dtype": null,
|
| 78 |
"torchscript": false,
|
| 79 |
"transformers_version": "4.18.0",
|
| 80 |
"type_vocab_size": 2,
|
|
|
|
| 83 |
"use_cache": true,
|
| 84 |
"vocab_size": 31002
|
| 85 |
},
|
| 86 |
+
"decoder_start_token_id": 4,
|
| 87 |
+
"early_stopping": true,
|
| 88 |
"encoder": {
|
| 89 |
+
"_name_or_path": "dccuchile/bert-base-spanish-wwm-cased",
|
| 90 |
"add_cross_attention": false,
|
| 91 |
"architectures": [
|
| 92 |
+
"BertForMaskedLM"
|
| 93 |
],
|
| 94 |
"attention_probs_dropout_prob": 0.1,
|
| 95 |
"bad_words_ids": null,
|
|
|
|
| 156 |
"tokenizer_class": null,
|
| 157 |
"top_k": 50,
|
| 158 |
"top_p": 1.0,
|
| 159 |
+
"torch_dtype": null,
|
| 160 |
"torchscript": false,
|
| 161 |
"transformers_version": "4.18.0",
|
| 162 |
"type_vocab_size": 2,
|
|
|
|
| 165 |
"use_cache": true,
|
| 166 |
"vocab_size": 31002
|
| 167 |
},
|
| 168 |
+
"eos_token_id": 5,
|
| 169 |
"is_encoder_decoder": true,
|
| 170 |
+
"length_penalty": 2.0,
|
| 171 |
+
"max_length": 128,
|
| 172 |
+
"min_length": 6,
|
| 173 |
"model_type": "encoder-decoder",
|
| 174 |
+
"no_repeat_ngram_size": 3,
|
| 175 |
+
"num_beams": 4,
|
| 176 |
+
"pad_token_id": 1,
|
| 177 |
+
"torch_dtype": "float32",
|
| 178 |
+
"transformers_version": null,
|
| 179 |
+
"vocab_size": 31002
|
| 180 |
}
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b608c377fb4f55b935210920489a91e3fc1c13d9a5e02fc464b5e683ac48efe2
|
| 3 |
+
size 992584811
|