Corrected config to point to the original models
Browse files
- README.md +1 -1
- config.json +19 -7
- pytorch_model.bin +2 -2
README.md
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
|
3 |
Fine-tuning of a [question generator model](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation) into a paraphraser model using a "poor man's" translation of the Quora Question Pairs dataset.
|
4 |
|
5 |
-
- Original
|
6 |
- Custom dataset: "Poor man's" translation of duplicate questions from Quora (translated with [Helsinki-NLP/opus-mt-en-es](https://huggingface.co/Helsinki-NLP/opus-mt-en-es)).
|
7 |
|
8 |
|
|
|
2 |
|
3 |
Fine-tuning of a [question generator model](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation) into a paraphraser model using a "poor man's" translation of the Quora Question Pairs dataset.
|
4 |
|
5 |
+
- Original models: [mrm8488/bert2bert-spanish-question-generation](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation), which appears to be based on [dccuchile/bert-base-spanish-wwm-cased](https://huggingface.co/dccuchile/bert-base-spanish-wwm-cased).
|
6 |
- Custom dataset: "Poor man's" translation of duplicate questions from Quora (translated with [Helsinki-NLP/opus-mt-en-es](https://huggingface.co/Helsinki-NLP/opus-mt-en-es)).
|
7 |
|
8 |
|
config.json
CHANGED
@@ -1,12 +1,13 @@
|
|
1 |
{
|
|
|
2 |
"architectures": [
|
3 |
"EncoderDecoderModel"
|
4 |
],
|
5 |
"decoder": {
|
6 |
-
"_name_or_path": "/
|
7 |
"add_cross_attention": true,
|
8 |
"architectures": [
|
9 |
-
"
|
10 |
],
|
11 |
"attention_probs_dropout_prob": 0.1,
|
12 |
"bad_words_ids": null,
|
@@ -73,7 +74,7 @@
|
|
73 |
"tokenizer_class": null,
|
74 |
"top_k": 50,
|
75 |
"top_p": 1.0,
|
76 |
-
"torch_dtype":
|
77 |
"torchscript": false,
|
78 |
"transformers_version": "4.18.0",
|
79 |
"type_vocab_size": 2,
|
@@ -82,11 +83,13 @@
|
|
82 |
"use_cache": true,
|
83 |
"vocab_size": 31002
|
84 |
},
|
|
|
|
|
85 |
"encoder": {
|
86 |
-
"_name_or_path": "/
|
87 |
"add_cross_attention": false,
|
88 |
"architectures": [
|
89 |
-
"
|
90 |
],
|
91 |
"attention_probs_dropout_prob": 0.1,
|
92 |
"bad_words_ids": null,
|
@@ -153,7 +156,7 @@
|
|
153 |
"tokenizer_class": null,
|
154 |
"top_k": 50,
|
155 |
"top_p": 1.0,
|
156 |
-
"torch_dtype":
|
157 |
"torchscript": false,
|
158 |
"transformers_version": "4.18.0",
|
159 |
"type_vocab_size": 2,
|
@@ -162,7 +165,16 @@
|
|
162 |
"use_cache": true,
|
163 |
"vocab_size": 31002
|
164 |
},
|
|
|
165 |
"is_encoder_decoder": true,
|
|
|
|
|
|
|
166 |
"model_type": "encoder-decoder",
|
167 |
-
"
|
|
|
|
|
|
|
|
|
|
|
168 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "model/bert2bert-spanish-paraphraser",
|
3 |
"architectures": [
|
4 |
"EncoderDecoderModel"
|
5 |
],
|
6 |
"decoder": {
|
7 |
+
"_name_or_path": "dccuchile/bert-base-spanish-wwm-cased",
|
8 |
"add_cross_attention": true,
|
9 |
"architectures": [
|
10 |
+
"BertForMaskedLM"
|
11 |
],
|
12 |
"attention_probs_dropout_prob": 0.1,
|
13 |
"bad_words_ids": null,
|
|
|
74 |
"tokenizer_class": null,
|
75 |
"top_k": 50,
|
76 |
"top_p": 1.0,
|
77 |
+
"torch_dtype": null,
|
78 |
"torchscript": false,
|
79 |
"transformers_version": "4.18.0",
|
80 |
"type_vocab_size": 2,
|
|
|
83 |
"use_cache": true,
|
84 |
"vocab_size": 31002
|
85 |
},
|
86 |
+
"decoder_start_token_id": 4,
|
87 |
+
"early_stopping": true,
|
88 |
"encoder": {
|
89 |
+
"_name_or_path": "dccuchile/bert-base-spanish-wwm-cased",
|
90 |
"add_cross_attention": false,
|
91 |
"architectures": [
|
92 |
+
"BertForMaskedLM"
|
93 |
],
|
94 |
"attention_probs_dropout_prob": 0.1,
|
95 |
"bad_words_ids": null,
|
|
|
156 |
"tokenizer_class": null,
|
157 |
"top_k": 50,
|
158 |
"top_p": 1.0,
|
159 |
+
"torch_dtype": null,
|
160 |
"torchscript": false,
|
161 |
"transformers_version": "4.18.0",
|
162 |
"type_vocab_size": 2,
|
|
|
165 |
"use_cache": true,
|
166 |
"vocab_size": 31002
|
167 |
},
|
168 |
+
"eos_token_id": 5,
|
169 |
"is_encoder_decoder": true,
|
170 |
+
"length_penalty": 2.0,
|
171 |
+
"max_length": 128,
|
172 |
+
"min_length": 6,
|
173 |
"model_type": "encoder-decoder",
|
174 |
+
"no_repeat_ngram_size": 3,
|
175 |
+
"num_beams": 4,
|
176 |
+
"pad_token_id": 1,
|
177 |
+
"torch_dtype": "float32",
|
178 |
+
"transformers_version": null,
|
179 |
+
"vocab_size": 31002
|
180 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b608c377fb4f55b935210920489a91e3fc1c13d9a5e02fc464b5e683ac48efe2
|
3 |
+
size 992584811
|