pserna committed on
Commit
4f6f57d
1 Parent(s): dd1dea7

corrected to original config models

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. config.json +19 -7
  3. pytorch_model.bin +2 -2
README.md CHANGED
@@ -2,7 +2,7 @@
2
 
3
  Fine-tuning of a [question generator model](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation) into a rephraser model using a poor-man's translation of the Quora question pairs dataset.
4
 
5
- - Original model: [mrm8488/bert2bert-spanish-question-generation](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation?text=Manuel+vive+en+Murcia%2C+Espa%C3%B1a)
6
  - Custom database: "Poor-man's" translation of duplicated questions in Quora (translated with [Helsinki-NLP/opus-mt-en-es](https://huggingface.co/Helsinki-NLP/opus-mt-en-es))
7
 
8
 
 
2
 
3
  Fine-tuning of a [question generator model](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation) into a rephraser model using a poor-man's translation of the Quora question pairs dataset.
4
 
5
+ - Original models: [mrm8488/bert2bert-spanish-question-generation](https://huggingface.co/mrm8488/bert2bert-spanish-question-generation?text=Manuel+vive+en+Murcia%2C+Espa%C3%B1a), which appears to be based on [dccuchile/bert-base-spanish-wwm-cased](https://huggingface.co/dccuchile/bert-base-spanish-wwm-cased).
6
  - Custom database: "Poor-man's" translation of duplicated questions in Quora (translated with [Helsinki-NLP/opus-mt-en-es](https://huggingface.co/Helsinki-NLP/opus-mt-en-es))
7
 
8
 
config.json CHANGED
@@ -1,12 +1,13 @@
1
  {
 
2
  "architectures": [
3
  "EncoderDecoderModel"
4
  ],
5
  "decoder": {
6
- "_name_or_path": "/tmp/tmpm0i7404y",
7
  "add_cross_attention": true,
8
  "architectures": [
9
- "BertLMHeadModel"
10
  ],
11
  "attention_probs_dropout_prob": 0.1,
12
  "bad_words_ids": null,
@@ -73,7 +74,7 @@
73
  "tokenizer_class": null,
74
  "top_k": 50,
75
  "top_p": 1.0,
76
- "torch_dtype": "float32",
77
  "torchscript": false,
78
  "transformers_version": "4.18.0",
79
  "type_vocab_size": 2,
@@ -82,11 +83,13 @@
82
  "use_cache": true,
83
  "vocab_size": 31002
84
  },
 
 
85
  "encoder": {
86
- "_name_or_path": "/tmp/tmp617aadbn",
87
  "add_cross_attention": false,
88
  "architectures": [
89
- "BertModel"
90
  ],
91
  "attention_probs_dropout_prob": 0.1,
92
  "bad_words_ids": null,
@@ -153,7 +156,7 @@
153
  "tokenizer_class": null,
154
  "top_k": 50,
155
  "top_p": 1.0,
156
- "torch_dtype": "float32",
157
  "torchscript": false,
158
  "transformers_version": "4.18.0",
159
  "type_vocab_size": 2,
@@ -162,7 +165,16 @@
162
  "use_cache": true,
163
  "vocab_size": 31002
164
  },
 
165
  "is_encoder_decoder": true,
 
 
 
166
  "model_type": "encoder-decoder",
167
- "transformers_version": null
 
 
 
 
 
168
  }
 
1
  {
2
+ "_name_or_path": "model/bert2bert-spanish-paraphraser",
3
  "architectures": [
4
  "EncoderDecoderModel"
5
  ],
6
  "decoder": {
7
+ "_name_or_path": "dccuchile/bert-base-spanish-wwm-cased",
8
  "add_cross_attention": true,
9
  "architectures": [
10
+ "BertForMaskedLM"
11
  ],
12
  "attention_probs_dropout_prob": 0.1,
13
  "bad_words_ids": null,
 
74
  "tokenizer_class": null,
75
  "top_k": 50,
76
  "top_p": 1.0,
77
+ "torch_dtype": null,
78
  "torchscript": false,
79
  "transformers_version": "4.18.0",
80
  "type_vocab_size": 2,
 
83
  "use_cache": true,
84
  "vocab_size": 31002
85
  },
86
+ "decoder_start_token_id": 4,
87
+ "early_stopping": true,
88
  "encoder": {
89
+ "_name_or_path": "dccuchile/bert-base-spanish-wwm-cased",
90
  "add_cross_attention": false,
91
  "architectures": [
92
+ "BertForMaskedLM"
93
  ],
94
  "attention_probs_dropout_prob": 0.1,
95
  "bad_words_ids": null,
 
156
  "tokenizer_class": null,
157
  "top_k": 50,
158
  "top_p": 1.0,
159
+ "torch_dtype": null,
160
  "torchscript": false,
161
  "transformers_version": "4.18.0",
162
  "type_vocab_size": 2,
 
165
  "use_cache": true,
166
  "vocab_size": 31002
167
  },
168
+ "eos_token_id": 5,
169
  "is_encoder_decoder": true,
170
+ "length_penalty": 2.0,
171
+ "max_length": 128,
172
+ "min_length": 6,
173
  "model_type": "encoder-decoder",
174
+ "no_repeat_ngram_size": 3,
175
+ "num_beams": 4,
176
+ "pad_token_id": 1,
177
+ "torch_dtype": "float32",
178
+ "transformers_version": null,
179
+ "vocab_size": 31002
180
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4ae07744796cab593ae8515ed390f334b50ad666b84fe2805822ff5f943ebf0
3
- size 992592171
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b608c377fb4f55b935210920489a91e3fc1c13d9a5e02fc464b5e683ac48efe2
3
+ size 992584811