benjamin committed on
Commit 827fbba
1 parent: 6a96da3

add pt model, readme

Files changed (3)
  1. README.md +79 -0
  2. config.json +2 -1
  3. pytorch_model.bin +3 -0
README.md ADDED
@@ -0,0 +1,79 @@
+ ---
+ license: mit
+ language:
+ - af
+ - az
+ - be
+ - bg
+ - bn
+ - ca
+ - cs
+ - cy
+ - da
+ - de
+ - el
+ - en
+ - eo
+ - es
+ - et
+ - eu
+ - fa
+ - fi
+ - fr
+ - fy
+ - ga
+ - gl
+ - gu
+ - he
+ - hi
+ - hu
+ - hy
+ - id
+ - is
+ - it
+ - ka
+ - kk
+ - ky
+ - la
+ - lt
+ - lv
+ - mg
+ - mk
+ - ml
+ - mt
+ - nl
+ - pa
+ - pl
+ - pt
+ - ro
+ - ru
+ - sk
+ - sq
+ - sv
+ - ta
+ - te
+ - th
+ - tr
+ - uk
+ - yi
+ - yo
+ datasets:
+ - benjamin/compoundpiece
+ ---
+
+ CompoundPiece model trained only on Stage 1 training data (self-supervised training on hyphenated and non-hyphenated words scraped from the web). See [CompoundPiece: Evaluating and Improving Decompounding Performance of Language Models](https://arxiv.org/abs/2305.14214).
+
+ # Citation
+
+ ```
+ @article{minixhofer2023compoundpiece,
+   title={CompoundPiece: Evaluating and Improving Decompounding Performance of Language Models},
+   author={Minixhofer, Benjamin and Pfeiffer, Jonas and Vuli{\'c}, Ivan},
+   journal={arXiv preprint arXiv:2305.14214},
+   year={2023}
+ }
+ ```
+
+ # License
+
+ MIT
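
The added README documents a seq2seq decompounding model; the config.json change below confirms it is loaded as `T5ForConditionalGeneration` with a `ByT5Tokenizer`. A minimal usage sketch follows; the repo ID `benjamin/compoundpiece-stage1` is a hypothetical placeholder for this repository's Hub ID, and the expectation that the model generates a hyphen-separated segmentation of the input word is an assumption, not something stated in this commit.

```python
# Sketch, not part of the commit: load the model with Transformers and segment one word.
# The repo ID is a placeholder; the hyphen-separated output format is an assumption.
from transformers import AutoTokenizer, T5ForConditionalGeneration

model_id = "benjamin/compoundpiece-stage1"  # hypothetical Hub ID for this repository
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = T5ForConditionalGeneration.from_pretrained(model_id)

word = "Bundesfinanzministerium"
inputs = tokenizer(word, return_tensors="pt")
outputs = model.generate(**inputs, max_new_tokens=64)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
```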
config.json CHANGED
@@ -1,5 +1,5 @@
  {
- "_name_or_path": "/home/patrick/t5/byt5-base",
+ "_name_or_path": ".",
  "architectures": [
  "T5ForConditionalGeneration"
  ],
@@ -26,6 +26,7 @@
  "relative_attention_num_buckets": 32,
  "tie_word_embeddings": false,
  "tokenizer_class": "ByT5Tokenizer",
+ "torch_dtype": "float32",
  "transformers_version": "4.26.0",
  "use_cache": true,
  "vocab_size": 384
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9f52371ba6fe38aaaae24eb8321f23d805848674cf4e8f6daaad632af2bb2319
+ size 2326696509
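
pytorch_model.bin is committed as a Git LFS pointer: the repository stores only the SHA-256 (`oid`) and byte size of the roughly 2.3 GB weight file, not its contents. A sketch of verifying a downloaded copy against that pointer; the local file path is an assumption.

```python
# Sketch: check a downloaded pytorch_model.bin against the LFS pointer above.
# The local path is an assumption; the hash and size are taken from the pointer.
import hashlib
from pathlib import Path

expected_sha256 = "9f52371ba6fe38aaaae24eb8321f23d805848674cf4e8f6daaad632af2bb2319"
expected_size = 2326696509

path = Path("pytorch_model.bin")  # assumed local path of the resolved LFS file
assert path.stat().st_size == expected_size, "size mismatch"

digest = hashlib.sha256()
with path.open("rb") as f:
    for chunk in iter(lambda: f.read(1 << 20), b""):  # hash in 1 MiB chunks
        digest.update(chunk)
assert digest.hexdigest() == expected_sha256, "sha256 mismatch"
print("pytorch_model.bin matches the LFS pointer")
```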