PereLluis13 committed on
Commit
708e782
1 Parent(s): 6c864ef

Add tokenizer files

Browse files
Files changed (3) hide show
  1. special_tokens_map.json +1 -0
  2. tokenizer_config.json +1 -0
  3. vocab.json +1 -0
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]"}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
1
+ {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|"}
vocab.json ADDED
@@ -0,0 +1 @@
 
1
+ {"ά": 0, "ή": 1, "ϊ": 2, "’": 3, "θ": 4, "ο": 5, "«": 6, "τ": 7, "φ": 8, "ό": 9, "ψ": 10, "ΐ": 11, "m": 12, "´": 13, "χ": 14, "ώ": 15, "υ": 16, "β": 17, "ί": 18, "κ": 20, "λ": 21, "η": 22, "ξ": 23, "r": 24, "a": 25, "ύ": 26, "ν": 27, "g": 28, "έ": 29, "α": 30, "ρ": 31, "σ": 32, "μ": 33, "e": 34, "ϋ": 35, "ε": 36, "‘": 37, "o": 38, "ς": 39, "γ": 40, "ζ": 41, "π": 42, "v": 43, "δ": 44, "h": 45, "n": 46, "»": 47, "ω": 48, "ι": 49, "́": 50, "|": 19, "[UNK]": 51, "[PAD]": 52}