gagan3012 committed on
Commit
e75e473
1 Parent(s): 6e2fe90

Initial commit

Browse files
Files changed (3) hide show
  1. special_tokens_map.json +1 -0
  2. tokenizer_config.json +1 -0
  3. vocab.json +1 -0
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]"}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|"}
vocab.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"ी": 0, "ल": 1, "ऊ": 2, "र": 3, "त": 4, "ठ": 5, "उ": 6, "ह": 7, "ब": 8, "ृ": 9, "ि": 10, "ऐ": 11, "फ": 12, "घ": 13, "च": 14, "ञ": 15, "ऋ": 16, "ज": 17, "झ": 19, "श": 20, "ङ": 21, "म": 22, "य": 23, "ो": 24, "ढ": 25, "‌": 26, "इ": 27, "न": 28, "थ": 29, "औ": 30, "ओ": 31, "ै": 32, "ए": 33, "ँ": 34, "ध": 35, "ं": 36, "ट": 37, "ख": 38, "ड": 39, "ा": 40, "आ": 41, "व": 42, "द": 43, "ग": 44, "ष": 45, "अ": 46, "ई": 47, "ॠ": 48, "स": 49, "ू": 50, "े": 51, "्": 52, "प": 53, "ु": 54, "छ": 55, "ः": 56, "ौ": 57, "ण": 58, "भ": 59, "‍": 60, "क": 61, "८": 62, "|": 18, "[UNK]": 63, "[PAD]": 64}