tsrivatsav committed on
Commit
f2f6f68
1 Parent(s): 6ea8a36

add tokenizer

Browse files
added_tokens.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "</s>": 28,
3
- "<pad>": 29,
4
- "<s>": 27
5
  }
 
1
  {
2
+ "</s>": 30,
3
+ "<s>": 29
 
4
  }
runs/Jul21_14-56-25_Tejas-XPS22/1658429826.1307015/events.out.tfevents.1658429826.Tejas-XPS22.26960.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6667350dbbaa134b90a85b4e9365896a5ecc703e8ad15659deaec2e22faea416
3
+ size 5385
runs/Jul21_14-56-25_Tejas-XPS22/events.out.tfevents.1658429826.Tejas-XPS22.26960.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cdb35ef0b21503c52f0b11f7ef461f580e1fc312bf01c6a1a94c6b8ae2719a2
3
+ size 5092
special_tokens_map.json CHANGED
@@ -13,17 +13,10 @@
13
  "normalized": true,
14
  "rstrip": false,
15
  "single_word": false
16
- },
17
- {
18
- "content": "<pad>",
19
- "lstrip": false,
20
- "normalized": true,
21
- "rstrip": false,
22
- "single_word": false
23
  }
24
  ],
25
  "bos_token": "<s>",
26
  "eos_token": "</s>",
27
- "pad_token": "<pad>",
28
- "unk_token": "<unk>"
29
  }
 
13
  "normalized": true,
14
  "rstrip": false,
15
  "single_word": false
 
 
 
 
 
 
 
16
  }
17
  ],
18
  "bos_token": "<s>",
19
  "eos_token": "</s>",
20
+ "pad_token": "[PAD]",
21
+ "unk_token": "[UNK]"
22
  }
tokenizer_config.json CHANGED
@@ -3,10 +3,10 @@
3
  "do_lower_case": false,
4
  "eos_token": "</s>",
5
  "name_or_path": "./",
6
- "pad_token": "<pad>",
7
  "replace_word_delimiter_char": " ",
8
  "special_tokens_map_file": null,
9
  "tokenizer_class": "Wav2Vec2CTCTokenizer",
10
- "unk_token": "<unk>",
11
- "word_delimiter_token": "|"
12
  }
 
3
  "do_lower_case": false,
4
  "eos_token": "</s>",
5
  "name_or_path": "./",
6
+ "pad_token": "[PAD]",
7
  "replace_word_delimiter_char": " ",
8
  "special_tokens_map_file": null,
9
  "tokenizer_class": "Wav2Vec2CTCTokenizer",
10
+ "unk_token": "[UNK]",
11
+ "word_delimiter_token": " "
12
  }
vocab.json CHANGED
@@ -1,5 +1,7 @@
1
  {
2
  " ": 0,
 
 
3
  "a": 1,
4
  "b": 2,
5
  "c": 3,
 
1
  {
2
  " ": 0,
3
+ "[PAD]": 28,
4
+ "[UNK]": 27,
5
  "a": 1,
6
  "b": 2,
7
  "c": 3,