Update tokenizer_config.json
Browse files- tokenizer_config.json +1 -1
tokenizer_config.json
CHANGED
@@ -1,6 +1,5 @@
|
|
1 |
{
|
2 |
"bos_token": "<s>",
|
3 |
-
"clean_up_tokenization_spaces": true,
|
4 |
"do_lower_case": false,
|
5 |
"do_normalize": true,
|
6 |
"eos_token": "</s>",
|
@@ -9,6 +8,7 @@
|
|
9 |
"processor_class": "Wav2Vec2Processor",
|
10 |
"replace_word_delimiter_char": " ",
|
11 |
"return_attention_mask": false,
|
|
|
12 |
"tokenizer_class": "Wav2Vec2CTCTokenizer",
|
13 |
"unk_token": "<unk>",
|
14 |
"word_delimiter_token": "|"
|
|
|
1 |
{
|
2 |
"bos_token": "<s>",
|
|
|
3 |
"do_lower_case": false,
|
4 |
"do_normalize": true,
|
5 |
"eos_token": "</s>",
|
|
|
8 |
"processor_class": "Wav2Vec2Processor",
|
9 |
"replace_word_delimiter_char": " ",
|
10 |
"return_attention_mask": false,
|
11 |
+
"special_tokens_map_file": "/root/.cache/huggingface/hub/models--facebook--wav2vec2-base/snapshots/0b5b8e868dd84f03fd87d01f9c4ff0f080fecfe8/special_tokens_map.json",
|
12 |
"tokenizer_class": "Wav2Vec2CTCTokenizer",
|
13 |
"unk_token": "<unk>",
|
14 |
"word_delimiter_token": "|"
|