federicocosta1989 committed on
Commit
10d318c
1 Parent(s): c561e41

Upload tokenizer

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. vocab.json +23 -23
README.md CHANGED
@@ -1,8 +1,8 @@
1
  ---
2
  license: apache-2.0
3
- base_model: facebook/wav2vec2-base
4
  tags:
5
  - generated_from_trainer
 
6
  datasets:
7
  - common_voice_13_0
8
  model-index:
 
1
  ---
2
  license: apache-2.0
 
3
  tags:
4
  - generated_from_trainer
5
+ base_model: facebook/wav2vec2-base
6
  datasets:
7
  - common_voice_13_0
8
  model-index:
vocab.json CHANGED
@@ -1,27 +1,27 @@
1
  {
2
  "[PAD]": 24,
3
  "[UNK]": 23,
4
- "a": 21,
5
- "b": 2,
6
- "d": 3,
7
- "e": 16,
8
- "g": 5,
9
- "h": 15,
10
- "i": 10,
11
- "j": 4,
12
- "k": 22,
13
- "l": 12,
14
- "m": 18,
15
- "n": 0,
16
- "o": 9,
17
- "p": 6,
18
- "s": 1,
19
- "t": 8,
20
- "u": 19,
21
- "w": 20,
22
- "y": 13,
23
- "|": 7,
24
- "é": 11,
25
- "ñ": 17,
26
- "ô": 14
27
  }
 
1
  {
2
  "[PAD]": 24,
3
  "[UNK]": 23,
4
+ "a": 6,
5
+ "b": 5,
6
+ "d": 0,
7
+ "e": 15,
8
+ "g": 7,
9
+ "h": 9,
10
+ "i": 16,
11
+ "j": 8,
12
+ "k": 20,
13
+ "l": 17,
14
+ "m": 22,
15
+ "n": 1,
16
+ "o": 12,
17
+ "p": 11,
18
+ "s": 10,
19
+ "t": 18,
20
+ "u": 13,
21
+ "w": 4,
22
+ "y": 14,
23
+ "|": 2,
24
+ "é": 21,
25
+ "ñ": 3,
26
+ "ô": 19
27
  }