jonatasgrosman committed on
Commit
28eea7f
1 Parent(s): cc70113
alphabet.json ADDED
@@ -0,0 +1 @@
 
1
+ {"labels": ["", "<s>", "</s>", "⁇", " ", "'", "-", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "à", "á", "â", "ã", "ç", "é", "ê", "í", "ó", "ô", "õ", "ú", "ü"], "is_bpe": false}
language_model/attrs.json ADDED
@@ -0,0 +1 @@
 
1
+ {"alpha": 0.5, "beta": 1.5, "unk_score_offset": -10.0, "score_boundary": true}
language_model/lm.binary ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85fcd2ff940b967b801090070c2325c0c3b3005fc0e26e167f44fcddc56e2439
3
+ size 1182518752
language_model/unigrams.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1b261381b8dabfbf647e1343be2e3ab126f07058fe4d0ba451017ecaf0d3fdd
3
+ size 8054189
preprocessor_config.json CHANGED
@@ -5,5 +5,6 @@
5
  "padding_side": "right",
6
  "padding_value": 0.0,
7
  "return_attention_mask": true,
8
- "sampling_rate": 16000
 
9
  }
5
  "padding_side": "right",
6
  "padding_value": 0.0,
7
  "return_attention_mask": true,
8
+ "sampling_rate": 16000,
9
+ "processor_class": "Wav2Vec2ProcessorWithLM"
10
  }
vocab.json CHANGED
@@ -1 +1 @@
1
- {"<pad>": 0, "<s>": 1, "</s>": 2, "<unk>": 3, "|": 4, "'": 5, "-": 6, "A": 7, "B": 8, "C": 9, "D": 10, "E": 11, "F": 12, "G": 13, "H": 14, "I": 15, "J": 16, "K": 17, "L": 18, "M": 19, "N": 20, "O": 21, "P": 22, "Q": 23, "R": 24, "S": 25, "T": 26, "U": 27, "V": 28, "W": 29, "X": 30, "Y": 31, "Z": 32, "À": 33, "Á": 34, "Â": 35, "Ã": 36, "Ç": 37, "É": 38, "Ê": 39, "Í": 40, "Ó": 41, "Ô": 42, "Õ": 43, "Ú": 44, "Ü": 45}
1
+ {"<pad>": 0, "<s>": 1, "</s>": 2, "<unk>": 3, "|": 4, "'": 5, "-": 6, "a": 7, "b": 8, "c": 9, "d": 10, "e": 11, "f": 12, "g": 13, "h": 14, "i": 15, "j": 16, "k": 17, "l": 18, "m": 19, "n": 20, "o": 21, "p": 22, "q": 23, "r": 24, "s": 25, "t": 26, "u": 27, "v": 28, "w": 29, "x": 30, "y": 31, "z": 32, "à": 33, "á": 34, "â": 35, "ã": 36, "ç": 37, "é": 38, "ê": 39, "í": 40, "ó": 41, "ô": 42, "õ": 43, "ú": 44, "ü": 45}