Updated alphabet

Files changed (3) hide show

alphabet.json CHANGED Viewed

	@@ -1,3 +1 @@
1	- {"labels": ["'", " ", "1", "A", "0", "Z", "S", "E", "K", "3", "Ö", "V", "H", "X", "Å", "M", "C", "8", "R", "J", "I", "5", "6", "U", "P", "D", "Q", "N", "4", "2", "B", "W", "7", "", "G", "F", "T", "Ä", "L", "O", "Y", "É", "9", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u00e4", "\u00e5", "\u00e9", "\u00f4", "\u00f6", "\u00fc", "\u2047", "", "<s>", "</s>"], "is_bpe": false}
2	-
3	-


1	+ {"labels": ["", "R", "Z", "<s>", " ", "0", "9", "G", "F", "3", "L", "E", "Y", "Å", "A", "U", "J", "X", "T", "I", "M", "P", "N", "B", "É", "7", "</s>", "Ä", "1", "4", "C", "Ö", "⁇", "H", "V", "'", "5", "K", "W", "Q", "O", "6", "2", "8", "D", "S"], "is_bpe": false}

lm.py CHANGED Viewed

@@ -22,8 +22,5 @@ input_values = processor(resampled_audio, return_tensors="pt").input_values
 with torch.no_grad():
     logits = model(input_values).logits
-    import pdb
-    pdb.set_trace()
     transcription = processor.batch_decode(logits.numpy()).text
     print(transcription)

 with torch.no_grad():
     logits = model(input_values).logits
     transcription = processor.batch_decode(logits.numpy()).text
     print(transcription)

preprocessor_config.json CHANGED Viewed

@@ -5,5 +5,8 @@
   "padding_side": "right",
   "padding_value": 0,
   "return_attention_mask": true,
-  "sampling_rate": 16000
 }

   "padding_side": "right",
   "padding_value": 0,
   "return_attention_mask": true,
+  "sampling_rate": 16000,
+	"processor_class": "Wav2Vec2ProcessorWithLM"
 }