cahya committed on
Commit
ef9c04d
1 Parent(s): b878951

add run_evaluation.py

Browse files
Files changed (1) hide show
  1. run_evaluation.py +3 -1
run_evaluation.py CHANGED
@@ -22,7 +22,9 @@ class KenLM:
22
  vocab_dict = tokenizer.get_vocab()
23
  self.vocabulary = [x[0] for x in sorted(vocab_dict.items(), key=lambda x: x[1], reverse=False)]
24
  self.vocabulary = self.vocabulary[:-2]
25
- self.decoder = build_ctcdecoder(self.vocabulary, model_name, unigrams=unigrams)
 
 
26
 
27
  @staticmethod
28
  def lm_postprocess(text):
 
22
  vocab_dict = tokenizer.get_vocab()
23
  self.vocabulary = [x[0] for x in sorted(vocab_dict.items(), key=lambda x: x[1], reverse=False)]
24
  self.vocabulary = self.vocabulary[:-2]
25
+ with open(unigrams, "r") as f:
26
+ unigrams_text = f.read()
27
+ self.decoder = build_ctcdecoder(self.vocabulary, model_name, unigrams=unigrams_text)
28
 
29
  @staticmethod
30
  def lm_postprocess(text):