edia_full_en / modules /module_crowsPairs.py
nanom's picture
First commit
e8aad19
from modules.module_customPllLabel import CustomPllLabel
from modules.module_pllScore import PllScore
from typing import Dict, List
class CrowsPairs:
def __init__(
self,
language_model, # LanguageModel class instance
errorManager # ErrorManager class instance
) -> None:
self.Label = CustomPllLabel()
self.pllScore = PllScore(
language_model=language_model
)
self.errorManager = errorManager
def errorChecking(
self,
sent_list: List[str],
) -> str:
out_msj = ""
mandatory_sents = [0,1]
for sent_id, sent in enumerate(sent_list):
c_sent = sent.strip()
if c_sent:
if not self.pllScore.sentIsCorrect(c_sent):
out_msj = ['CROWS-PAIRS_BAD_FORMATTED_SENTENCE', sent_id+1]
break
else:
if sent_id in mandatory_sents:
out_msj = ['CROWS-PAIRS_MANDATORY_SENTENCE_MISSING', sent_id+1]
break
return self.errorManager.process(out_msj)
def rank(
self,
sent_list: List[str],
) -> Dict[str, float]:
err = self.errorChecking(sent_list)
if err:
raise Exception(err)
all_plls_scores = {}
for sent in sent_list:
if sent:
all_plls_scores[sent] = self.pllScore.compute(sent)
return all_plls_scores