"""Define constant values used across the project."""


class DefaultTokens(object):
    """Namespace for special token strings and text separators.

    The attributes are plain class-level constants; the class is not
    meant to be instantiated.
    """

    # NOTE(review): the five tokens below are all the empty string, so
    # they compare equal to one another and cannot be told apart at
    # runtime. Confirm these are the intended values -- markers written
    # with angle brackets may have been stripped somewhere upstream.
    PAD = ''
    BOS = ''
    EOS = ''
    UNK = ''
    MASK = ''

    VOCAB_PAD = 'averyunlikelytoken'

    # Characters treated as sentence-final punctuation.
    SENT_FULL_STOPS = [".", "?", "!"]

    # The two separators differ only by the surrounding spaces.
    PHRASE_TABLE_SEPARATOR = '|||'
    ALIGNMENT_SEPARATOR = ' ||| '


class CorpusName(object):
    """Namespace for the string names of the corpus kinds."""

    VALID = 'valid'
    TRAIN = 'train'
    SAMPLE = 'sample'


class SubwordMarker(object):
    """Namespace for marker strings used in subword-level text."""

    SPACER = '▁'
    JOINER = '■'

    # Case markers (names suggest begin/end of an uppercase region and
    # a single-token case modifier -- presumably; verify with the
    # tokenizer that produces them).
    BEGIN_UPPERCASE = "⦅mrk_begin_case_region_U⦆"
    END_UPPERCASE = "⦅mrk_end_case_region_U⦆"
    BEGIN_CASED = "⦅mrk_case_modifier_C⦆"


class ModelTask(object):
    """Namespace for the string identifiers of the model tasks."""

    LANGUAGE_MODEL = 'lm'
    SEQ2SEQ = 'seq2seq'