"""Define constant values used across the project.""" class DefaultTokens(object): PAD = "" BOS = "" EOS = "" UNK = "" MASK = "" VOCAB_PAD = "averyunlikelytoken" SENT_FULL_STOPS = [".", "?", "!"] PHRASE_TABLE_SEPARATOR = "|||" ALIGNMENT_SEPARATOR = " ||| " SEP = "⦅newline⦆" MASK_BEFORE = "⦅_mask_before_⦆" class CorpusName(object): VALID = "valid" TRAIN = "train" SAMPLE = "sample" INFER = "infer" class CorpusTask(object): TRAIN = "train" VALID = "valid" INFER = "infer" class SubwordMarker(object): SPACER = "▁" JOINER = "■" BEGIN_UPPERCASE = "⦅mrk_begin_case_region_U⦆" END_UPPERCASE = "⦅mrk_end_case_region_U⦆" BEGIN_CASED = "⦅mrk_case_modifier_C⦆" class ModelTask(object): LANGUAGE_MODEL = "lm" SEQ2SEQ = "seq2seq"