""" utils.py - Utility functions for the project. """ def postprocess(text:str): """ postprocess - remove common values in scraped dataset Args: text (str): the text to postprocess """ replacements = { "ENA":"", "Enron":"", "Enron Corporation":"", "Sony Pictures Entertainment":"", "Columbia Pictures":"", "Sony":"", "Columbia":"", "Hillary":"Jane", "Clinton":"Smith", "Amy":"Jane", "Sara":"Jane", "Harambe":"Jane", "Pascal":"", } # replace common values, also check lowercase for k, v in replacements.items(): text = text.replace(k, v) text = text.replace(k.lower(), v) return text def clear(**kwargs): """for use with buttons""" return ""