# Load the files under ./data/ with LangChain's BeautifulSoup-based HTML
# loader and serialize the resulting documents to shakespeare.pkl.
import pickle

from langchain.document_loaders import BSHTMLLoader, DirectoryLoader

# DirectoryLoader walks ./data/ and hands each file it selects to the loader
# class given in loader_cls (here BSHTMLLoader).
bshtml_dir_loader = DirectoryLoader("./data/", loader_cls=BSHTMLLoader)

# load() reads everything eagerly; `data` holds whatever the loader returns
# (a list of LangChain Document objects per the library docs).
data = bshtml_dir_loader.load()

# Binary mode is required by pickle. The context manager guarantees the file
# is flushed and closed even if serialization raises.
# NOTE: pickle files can execute arbitrary code when loaded, so only unpickle
# shakespeare.pkl in an environment that trusts whoever produced it.
with open("shakespeare.pkl", "wb") as fp:
    pickle.dump(data, fp)