Nikit_PDF_Chatbot / chatfuncs /ingest_borough_plan.py
Sean-Case
Changed embedding model, added reference to chat model on front page
275393f
raw
history blame
483 Bytes
import ingest as ing
# One-off ingestion script: parse the Lambeth borough plan PDF, split the
# parsed text into documents, and save an embedded FAISS index via the
# helpers in the local `ingest` module.

# Open the PDF in a context manager so the handle is closed once parsing is
# done (the original left it open for the lifetime of the process).
# NOTE(review): the file is opened in the default text mode, as before;
# presumably parse_file only needs the handle's `.name` — confirm against
# ingest.parse_file before switching to "rb".
with open("Lambeth_2030-Our_Future_Our_Lambeth.pdf") as borough_plan_file:
    borough_plan_text, file_names = ing.parse_file([borough_plan_file])
print("Borough plan text created")

# Dump the parsed output so it can be inspected in the console.
print(borough_plan_text)

borough_plan_docs = ing.text_to_docs(borough_plan_text)
print("Borough plan docs created")

# Model identifier passed to both the loader and the save step below so the
# two calls stay in agreement.
embedding_model = "BAAI/bge-base-en-v1.5"

# NOTE(review): `embeddings` is not used again in this script; the call is
# kept because load_embeddings may have side effects (e.g. fetching or
# caching the model) — confirm whether it can be dropped.
embeddings = ing.load_embeddings(model_name=embedding_model)

ing.embed_faiss_save_to_zip(
    borough_plan_docs,
    save_to="faiss_embedding",
    model_name=embedding_model,
)