Spaces:

anakin87
/

fact-checking-rocks

Running

fact-checking-rocks / app_utils /backend_utils.py

anakin87

various improvements

4c2a969 over 2 years ago

2.05 kB

	import shutil
	from haystack.document_stores import FAISSDocumentStore
	from haystack.nodes import EmbeddingRetriever
	from haystack.pipelines import Pipeline

	import streamlit as st

	from app_utils.entailment_checker import EntailmentChecker

	from app_utils.config import STATEMENTS_PATH, INDEX_DIR, RETRIEVER_MODEL, RETRIEVER_MODEL_FORMAT, NLI_MODEL

	# cached to make index and models load only at start
	@st.cache(hash_funcs={"builtins.SwigPyObject": lambda _: None}, allow_output_mutation=True)
	def start_haystack():
	"""
	load document store, retriever, reader and create pipeline
	"""
	shutil.copy(f'{INDEX_DIR}/faiss_document_store.db', '.')
	document_store = FAISSDocumentStore(
	faiss_index_path=f'{INDEX_DIR}/my_faiss_index.faiss',
	faiss_config_path=f'{INDEX_DIR}/my_faiss_index.json')
	print(f'Index size: {document_store.get_document_count()}')

	retriever = EmbeddingRetriever(
	document_store=document_store,
	embedding_model=RETRIEVER_MODEL,
	model_format=RETRIEVER_MODEL_FORMAT
	)

	entailment_checker = EntailmentChecker(model_name_or_path=NLI_MODEL,
	use_gpu=False)


	pipe = Pipeline()
	pipe.add_node(component=retriever, name="retriever", inputs=["Query"])
	pipe.add_node(component=entailment_checker, name="ec", inputs=["retriever"])
	return pipe

	pipe = start_haystack()
	# the pipeline is not included as parameter of the following function,
	# because it is difficult to cache
	@st.cache(persist=True, allow_output_mutation=True)
	def query(question: str, retriever_top_k: int = 5):
	"""Run query and get answers"""
	params = {"retriever": {"top_k": retriever_top_k}}
	results = pipe.run(question, params=params)
	print(results)
	return results

	@st.cache()
	def load_questions():
	"""Load statements from file"""
	with open(STATEMENTS_PATH) as fin:
	questions = [line.strip() for line in fin.readlines()
	if not line.startswith('#')]
	return questions