import gradio as gr
from transformers import pipeline
import PyPDF2
import markdown
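
# Runtime dependencies: gradio, transformers (with a backend such as torch), PyPDF2, and markdown
# must be available in the environment (e.g. via the Space's requirements.txt).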

# QA checkpoints offered in the dropdown (display name -> Hugging Face model ID)
models = {
    "distilbert-base-uncased-distilled-squad": "distilbert-base-uncased-distilled-squad",
    "roberta-base-squad2": "deepset/roberta-base-squad2",
    "bert-large-uncased-whole-word-masking-finetuned-squad": "bert-large-uncased-whole-word-masking-finetuned-squad",
    "albert-base-v2": "twmkn9/albert-base-v2-squad2",
    "xlm-roberta-large-squad2": "deepset/xlm-roberta-large-squad2"
}

# Cache of pipelines that have already been instantiated, keyed by display name
loaded_models = {}
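
# Instantiate a QA pipeline the first time a model is requested and cache it for reuse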
def load_model(model_name):
    if model_name not in loaded_models:
        loaded_models[model_name] = pipeline("question-answering", model=models[model_name])
    return loaded_models[model_name]
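
# Build the context from the uploaded file, run extractive QA, and return the answer,
# its confidence score, a score explanation, and a status message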
def answer_question(model_name, file, question):
    model = load_model(model_name)
    if file is None:
        return "Please upload a document first.", "", "", "No document provided."
    # gr.File may hand the callback a tempfile wrapper or a plain file path
    file_path = getattr(file, "name", file)
    if file_path.lower().endswith(".pdf"):
        pdf_reader = PyPDF2.PdfReader(file_path)
        context = ""
        for page in pdf_reader.pages:
            context += page.extract_text() or ""
    elif file_path.lower().endswith(".md"):
        with open(file_path, "r", encoding="utf-8") as f:
            context = f.read()
        # Convert the Markdown to HTML before using it as context
        context = markdown.markdown(context)
    else:
        with open(file_path, "r", encoding="utf-8") as f:
            context = f.read()
    result = model(question=question, context=context)
    answer = result["answer"]
    score = result["score"]
    # Explain the confidence score
    score_explanation = (
        f"The confidence score ranges from 0 to 1, where a higher score indicates higher "
        f"confidence in the answer's correctness. In this case, the score is {score:.2f}. "
        f"A score closer to 1 implies the model is very confident about the answer."
    )
    status = "Model loaded"
    return answer, f"{score:.2f}", score_explanation, status

# Define the Gradio interface
with gr.Blocks() as interface:
    gr.Markdown(
        """
        # Question Answering System
        Upload a document (text, PDF, or Markdown) and ask questions to get answers based on the context.

        **Supported File Types**: `.txt`, `.pdf`, `.md`
        """)
    with gr.Row():
        model_dropdown = gr.Dropdown(
            choices=list(models.keys()),
            label="Select Model",
            value="distilbert-base-uncased-distilled-squad"
        )
    with gr.Row():
        file_input = gr.File(label="Upload Document", file_types=[".txt", ".pdf", ".md"])
        question_input = gr.Textbox(lines=2, placeholder="Enter your question here...", label="Question")
    with gr.Row():
        answer_output = gr.Textbox(label="Answer")
        score_output = gr.Textbox(label="Confidence Score")
        explanation_output = gr.Textbox(label="Score Explanation")
    with gr.Row():
        submit_button = gr.Button("Submit")
        status_output = gr.Markdown(value="")
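
    # Run the QA flow on click and populate the answer, score, explanation, and status fields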
    submit_button.click(
        answer_question,
        inputs=[model_dropdown, file_input, question_input],
        outputs=[answer_output, score_output, explanation_output, status_output]
    )

if __name__ == "__main__":
    interface.launch()