Spaces:

benintw
/

hello_world_RAG

Sleeping

App Files Files Community

hello_world_RAG / my_ollama.py

benintw

Upload 3 files

e878e8a verified about 1 year ago

raw

history blame contribute delete

2.13 kB

	"""
	This works.

	reference: https://www.youtube.com/watch?v=CPgp8MhmGVY
	"""

	# Imports
	import gradio as gr
	from langchain_community.llms import Ollama
	from langchain_community.document_loaders import WebBaseLoader
	from langchain.text_splitter import RecursiveCharacterTextSplitter

	# dont use this embeddings
	# from langchain.embeddings import GPT4AllEmbeddings
	# from langchain_community.embeddings import GPT4AllEmbeddings

	# from langchain.embeddings import SentenceTransformerEmbeddings
	from langchain_community.embeddings import SentenceTransformerEmbeddings

	# from langchain.vectorstores import Chroma
	from langchain_community.vectorstores import Chroma

	from langchain.chains import RetrievalQA


	# Instantiate the Ollama model
	ollama = Ollama(
	# base_url="http://localhost:3000",
	model="llama3"
	)

	# Load the webpage content using WebBaseLoader
	loader = WebBaseLoader("https://en.wikipedia.org/wiki/Tsai_Ing-wen")
	data = loader.load()

	# Split the text into manageable chunks using RecursiveCharacterTextSplitter
	text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=0)
	all_splits = text_splitter.split_documents(data)

	# Instantiate SentenceTransformers embeddings with the specified model
	sentence_embeddings = SentenceTransformerEmbeddings(model_name="all-MiniLM-L6-v2")

	# Create the vector store from the document splits and embeddings
	vectorstore = Chroma.from_documents(documents=all_splits, embedding=sentence_embeddings)

	# Create a QA chain using the Ollama model and the vector store retriever
	qachain = RetrievalQA.from_chain_type(ollama, retriever=vectorstore.as_retriever())


	# Function to handle the question and return the answer
	def answer_question(question):
	response = qachain({"query": question})
	return response["result"]


	# Create a Gradio interface
	interface = gr.Interface(
	fn=answer_question,
	inputs="text",
	outputs="text",
	title="RAG Model QA Interface",
	description="Ask a question about Tsai Ing-wen and get an answer from the Retrieval-Augmented Generation model.",
	)

	# Launch the Gradio interface
	interface.launch(share=True)