hasanriaz121 committed
Commit 7c02716 • 1 parent: a9afbae

Added files
- docs.pkl +3 -0
- llm.py +26 -0
- main.py +73 -0
- requirements.txt +7 -0
- store.py +17 -0
docs.pkl
ADDED
version https://git-lfs.github.com/spec/v1
oid sha256:ce3d8ea1903d18cef3d930e538c93c8640598be027bba6918a2c1016173aae47
size 1592911
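The three lines above are a Git LFS pointer rather than the pickle itself; the real ~1.6 MB payload is fetched by Git LFS on checkout. Judging from store.py, which feeds the unpickled object straight into Chroma.from_documents, docs.pkl presumably holds a list of LangChain Document chunks. A quick inspection sketch under that assumption (not part of the commit):

import pickle

# Assumes the actual LFS payload has been fetched, not just the pointer file.
with open("docs.pkl", "rb") as f:
    docs = pickle.load(f)

print(type(docs), len(docs))       # expected: a list of Document objects
print(docs[0].page_content[:200])  # peek at the first chunk's text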
llm.py
ADDED
import os

from langchain_core.prompts import ChatPromptTemplate
from langchain_core.output_parsers import StrOutputParser
from langchain_core.runnables import RunnablePassthrough
from langchain_groq import ChatGroq


rag_template = """
Provide a summary from the context, which contains interpretations of Quranic texts that highlight the importance of the topic mentioned in the question. Do not include the Quranic texts themselves, but mention which Surah and verse.

Context:
{context}

Question:
{question}
"""


def create_chain(retreiver):
    # Read the Groq API key from the environment instead of hardcoding it:
    # the original commit embedded the secret as a string literal, exposing
    # it to anyone who can read the repository.
    llm = ChatGroq(api_key=os.environ["GROQ_API_KEY"], model="mixtral-8x7b-32768")
    rag_prompt = ChatPromptTemplate.from_template(rag_template)
    rag_chain = (
        {"context": retreiver, "question": RunnablePassthrough()}
        | rag_prompt
        | llm
        | StrOutputParser()
    )
    return rag_chain
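For orientation, the LCEL pipeline above fans a single string input out to both prompt variables: the retriever receives it as the search query that fills {context}, while RunnablePassthrough() forwards it verbatim as {question}. A minimal usage sketch, assuming a store built by store.py and a GROQ_API_KEY in the environment (not part of the commit):

from store import create_store
from llm import create_chain

store = create_store()                      # index docs.pkl into Chroma
chain = create_chain(store.as_retriever())  # wire the retriever into the chain

# The one string is both retrieved against (context) and passed through (question).
print(chain.invoke("patience"))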
main.py
ADDED
import gradio as gr
from fastapi import FastAPI
from pydantic import BaseModel
from contextlib import asynccontextmanager
from dotenv import load_dotenv

from llm import create_chain
from store import create_store, get_retreiver, save_retreiver

# load_dotenv()

# @asynccontextmanager
# async def lifespan(app: FastAPI):
#     # Load the ML model
#     global chain, store
#     # store = create_store()
#     # chain = create_chain(store.as_retriever())
#     yield
#     # Clean up the ML models and release the resources

app = FastAPI()


@app.on_event("startup")
async def startup():
    # Build the vector store and RAG chain once at startup and share them
    # across request handlers via module-level globals.
    global chain, store
    store = create_store()
    chain = create_chain(store.as_retriever())


class Request(BaseModel):
    prompt: str


class Response(BaseModel):
    response: str


def greet(message, history):
    return message


@app.post("/predict")
async def invoke_api(message, history="Abc"):
    return chain.invoke(message)


@app.post("/test", response_model=Response)
async def predict_api(prompt: Request):
    # Read the prompt from the request instance (the original accessed the
    # class attribute Request.prompt and called greet with one argument),
    # and wrap the string in the declared response model.
    response = greet(prompt.prompt, [])
    return Response(response=response)


async def invoke(message, history):
    return chain.invoke(message)


@app.get("/save_retreiver")
async def save_retreiver_api():
    save_retreiver(store)


demo = gr.ChatInterface(
    fn=invoke,
    title="LLM App",
    undo_btn="Delete Previous",
    clear_btn="Clear",
)

# Serve the Gradio chat UI at the root path of the same FastAPI app.
app = gr.mount_gradio_app(app, demo, path="/")


# if __name__ == "__main__":
#     # mounting at the root path
#     uvicorn.run(
#         app="main:app",
#         host="localhost",  # os.getenv("UVICORN_HOST"),
#         port=8000,  # int(os.getenv("UVICORN_PORT"))
#     )
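With the app running (for example via uvicorn main:app on the Space), the routes above can be smoke-tested in-process; the prompt strings below are illustrative only (not part of the commit):

from fastapi.testclient import TestClient
import main

# Entering the context manager runs the startup handler, which builds the
# Chroma store and RAG chain (requires docs.pkl and GROQ_API_KEY).
with TestClient(main.app) as client:
    # /predict declares `message` as a bare function parameter, so FastAPI
    # expects it as a query parameter.
    r = client.post("/predict", params={"message": "patience"})
    print(r.json())

    # /test round-trips the prompt through the Request/Response models.
    r = client.post("/test", json={"prompt": "hello"})
    print(r.json())  # {"response": "hello"}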
requirements.txt
ADDED
langchain_core
langchain_groq
langchain_community
gradio==4.8.0
fastapi
uvicorn
pydantic
# Required by store.py (Chroma, HuggingFaceEmbeddings) and main.py (dotenv)
# but absent from the original list:
chromadb
sentence-transformers
python-dotenv
store.py
ADDED
import pickle

from langchain_community.vectorstores import Chroma
from langchain_community.embeddings.huggingface import HuggingFaceEmbeddings


def create_store():
    # Load the pre-chunked documents and embed them into an in-memory Chroma index.
    with open("docs.pkl", "rb") as f:
        docs = pickle.load(f)
    embeds = HuggingFaceEmbeddings(model_name="BAAI/bge-base-en-v1.5")
    store = Chroma.from_documents(documents=docs, embedding=embeds)
    return store


def get_retreiver(store: Chroma):
    return store.as_retriever()


def save_retreiver(store: Chroma):
    # Note: a retriever over an in-memory Chroma client may not survive
    # pickling cleanly; see the persistence note below.
    with open("retreiver.pkl", "wb") as f:
        pickle.dump(store.as_retriever(), f)
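One caveat on save_retreiver: a retriever over an in-memory Chroma store holds a reference to the live client, so pickling it may fail or yield an object detached from its data. If the goal is to persist the index itself, Chroma's persist_directory is the usual route; a sketch under that assumption (not part of the commit):

import pickle

from langchain_community.vectorstores import Chroma
from langchain_community.embeddings.huggingface import HuggingFaceEmbeddings

embeds = HuggingFaceEmbeddings(model_name="BAAI/bge-base-en-v1.5")

with open("docs.pkl", "rb") as f:
    docs = pickle.load(f)

# Build once, writing the index to disk...
store = Chroma.from_documents(documents=docs, embedding=embeds,
                              persist_directory="chroma_db")

# ...then on later runs, reopen it without re-embedding anything.
store = Chroma(persist_directory="chroma_db", embedding_function=embeds)
retriever = store.as_retriever()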