Spaces:

qfisch
/

pdf-rag-mistral-7b

Running

App Files Files Community

Quentin Fisch committed on Feb 28

Commit

efb5688

•

1 Parent(s): 5c4f525

feat(demo): add demo files

Browse files

Files changed (3) hide show

app.py +79 -0
confluence_rag.py +185 -0
requirements.txt +4 -0

app.py ADDED Viewed

	@@ -0,0 +1,79 @@

+"""
+Gradio UI for Mistral 7B with RAG
+"""
+import os
+from typing import List
+import gradio as gr
+from langchain_core.runnables.base import RunnableSequence
+import numpy as np
+from confluence_rag import generate_rag_chain, load_pdf, store_vector, load_multiple_pdf
+def initialize_chain(file: gr.File) -> RunnableSequence:
+    """
+    Initializes the chain with the given file.
+    If no file is provided, the llm is used without RAG.
+    Args:
+        file (gr.File): file to initialize the chain with
+    Returns:
+        RunnableSequence: the chain
+    """
+    if file is None:
+        return generate_rag_chain()
+    if len(file) == 1:
+        pdf = load_pdf(file[0].name)
+    else:
+        pdf = load_multiple_pdf([f.name for f in file])
+    retriever = store_vector(pdf)
+    return generate_rag_chain(retriever)
+def invoke_chain(message: str, history: List[str], file: gr.File = None) -> str:
+    """
+    Invokes the chain with the given message and updates the chain if a new file is provided.
+    Args:
+        message (str): message to invoke the chain with
+        history (List[str]): history of messages
+        file (gr.File, optional): file to update the chain with. Defaults to None.
+    Returns:
+        str: the response of the chain
+    """
+    # Check if file is provided and exists
+    if file is not None and not np.all([os.path.exists(f.name) for f in file]) or len(file) == 0:
+        return "Error: File not found."
+    if file is not None and not np.all([f.name.endswith(".pdf") for f in file]):
+        return "Error: File is not a pdf."
+    chain = initialize_chain(file)
+    return chain.invoke(message)
+def create_demo() -> gr.Interface:
+    """
+    Creates and returns a Gradio Chat Interface.
+    Returns:
+        gr.Interface: the Gradio Chat Interface
+    """
+    return gr.ChatInterface(
+        invoke_chain,
+        additional_inputs=[gr.File(label="File", file_count='multiple')],
+        title="Mistral 7B with RAG",
+        description="Ask questions to Mistral about your pdf document.",
+        theme="soft",
+    )
+if __name__ == "__main__":
+    # Script entry point: build the chat interface and start the Gradio app.
+    demo = create_demo()
+    demo.launch()

confluence_rag.py ADDED Viewed

	@@ -0,0 +1,185 @@

+import os
+from typing import List
+from langchain_community.document_loaders import UnstructuredPDFLoader
+from langchain_community.embeddings import HuggingFaceInferenceAPIEmbeddings
+from langchain_community.llms.huggingface_endpoint import HuggingFaceEndpoint
+from langchain.prompts import ChatPromptTemplate
+from langchain.schema.output_parser import StrOutputParser
+from langchain.schema.runnable import RunnablePassthrough
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from langchain_community.vectorstores.chroma import Chroma
+from langchain_core.runnables.base import RunnableSequence
+from langchain_core.vectorstores import VectorStoreRetriever
+from dotenv import load_dotenv
+# Load environment variables via python-dotenv (presumably from a local .env file) at import time.
+load_dotenv()
+# Hugging Face API token used by the embeddings and llm clients below.
+# Indexing os.environ raises KeyError at import time when the variable is not set.
+HF_API_KEY = os.environ["HF_API_KEY"]
+class MistralOutputParser(StrOutputParser):
+    """OutputParser that parser llm result from Mistral API"""
+    def parse(self, text: str) -> str:
+        """
+        Returns the input text with no changes.
+        Args:
+            text (str): text to parse
+        Returns:
+            str: parsed text
+        """
+        return text.split("[/INST]")[-1].strip()
+def load_pdf(
+    document_path: str,
+    mode: str = "single",
+    strategy: str = "fast",
+    chunk_size: int = 500,
+    chunk_overlap: int = 0,
+) -> List[str]:
+    """
+    Load a pdf document and split it into chunks of text.
+    Args:
+        document_path (Path): path to the pdf document
+        mode (str, optional): mode of the loader. Defaults to "single".
+        strategy (str, optional): strategy of the loader. Defaults to "fast".
+        chunk_size (int, optional): size of the chunks. Defaults to 500.
+        chunk_overlap (int, optional): overlap of the chunks. Defaults to 0.
+    Returns:
+        List[str]: list of chunks of text
+    """
+    # Load the document
+    loader = UnstructuredPDFLoader(
+        document_path,
+        mode=mode,
+        strategy=strategy,
+    )
+    docs = loader.load()
+    # Split the document into chunks of text
+    text_splitter = RecursiveCharacterTextSplitter(
+        chunk_size=chunk_size, chunk_overlap=chunk_overlap
+    )
+    all_splits = text_splitter.split_documents(docs)
+    return all_splits
+def store_vector(all_splits: List[str]) -> VectorStoreRetriever:
+    """
+    Store vector of each chunk of text.
+    Args:
+        all_splits (List[str]): list of chunks of text
+    Returns:
+        VectorStoreRetriever: retriever that can be used to retrieve the vector of a chunk of text
+    """
+    # Use the HuggingFace distilbert-base-uncased model to embed the text
+    embeddings_model_url = (
+        "https://api-inference.huggingface.co/models/distilbert-base-uncased"
+    )
+    embeddings = HuggingFaceInferenceAPIEmbeddings(
+        endpoint_url=embeddings_model_url,
+        api_key=HF_API_KEY,
+    )
+    # Store the embeddings of each chunk of text into ChromaDB
+    vector_store = Chroma.from_documents(all_splits, embeddings)
+    retriever = vector_store.as_retriever()
+    return retriever
+def generate_mistral_rag_prompt() -> ChatPromptTemplate:
+    """
+    Generate a prompt for Mistral API wiht RAG.
+    Returns:
+        ChatPromptTemplate: prompt for Mistral API
+    """
+    template = "<s>[INST] {context} {prompt} [/INST]"
+    prompt_template = ChatPromptTemplate.from_template(template)
+    return prompt_template
+def generate_mistral_simple_prompt() -> ChatPromptTemplate:
+    """
+    Generate a simple prompt for Mistral without RAG.
+    Returns:
+        ChatPromptTemplate: prompt for Mistral API
+    """
+    template = "[INST] {prompt} [/INST]"
+    prompt_template = ChatPromptTemplate.from_template(template)
+    return prompt_template
+def generate_rag_chain(retriever: VectorStoreRetriever = None) -> RunnableSequence:
+    """
+    Generate a RAG chain with Mistral API and ChromaDB.
+    Args:
+        Retriever (VectorStoreRetriever): retriever that can be used to retrieve the vector of a chunk of text
+    Returns:
+        RunnableSequence: RAG chain
+    """
+    # Use the Mistral Free prototype API
+    mistral_url = (
+        "https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.2"
+    )
+    model_endpoint = HuggingFaceEndpoint(
+        endpoint_url=mistral_url,
+        huggingfacehub_api_token=HF_API_KEY,
+        task="text2text-generation",
+    )
+    # Use a custom output parser
+    output_parser = MistralOutputParser()
+    # If no retriever is provided, use a simple prompt
+    if retriever is None:
+        entry = {"prompt": RunnablePassthrough()}
+        return entry | generate_mistral_simple_prompt() | model_endpoint | output_parser
+    # If a retriever is provided, use a RAG prompt
+    retrieval = {"context": retriever, "prompt": RunnablePassthrough()}
+    return retrieval | generate_mistral_rag_prompt() | model_endpoint | output_parser
+def load_multiple_pdf(document_paths: List[str]) -> List[str]:
+    """
+    Load multiple pdf documents and split them into chunks of text.
+    Args:
+        document_paths (List[str]): list of paths to the pdf documents
+    Returns:
+        List[str]: list of chunks of text
+    """
+    docs = []
+    for document_path in document_paths:
+        loader = UnstructuredPDFLoader(
+            document_path,
+            mode="single",
+            strategy="fast",
+        )
+        docs.extend(loader.load())
+    text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=25)
+    all_splits = text_splitter.split_documents(docs)
+    return all_splits

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+langchain==0.1.9
+chromadb==0.4.24
+unstructured[pdf]
+gradio