Update app.py
app.py
CHANGED
@@ -28,6 +28,16 @@ MONGODB_COLLECTION_NAME = "gpt-4"
MONGODB_COLLECTION = client[MONGODB_DB_NAME][MONGODB_COLLECTION_NAME]
MONGODB_INDEX_NAME = "default"

+config = {
+    "model": "gpt-4",
+    "temperature": 0,
+}
+
+wandb_api_key = os.environ["WANDB_API_KEY"]
+wandb.login(key = wandb_api_key)
+wandb.init(project = "openai-llm-rag", config = config)
+config = wandb.config
+
template = """If you don't know the answer, just say that you don't know, don't try to make up an answer. Keep the answer as concise as possible. Always say
"🧠 Thanks for using the app - Bernd" at the end of the answer. """

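This hunk is the core of the change: the model settings move into a Weights & Biases run config and a run is opened at startup. A minimal standalone sketch of the same pattern (not the app itself; it assumes WANDB_API_KEY is set in the environment and the wandb package is installed):

import os
import wandb

# Hyperparameters to track for this run; the values mirror the commit.
config = {
    "model": "gpt-4",
    "temperature": 0,
}

# Authenticate against W&B and open a run in the project the app uses.
wandb.login(key = os.environ["WANDB_API_KEY"])
run = wandb.init(project = "openai-llm-rag", config = config)

# Rebinding config to the run's config means downstream code reads the tracked
# values (which a W&B sweep could override) instead of the local dict.
config = run.config
print(config.model, config.temperature)
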
@@ -48,8 +58,6 @@ YOUTUBE_URL_1 = "https://www.youtube.com/watch?v=--khbXchTeE"
YOUTUBE_URL_2 = "https://www.youtube.com/watch?v=hdhZwyf24mE"
YOUTUBE_URL_3 = "https://www.youtube.com/watch?v=vw-KWfKwvTQ"

-MODEL_NAME = "gpt-4"
-
def document_loading_splitting():
    # Document loading
    docs = []

@@ -96,16 +104,18 @@ def document_retrieval_mongodb(llm, prompt):

def llm_chain(llm, prompt):
    llm_chain = LLMChain(llm = llm, prompt = LLM_CHAIN_PROMPT)
-    completion = llm_chain.run({"question": prompt})
-    return completion
+    completion = llm_chain.run({"question": prompt})
+    wandb.log({"prompt": prompt, "completion": completion})
+    return completion

def rag_chain(llm, prompt, db):
    rag_chain = RetrievalQA.from_chain_type(llm,
                                            chain_type_kwargs = {"prompt": RAG_CHAIN_PROMPT},
                                            retriever = db.as_retriever(search_kwargs = {"k": 3}),
                                            return_source_documents = True)
-    completion = rag_chain({"query": prompt})
-    return completion["result"]
+    completion = rag_chain({"query": prompt})
+    wandb.log({"prompt": prompt, "completion": completion})
+    return completion["result"]

def invoke(openai_api_key, rag_option, prompt):
    if (openai_api_key == ""):

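Both chain helpers now log each prompt/completion pair to the open run before returning, so every question asked through the UI shows up in the W&B history. A small sketch of just that logging step, with the LangChain call stubbed out (the real code calls llm_chain.run(...) or rag_chain(...) at that point):

import wandb

wandb.init(project = "openai-llm-rag")  # assumes you are already logged in to W&B

def answer(prompt):
    # Stand-in for the chain call; the real code runs LLMChain or RetrievalQA.
    completion = "stub completion for: " + prompt
    # One log call per request: prompt and completion land in the run history.
    wandb.log({"prompt": prompt, "completion": completion})
    return completion

print(answer("What is retrieval-augmented generation?"))
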
@@ -115,9 +125,9 @@ def invoke(openai_api_key, rag_option, prompt):
    if (prompt == ""):
        raise gr.Error("Prompt is required.")
    try:
-        llm = ChatOpenAI(model_name = MODEL_NAME,
+        llm = ChatOpenAI(model_name = config.model,
                         openai_api_key = openai_api_key,
-                         temperature = 0)
+                         temperature = config.temperature)
        if (rag_option == "Chroma"):
            #splits = document_loading_splitting()
            #document_storage_chroma(splits)

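With the MODEL_NAME constant gone, invoke() builds the LLM from the tracked run config, so the model and temperature recorded in W&B always match the ones actually used. A rough sketch of that wiring, assuming the classic langchain.chat_models import path (the import itself is not shown in this diff; the API key literal is a placeholder, since the app takes it from the UI):

import wandb
from langchain.chat_models import ChatOpenAI

run = wandb.init(project = "openai-llm-rag",
                 config = {"model": "gpt-4", "temperature": 0})

# The LLM is parameterized by the tracked config, not by module-level constants.
llm = ChatOpenAI(model_name = run.config.model,
                 openai_api_key = "sk-...",
                 temperature = run.config.temperature)
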
@@ -155,7 +165,8 @@ description = """<strong>Overview:</strong> Context-aware multimodal reasoning a
<a href='https://www.mongodb.com/blog/post/introducing-atlas-vector-search-build-intelligent-applications-semantic-search-ai'>MongoDB</a> vector search.
<strong>Speech-to-text</strong> via <a href='https://openai.com/research/whisper'>whisper-1</a> model, <strong>text embedding</strong> via
<a href='https://openai.com/blog/new-and-improved-embedding-model'>text-embedding-ada-002</a> model, and <strong>text generation</strong> via
-<a href='""" + WEB_URL + """'>gpt-4</a> model. Implementation via AI-first <a href='https://www.langchain.com/'>LangChain</a> toolkit."""
+<a href='""" + WEB_URL + """'>gpt-4</a> model. Implementation via AI-first <a href='https://www.langchain.com/'>LangChain</a> toolkit.
+Model performance evaluation via <a href='https://wandb.ai/bstraehle'>Weights & Biases</a>."""

gr.close_all()
demo = gr.Interface(fn=invoke,
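The Gradio wiring itself is unchanged; only the description text gains a Weights & Biases line. For orientation, a hypothetical minimal Interface around an invoke-style function could look like the sketch below; the widget choices are illustrative and are not the app's actual inputs or outputs.

import gradio as gr

def invoke(openai_api_key, rag_option, prompt):
    # Placeholder body; the real invoke() builds the LLM and runs the selected chain.
    return "(" + rag_option + ") " + prompt

demo = gr.Interface(fn = invoke,
                    inputs = [gr.Textbox(label = "OpenAI API key", type = "password"),
                              gr.Radio(["Off", "Chroma", "MongoDB Atlas"], label = "Retrieval"),
                              gr.Textbox(label = "Prompt")],
                    outputs = gr.Textbox(label = "Completion"))
demo.launch()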