Spaces:

mbudisic
/

PsTuts-RAG

Sleeping

mbudisic committed on Jun 5

Commit

e86ca95

1 Parent(s): 4df9c16

refactor: Update search_help function and improve logging

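- Simplified the signature of the `search_help` function by dropping the `Command[...]` return annotation; the function now returns a plain state-update dict, and routing to `route_is_complete` is handled by an explicit graph edge.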
- Enhanced logging throughout the `search_help` function to provide better insights into its execution flow.
- Updated the `create_transcript_rag_chain` function to accept only `Configuration` type, improving type safety.
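- Refactored datastore loading in the `graph` function to run inside a background task that uses `asyncio.to_thread`, so loading the configuration and the transcripts does not block the event loop.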

Files changed (3) hide show

pstuts_rag/pstuts_rag/datastore.py +1 -1
pstuts_rag/pstuts_rag/nodes.py +32 -13
pstuts_rag/pstuts_rag/rag_for_transcripts.py +4 -8

pstuts_rag/pstuts_rag/datastore.py CHANGED Viewed

@@ -152,7 +152,7 @@ class Datastore:
         except ValueError:
             self.qdrant_client.get_collection(self.collection_name)
             logging.info(f"Collection {self.collection_name} already exists.")
-            self.reload = not (self.config.eva_reinitialize)
         # wrapper around the client
         self.vector_store = QdrantVectorStore(

         except ValueError:
             self.qdrant_client.get_collection(self.collection_name)
             logging.info(f"Collection {self.collection_name} already exists.")
+            self.reload = self.config.eva_reinitialize
         # wrapper around the client
         self.vector_store = QdrantVectorStore(

pstuts_rag/pstuts_rag/nodes.py CHANGED Viewed

@@ -151,9 +151,7 @@ def research(state: TutorialState, config: RunnableConfig):
     }
-async def search_help(
-    state: TutorialState, config: RunnableConfig
-) -> Command[Literal["search_help", "route_is_complete"]]:
     """Search Adobe Help documentation for relevant information.
     Args:
@@ -164,11 +162,16 @@ async def search_help(
         dict: Updated state with search results message and URL references
     """
-    configurable = Configuration.from_runnable_config(config)
     cls = get_chat_api(configurable.llm_api)
     llm = cls(model=configurable.llm_tool_model, temperature=0)
     prompt = NODE_PROMPTS["search_summary"]
     adobe_help_search = TavilySearchResults(
         max_results=2,
         include_domains=["helpx.adobe.com"],
@@ -177,10 +180,13 @@ async def search_help(
         include_images=True,
         response_format="content_and_artifact",  # Always returns artifacts
     )
     query = state["search_query"][-1]
     decision = state["search_permission"]
     if decision == YesNoAsk.ASK:
         response = interrupt(
             (
@@ -191,9 +197,7 @@ async def search_help(
         logging.info(f"Permission response '{response}'")
         decision = YesNoAsk.YES if "yes" in response.strip() else YesNoAsk.NO
-        return Command(
-            update={"search_permission": decision}, goto=search_help.__name__
-        )
     response = {
         "messages": [],
@@ -207,18 +211,23 @@ async def search_help(
         longform = f"Query '{query}' is permitted."
     else:
         longform = f"Query '{query}' is NOT permitted."
     response["messages"].append({"role": "human", "content": longform})
     if decision == YesNoAsk.YES:
         results = await adobe_help_search.ainvoke(query)
         urls = list(r["url"] for r in results)
         tool = TavilyExtract(
             extract_depth="advanced",
             include_images=False,
         )
         results = await tool.ainvoke({"urls": urls})
@@ -235,12 +244,14 @@ async def search_help(
             query=query,
             text="\n***\n".join(all_text),
         )
         url_summary = await llm.ainvoke([HumanMessage(content=prompt)])
         response["messages"].append(url_summary)
         response["url_references"].extend(results["results"])
-    return Command(update=response, goto=route_is_complete.__name__)
 async def search_rag(
@@ -256,7 +267,10 @@ async def search_rag(
         dict: Updated state with RAG response and video references
     """
-    chain = create_transcript_rag_chain(datastore, config)
     query = state["search_query"][-1]
     response = await chain.ainvoke({"question": query})
@@ -519,7 +533,7 @@ def initialize(
     graph_builder.add_edge(init_state.__name__, route_is_relevant.__name__)
     graph_builder.add_edge(research.__name__, search_help.__name__)
     graph_builder.add_edge(research.__name__, search_rag.__name__)
-    # graph_builder.add_edge(search_help.__name__, route_is_complete.__name__)
     graph_builder.add_edge(search_rag.__name__, route_is_complete.__name__)
     graph_builder.add_edge(write_answer.__name__, END)
@@ -567,8 +581,13 @@ async def graph(config: RunnableConfig = None):
     # Start datastore population as background task (non-blocking)
     if initialize_datastore:
-        asyncio.create_task(
-            _datastore.from_json_globs(Configuration().transcript_glob)
-        )
     return _compiled_graph

     }
+async def search_help(state: TutorialState, config: RunnableConfig):
     """Search Adobe Help documentation for relevant information.
     Args:
         dict: Updated state with search results message and URL references
     """
+    configurable = await asyncio.to_thread(
+        Configuration.from_runnable_config, config
+    )
+    logging.info("search_help: loaded config")
     cls = get_chat_api(configurable.llm_api)
     llm = cls(model=configurable.llm_tool_model, temperature=0)
     prompt = NODE_PROMPTS["search_summary"]
+    logging.info("search_help: configured llm")
     adobe_help_search = TavilySearchResults(
         max_results=2,
         include_domains=["helpx.adobe.com"],
         include_images=True,
         response_format="content_and_artifact",  # Always returns artifacts
     )
+    logging.info("search_help: configured tavily")
     query = state["search_query"][-1]
     decision = state["search_permission"]
     if decision == YesNoAsk.ASK:
+        logging.info("search_help: asking permission")
         response = interrupt(
             (
         logging.info(f"Permission response '{response}'")
         decision = YesNoAsk.YES if "yes" in response.strip() else YesNoAsk.NO
+        return {"search_permission": decision}
     response = {
         "messages": [],
         longform = f"Query '{query}' is permitted."
     else:
         longform = f"Query '{query}' is NOT permitted."
+    logging.info("search_help: %s", longform)
     response["messages"].append({"role": "human", "content": longform})
     if decision == YesNoAsk.YES:
+        logging.info("search_help: searching")
         results = await adobe_help_search.ainvoke(query)
+        logging.info("search_help: results")
         urls = list(r["url"] for r in results)
         tool = TavilyExtract(
             extract_depth="advanced",
             include_images=False,
         )
+        logging.info("search_help: extract text")
         results = await tool.ainvoke({"urls": urls})
             query=query,
             text="\n***\n".join(all_text),
         )
+        logging.info("search_help: text extracted. summarizing.")
         url_summary = await llm.ainvoke([HumanMessage(content=prompt)])
         response["messages"].append(url_summary)
         response["url_references"].extend(results["results"])
+        logging.info("search_help: summary complete.")
+    return response
 async def search_rag(
         dict: Updated state with RAG response and video references
     """
+    configurable = await asyncio.to_thread(
+        Configuration.from_runnable_config, config
+    )
+    chain = create_transcript_rag_chain(datastore, configurable)
     query = state["search_query"][-1]
     response = await chain.ainvoke({"question": query})
     graph_builder.add_edge(init_state.__name__, route_is_relevant.__name__)
     graph_builder.add_edge(research.__name__, search_help.__name__)
     graph_builder.add_edge(research.__name__, search_rag.__name__)
+    graph_builder.add_edge(search_help.__name__, route_is_complete.__name__)
     graph_builder.add_edge(search_rag.__name__, route_is_complete.__name__)
     graph_builder.add_edge(write_answer.__name__, END)
     # Start datastore population as background task (non-blocking)
     if initialize_datastore:
+        async def load_datastore():
+            configurable = await asyncio.to_thread(Configuration)
+            await asyncio.to_thread(
+                _datastore.from_json_globs, configurable.transcript_glob
+            )
+        asyncio.create_task(load_datastore())
     return _compiled_graph

pstuts_rag/pstuts_rag/rag_for_transcripts.py CHANGED Viewed

@@ -107,7 +107,7 @@ def strip_think_tags(input: str) -> str:
 def create_transcript_rag_chain(
     datastore: Datastore,
-    config: Union[RunnableConfig, Configuration] = Configuration(),
 ) -> Runnable:
     """Create a Retrieval-Augmented Generation (RAG) chain for video transcript search.
@@ -119,19 +119,15 @@ def create_transcript_rag_chain(
     Args:
         datastore: The DatastoreManager containing video transcript embeddings
-        config: Configuration object or RunnableConfig with model and retrieval settings
     Returns:
         Runnable: A LangChain runnable that processes questions and returns
                  answers with embedded references to source video segments
     """
-    # Handle both Configuration objects and RunnableConfig dictionaries
-    configurable = (
-        config
-        if isinstance(config, Configuration)
-        else Configuration.from_runnable_config(config)
-    )
     # Select the appropriate chat model class based on configuration
     cls = ChatAPISelector.get(configurable.llm_api, ChatOpenAI)

 def create_transcript_rag_chain(
     datastore: Datastore,
+    config: Configuration = Configuration(),
 ) -> Runnable:
     """Create a Retrieval-Augmented Generation (RAG) chain for video transcript search.
     Args:
         datastore: The DatastoreManager containing video transcript embeddings
+        config: Configuration object with model and retrieval settings
     Returns:
         Runnable: A LangChain runnable that processes questions and returns
                  answers with embedded references to source video segments
     """
+    # Use the Configuration object directly
+    configurable = config
     # Select the appropriate chat model class based on configuration
     cls = ChatAPISelector.get(configurable.llm_api, ChatOpenAI)