general_chat

Running

App Files Community

pvanand committed on Jun 29

Commit

9078d82

•

1 Parent(s): 5a22824

Update helper_functions_api.py

Browse files

Files changed (1) hide show

helper_functions_api.py +25 -30

helper_functions_api.py CHANGED Viewed

@@ -96,10 +96,8 @@ Guidelines for extraction:
 SysPromptDefault = "You are an expert AI, complete the given task. Do not add any additional comments."
 SysPromptSearch = """You are a search query generator, create a concise Google search query, focusing only on the main topic and omitting additional redundant details, include year if necessory, 2024, Do not add any additional comments. OUTPUT ONLY THE SEARCH QUERY
                         #Additional instructions:
-                        ##Use the following search operators if necessory
-                        OR #to cover multiple topics
-                        * #wildcard to match any word or phrase
-                        AND #to include specific topics."""
 import tiktoken # Used to limit tokens
 encoding = tiktoken.encoding_for_model("gpt-3.5-turbo") # Instead of Llama3 using available option/ replace if found anything better
@@ -172,32 +170,29 @@ def remove_stopwords(text):
     return ' '.join(filtered_text)
 def rephrase_content(data_format, content, query):
-    if data_format == "Structured data":
-        return together_response(f"""Here is the scraped website data:
-                                    <scraped_data>
-                                    {content}
-                                    </scraped_data>
-                                    Your task is to extract information from this data that is relevant to the following query:
-                                    <query>{query}</query>
-                                    """,
-            SysPrompt=SysPromptData,
-            max_tokens=900,
-        )
-    elif data_format == "Quantitative data":
-        return together_response(
-            f"return only the numerical or quantitative data regarding the query: {{{query}}} structured into .md tables, using the scraped context:{{{limit_tokens(content,token_limit=1000)}}}",
-            SysPrompt=SysPromptData,
-            max_tokens=500,
-        )
-    else:
-        return together_response(
-            f"return only the factual information regarding the query: {{{query}}} using the scraped context:{{{limit_tokens(content,token_limit=1000)}}}",
-            SysPrompt=SysPromptData,
-            max_tokens=500,
-        )
 def fetch_content(url):
     try:

 SysPromptDefault = "You are an expert AI, complete the given task. Do not add any additional comments."
 SysPromptSearch = """You are a search query generator, create a concise Google search query, focusing only on the main topic and omitting additional redundant details, include year if necessory, 2024, Do not add any additional comments. OUTPUT ONLY THE SEARCH QUERY
                         #Additional instructions:
+                        ##Use the following search operator if necessory
+                        OR #to cover multiple topics"""
 import tiktoken # Used to limit tokens
 encoding = tiktoken.encoding_for_model("gpt-3.5-turbo") # Instead of Llama3 using available option/ replace if found anything better
     return ' '.join(filtered_text)
 def rephrase_content(data_format, content, query):
+    try:
+        if data_format == "Structured data":
+            return together_response(
+                f"""return only the relevant information regarding the query: {{{query}}}. Output should be concise chunks of \
+                paragraphs or tables or both, extracted from the following scraped context {{{limit_tokens(content,token_limit=2000)}}}""",
+                SysPrompt=SysPromptData,
+                max_tokens=900,
+            )
+        elif data_format == "Quantitative data":
+            return together_response(
+                f"return only the numerical or quantitative data regarding the query: {{{query}}} structured into .md tables, using the scraped context:{{{limit_tokens(content,token_limit=2000)}}}",
+                SysPrompt=SysPromptData,
+                max_tokens=500,
+            )
+        else:
+            return together_response(
+                f"return only the relevant information regarding the query: {{{query}}} using the scraped context:{{{limit_tokens(content,token_limit=2000)}}}",
+                SysPrompt=SysPromptData,
+                max_tokens=500,
+            )
+    except Exception as e:
+        print(f"An error occurred: {str(e)}")
+        return limit_tokens(content,token_limit=500)
 def fetch_content(url):
     try: