WilliamGazeley committed
Commit c124df1 · 1 Parent(s): 0583c4b

Initial untested rag code

Files changed (11):
  1. .gitignore +7 -0
  2. app.py +17 -17
  3. config.py +13 -0
  4. functioncall.py +163 -0
  5. functions.py +314 -0
  6. prompt_assets/few_shot.json +8 -0
  7. prompt_assets/sys_prompt.yml +43 -0
  8. prompter.py +76 -0
  9. schema.py +23 -0
  10. utils.py +149 -0
  11. validator.py +132 -0
.gitignore ADDED
@@ -0,0 +1,7 @@
+.env
+
+# Python
+__pycache__/
+
+# vLLM
+inference_logs/
app.py CHANGED
@@ -1,12 +1,14 @@
 import os
 import huggingface_hub
 import streamlit as st
+from config import config
 from vllm import LLM, SamplingParams
+from functioncall import ModelInference
 
 sys_msg = """You are an expert financial advisor named IRAI. You have a comprehensive understanding of finance and investing with experience and expertise in all areas of finance.
 #Objective:
 Answer questions accurately and truthfully given your current knowledge. You do not have access to up-to-date current market data; this will be available in the future. Answer the question directly.
-Style and tone:
+#Style and tone:
 Answer in a friendly and engaging manner representing a top female investment professional working at a leading investment bank.
 #Audience:
 The questions will be asked by top technology executives and CFOs of large fintech companies and successful startups.
@@ -15,24 +17,18 @@ Direct answer to question, concise yet insightful."""
 
 @st.cache_resource(show_spinner="Loading model..")
 def init_llm():
-    huggingface_hub.login(token=os.getenv("HF_TOKEN"))
-    llm = LLM(model="InvestmentResearchAI/LLM-ADE-dev")
-    tok = llm.get_tokenizer()
-    tok.eos_token = '<|im_end|>'  # Override to use turns
+    huggingface_hub.login(token=os.getenv("HF_TOKEN"), new_session=False)
+    llm = ModelInference(chat_template='chatml')
     return llm
 
 def get_response(prompt):
     try:
-        convo = [
-            {"role": "system", "content": sys_msg},
-            {"role": "user", "content": prompt},
-        ]
-        llm = init_llm()
-        prompts = [llm.get_tokenizer().apply_chat_template(convo, tokenize=False)]
-        sampling_params = SamplingParams(temperature=0.3, top_p=0.95, max_tokens=500, stop_token_ids=[128009])
-        outputs = llm.generate(prompts, sampling_params)
-        for output in outputs:
-            return output.outputs[0].text
+        return llm.generate_function_call(
+            prompt,
+            config.chat_template,
+            config.num_fewshot,
+            config.max_depth
+        )
     except Exception as e:
         return f"An error occurred: {str(e)}"
 
@@ -52,6 +48,10 @@ def main():
 
     llm = init_llm()
 
-if __name__ == "__main__":
-    main()
+def main_headless():
+    while True:
+        input_text = input("Enter your text here: ")
+        print(get_response(input_text))
 
+if __name__ == "__main__":
+    main_headless()
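
Note: with this change, python app.py enters the headless input loop (main_headless) instead of the Streamlit flow; the web UI is still launched the usual way. A quick check of both paths (assuming a populated .env and a GPU for vLLM):

    $ streamlit run app.py    # web UI
    $ python app.py           # headless loop, prompts "Enter your text here: "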
config.py ADDED
@@ -0,0 +1,13 @@
+from pydantic import Field
+from pydantic_settings import BaseSettings
+
+class Config(BaseSettings):
+    hf_token: str = Field(...)
+    model: str = Field("InvestmentResearchAI/LLM-ADE-dev")
+
+    chat_template: str = Field("chatml", description="Chat template for prompt formatting")
+    num_fewshot: int | None = Field(None, description="Option to use json mode examples")
+    load_in_4bit: str = Field("False", description="Option to load in 4bit with bitsandbytes")
+    max_depth: int = Field(5, description="Maximum number of recursive iterations")
+
+config = Config(_env_file=".env")
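
Note: Config reads from .env (and the process environment); hf_token is the only required field. A minimal sketch of the .env file this expects: pydantic-settings matches field names case-insensitively, and the token value below is a placeholder.

    HF_TOKEN=hf_xxxxxxxxxxxxxxxx
    # optional overrides (defaults shown)
    # MODEL=InvestmentResearchAI/LLM-ADE-dev
    # CHAT_TEMPLATE=chatml
    # MAX_DEPTH=5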
functioncall.py ADDED
@@ -0,0 +1,163 @@
+import argparse
+import torch
+import json
+from config import config
+from vllm import LLM, SamplingParams
+
+from transformers import BitsAndBytesConfig
+
+import functions
+from prompter import PromptManager
+from validator import validate_function_call_schema
+
+from utils import (
+    inference_logger,
+    get_assistant_message,
+    get_chat_template,
+    validate_and_extract_tool_calls
+)
+
+class ModelInference:
+    def __init__(self, chat_template: str, load_in_4bit: str = "False"):
+        self.prompter = PromptManager()
+        self.bnb_config = None
+
+        if load_in_4bit == "True":  # Never use this
+            self.bnb_config = BitsAndBytesConfig(
+                load_in_4bit=True,
+                bnb_4bit_quant_type="nf4",
+                bnb_4bit_use_double_quant=True,
+            )
+        self.model = LLM(model=config.model)
+
+        self.tokenizer = self.model.get_tokenizer()
+        self.tokenizer.pad_token = self.tokenizer.eos_token
+        self.tokenizer.padding_side = "left"
+
+        if self.tokenizer.chat_template is None:
+            print("No chat template defined, getting chat_template...")
+            self.tokenizer.chat_template = get_chat_template(chat_template)
+
+        # vLLM's LLM object has no .config/.generation_config (those are
+        # transformers attributes), so only tokenizer info is logged here
+        inference_logger.info(self.tokenizer.special_tokens_map)
+
+    def process_completion_and_validate(self, completion, chat_template):
+        assistant_message = get_assistant_message(completion, chat_template, self.tokenizer.eos_token)
+
+        if assistant_message:
+            validation, tool_calls, error_message = validate_and_extract_tool_calls(assistant_message)
+
+            if validation:
+                inference_logger.info(f"parsed tool calls:\n{json.dumps(tool_calls, indent=2)}")
+                return tool_calls, assistant_message, error_message
+            else:
+                tool_calls = None
+                return tool_calls, assistant_message, error_message
+        else:
+            inference_logger.warning("Assistant message is None")
+            raise ValueError("Assistant message is None")
+
+    def execute_function_call(self, tool_call):
+        function_name = tool_call.get("name")
+        function_to_call = getattr(functions, function_name, None)
+        function_args = tool_call.get("arguments", {})
+
+        inference_logger.info(f"Invoking function call {function_name} ...")
+        function_response = function_to_call(*function_args.values())
+        # JSON-formatted string fed back to the model as the tool response
+        results_dict = f'{{"name": "{function_name}", "content": {function_response}}}'
+        return results_dict
+
+    def run_inference(self, prompt):
+        # `prompt` is a list of chat messages; render it with the chat template first
+        inputs = self.tokenizer.apply_chat_template(prompt, add_generation_prompt=True, tokenize=False)
+        sampling_params = SamplingParams(
+            temperature=0.8,
+            top_p=0.95,
+            repetition_penalty=1.1,
+            max_tokens=500,
+            stop_token_ids=[128009])
+
+        outputs = self.model.generate([inputs], sampling_params)
+        for output in outputs:
+            return output.outputs[0].text
+
+    def generate_function_call(self, query, chat_template, num_fewshot, max_depth=5):
+        try:
+            depth = 0
+            user_message = f"{query}\nThis is the first turn and you don't have <tool_results> to analyze yet"
+            chat = [{"role": "user", "content": user_message}]
+            tools = functions.get_openai_tools()
+            prompt = self.prompter.generate_prompt(chat, tools, num_fewshot)
+            completion = self.run_inference(prompt)
+
+            def recursive_loop(prompt, completion, depth):
+                nonlocal max_depth
+                tool_calls, assistant_message, error_message = self.process_completion_and_validate(completion, chat_template)
+                prompt.append({"role": "assistant", "content": assistant_message})
+
+                tool_message = f"Agent iteration {depth} to assist with user query: {query}\n"
+                if tool_calls:
+                    inference_logger.info(f"Assistant Message:\n{assistant_message}")
+
+                    for tool_call in tool_calls:
+                        validation, message = validate_function_call_schema(tool_call, tools)
+                        if validation:
+                            try:
+                                function_response = self.execute_function_call(tool_call)
+                                tool_message += f"<tool_response>\n{function_response}\n</tool_response>\n"
+                                inference_logger.info(f"Here's the response from the function call: {tool_call.get('name')}\n{function_response}")
+                            except Exception as e:
+                                inference_logger.info(f"Could not execute function: {e}")
+                                tool_message += f"<tool_response>\nThere was an error when executing the function: {tool_call.get('name')}\nHere's the error traceback: {e}\nPlease call this function again with correct arguments within XML tags <tool_call></tool_call>\n</tool_response>\n"
+                        else:
+                            inference_logger.info(message)
+                            tool_message += f"<tool_response>\nThere was an error validating function call against function signature: {tool_call.get('name')}\nHere's the error traceback: {message}\nPlease call this function again with correct arguments within XML tags <tool_call></tool_call>\n</tool_response>\n"
+                    prompt.append({"role": "tool", "content": tool_message})
+
+                    depth += 1
+                    if depth >= max_depth:
+                        print(f"Maximum recursion depth reached ({max_depth}). Stopping recursion.")
+                        return assistant_message
+
+                    completion = self.run_inference(prompt)
+                    return recursive_loop(prompt, completion, depth)
+                elif error_message:
+                    inference_logger.info(f"Assistant Message:\n{assistant_message}")
+                    tool_message += f"<tool_response>\nThere was an error parsing function calls\n Here's the error stack trace: {error_message}\nPlease call the function again with correct syntax<tool_response>"
+                    prompt.append({"role": "tool", "content": tool_message})
+
+                    depth += 1
+                    if depth >= max_depth:
+                        print(f"Maximum recursion depth reached ({max_depth}). Stopping recursion.")
+                        return assistant_message
+
+                    completion = self.run_inference(prompt)
+                    return recursive_loop(prompt, completion, depth)
+                else:
+                    inference_logger.info(f"Assistant Message:\n{assistant_message}")
+                    return assistant_message
+
+            # return the final assistant message so callers (e.g. app.get_response) receive it
+            return recursive_loop(prompt, completion, depth)
+
+        except Exception as e:
+            inference_logger.error(f"Exception occurred: {e}")
+            raise e
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Run recursive function calling loop")
+    parser.add_argument("--model_path", type=str, help="Path to the model folder")
+    parser.add_argument("--chat_template", type=str, default="chatml", help="Chat template for prompt formatting")
+    parser.add_argument("--num_fewshot", type=int, default=None, help="Option to use json mode examples")
+    parser.add_argument("--load_in_4bit", type=str, default="False", help="Option to load in 4bit with bitsandbytes")
+    parser.add_argument("--query", type=str, default="I need the current stock price of Tesla (TSLA)")
+    parser.add_argument("--max_depth", type=int, default=5, help="Maximum number of recursive iterations")
+    args = parser.parse_args()
+
+    # The model path is read from config.model; let the CLI flag override it
+    if args.model_path:
+        config.model = args.model_path
+
+    inference = ModelInference(args.chat_template, args.load_in_4bit)
+
+    # Run the model evaluator
+    inference.generate_function_call(args.query, args.chat_template, args.num_fewshot, args.max_depth)
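
Note: a minimal programmatic usage sketch of ModelInference outside the CLI (assuming a populated .env; not part of this commit):

    from config import config
    from functioncall import ModelInference

    inference = ModelInference(chat_template=config.chat_template)
    answer = inference.generate_function_call(
        "I need the current stock price of Tesla (TSLA)",
        config.chat_template,
        config.num_fewshot,
        config.max_depth,
    )
    print(answer)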
functions.py ADDED
@@ -0,0 +1,314 @@
+import re
+import inspect
+import requests
+import pandas as pd
+import yfinance as yf
+import concurrent.futures
+
+from typing import List
+from bs4 import BeautifulSoup
+from utils import inference_logger
+from langchain.tools import tool
+from langchain_core.utils.function_calling import convert_to_openai_tool
+
+@tool
+def code_interpreter(code_markdown: str) -> dict | str:
+    """
+    Execute the provided Python code string on the terminal using exec.
+
+    The string should contain valid, executable and pure Python code in markdown syntax.
+    Code should also import any required Python packages.
+
+    Args:
+        code_markdown (str): The Python code with markdown syntax to be executed.
+            For example: ```python\n<code-string>\n```
+
+    Returns:
+        dict | str: A dictionary containing variables declared and values returned by function calls,
+            or an error message if an exception occurred.
+
+    Note:
+        Use this function with caution, as executing arbitrary code can pose security risks.
+    """
+    try:
+        # Extracting code from Markdown code block
+        code_lines = code_markdown.split('\n')[1:-1]
+        code_without_markdown = '\n'.join(code_lines)
+
+        # Create a new namespace for code execution
+        exec_namespace = {}
+
+        # Execute the code in the new namespace
+        exec(code_without_markdown, exec_namespace)
+
+        # Collect variables and function call results
+        result_dict = {}
+        for name, value in exec_namespace.items():
+            if callable(value):
+                try:
+                    result_dict[name] = value()
+                except TypeError:
+                    # If the function requires arguments, attempt to call it with arguments from the namespace
+                    arg_names = inspect.getfullargspec(value).args
+                    args = {arg_name: exec_namespace.get(arg_name) for arg_name in arg_names}
+                    result_dict[name] = value(**args)
+            elif not name.startswith('_'):  # Exclude variables starting with '_'
+                result_dict[name] = value
+
+        return result_dict
+
+    except Exception as e:
+        error_message = f"An error occurred: {e}"
+        inference_logger.error(error_message)
+        return error_message
+
+@tool
+def google_search_and_scrape(query: str) -> list:
+    """
+    Performs a Google search for the given query, retrieves the top search result URLs,
+    and scrapes the text content and table data from those pages in parallel.
+
+    Args:
+        query (str): The search query.
+    Returns:
+        list: A list of dictionaries containing the URL, text content, and table data for each scraped page.
+    """
+    num_results = 2
+    url = 'https://www.google.com/search'
+    params = {'q': query, 'num': num_results}
+    headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/94.0.4606.61 Safari/537.3'}
+
+    inference_logger.info(f"Performing google search with query: {query}\nplease wait...")
+    response = requests.get(url, params=params, headers=headers)
+    soup = BeautifulSoup(response.text, 'html.parser')
+    urls = [result.find('a')['href'] for result in soup.find_all('div', class_='tF2Cxc')]
+
+    inference_logger.info("Scraping text from urls, please wait...")
+    [inference_logger.info(url) for url in urls]
+    with concurrent.futures.ThreadPoolExecutor(max_workers=5) as executor:
+        futures = [executor.submit(lambda url: (url, requests.get(url, headers=headers).text if isinstance(url, str) else None), url) for url in urls[:num_results] if isinstance(url, str)]
+        results = []
+        for future in concurrent.futures.as_completed(futures):
+            url, html = future.result()
+            soup = BeautifulSoup(html, 'html.parser')
+            paragraphs = [p.text.strip() for p in soup.find_all('p') if p.text.strip()]
+            text_content = ' '.join(paragraphs)
+            text_content = re.sub(r'\s+', ' ', text_content)
+            table_data = [[cell.get_text(strip=True) for cell in row.find_all('td')] for table in soup.find_all('table') for row in table.find_all('tr')]
+            if text_content or table_data:
+                results.append({'url': url, 'content': text_content, 'tables': table_data})
+    return results
+
+@tool
+def get_current_stock_price(symbol: str) -> float:
+    """
+    Get the current stock price for a given symbol.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        float: The current stock price, or None if an error occurs.
+    """
+    try:
+        stock = yf.Ticker(symbol)
+        # Use "regularMarketPrice" for regular market hours, or "currentPrice" for pre/post market
+        current_price = stock.info.get("regularMarketPrice", stock.info.get("currentPrice"))
+        return current_price if current_price else None
+    except Exception as e:
+        print(f"Error fetching current price for {symbol}: {e}")
+        return None
+
+@tool
+def get_stock_fundamentals(symbol: str) -> dict:
+    """
+    Get fundamental data for a given stock symbol using yfinance API.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        dict: A dictionary containing fundamental data.
+            Keys:
+                - 'symbol': The stock symbol.
+                - 'company_name': The long name of the company.
+                - 'sector': The sector to which the company belongs.
+                - 'industry': The industry to which the company belongs.
+                - 'market_cap': The market capitalization of the company.
+                - 'pe_ratio': The forward price-to-earnings ratio.
+                - 'pb_ratio': The price-to-book ratio.
+                - 'dividend_yield': The dividend yield.
+                - 'eps': The trailing earnings per share.
+                - 'beta': The beta value of the stock.
+                - '52_week_high': The 52-week high price of the stock.
+                - '52_week_low': The 52-week low price of the stock.
+    """
+    try:
+        stock = yf.Ticker(symbol)
+        info = stock.info
+        fundamentals = {
+            'symbol': symbol,
+            'company_name': info.get('longName', ''),
+            'sector': info.get('sector', ''),
+            'industry': info.get('industry', ''),
+            'market_cap': info.get('marketCap', None),
+            'pe_ratio': info.get('forwardPE', None),
+            'pb_ratio': info.get('priceToBook', None),
+            'dividend_yield': info.get('dividendYield', None),
+            'eps': info.get('trailingEps', None),
+            'beta': info.get('beta', None),
+            '52_week_high': info.get('fiftyTwoWeekHigh', None),
+            '52_week_low': info.get('fiftyTwoWeekLow', None)
+        }
+        return fundamentals
+    except Exception as e:
+        print(f"Error getting fundamentals for {symbol}: {e}")
+        return {}
+
+@tool
+def get_financial_statements(symbol: str) -> dict:
+    """
+    Get financial statements for a given stock symbol.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        dict: Dictionary containing financial statements (income statement, balance sheet, cash flow statement).
+    """
+    try:
+        stock = yf.Ticker(symbol)
+        financials = stock.financials
+        return financials
+    except Exception as e:
+        print(f"Error fetching financial statements for {symbol}: {e}")
+        return {}
+
+@tool
+def get_key_financial_ratios(symbol: str) -> dict:
+    """
+    Get key financial ratios for a given stock symbol.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        dict: Dictionary containing key financial ratios.
+    """
+    try:
+        stock = yf.Ticker(symbol)
+        key_ratios = stock.info
+        return key_ratios
+    except Exception as e:
+        print(f"Error fetching key financial ratios for {symbol}: {e}")
+        return {}
+
+@tool
+def get_analyst_recommendations(symbol: str) -> pd.DataFrame:
+    """
+    Get analyst recommendations for a given stock symbol.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        pd.DataFrame: DataFrame containing analyst recommendations.
+    """
+    try:
+        stock = yf.Ticker(symbol)
+        recommendations = stock.recommendations
+        return recommendations
+    except Exception as e:
+        print(f"Error fetching analyst recommendations for {symbol}: {e}")
+        return pd.DataFrame()
+
+@tool
+def get_dividend_data(symbol: str) -> pd.DataFrame:
+    """
+    Get dividend data for a given stock symbol.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        pd.DataFrame: DataFrame containing dividend data.
+    """
+    try:
+        stock = yf.Ticker(symbol)
+        dividends = stock.dividends
+        return dividends
+    except Exception as e:
+        print(f"Error fetching dividend data for {symbol}: {e}")
+        return pd.DataFrame()
+
+@tool
+def get_company_news(symbol: str) -> pd.DataFrame:
+    """
+    Get company news and press releases for a given stock symbol.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        pd.DataFrame: DataFrame containing company news and press releases.
+    """
+    try:
+        news = yf.Ticker(symbol).news
+        return news
+    except Exception as e:
+        print(f"Error fetching company news for {symbol}: {e}")
+        return pd.DataFrame()
+
+@tool
+def get_technical_indicators(symbol: str) -> pd.DataFrame:
+    """
+    Get technical indicators for a given stock symbol.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        pd.DataFrame: DataFrame containing technical indicators.
+    """
+    try:
+        indicators = yf.Ticker(symbol).history(period="max")
+        return indicators
+    except Exception as e:
+        print(f"Error fetching technical indicators for {symbol}: {e}")
+        return pd.DataFrame()
+
+@tool
+def get_company_profile(symbol: str) -> dict:
+    """
+    Get company profile and overview for a given stock symbol.
+
+    Args:
+        symbol (str): The stock symbol.
+
+    Returns:
+        dict: Dictionary containing company profile and overview.
+    """
+    try:
+        profile = yf.Ticker(symbol).info
+        return profile
+    except Exception as e:
+        print(f"Error fetching company profile for {symbol}: {e}")
+        return {}
+
+def get_openai_tools() -> List[dict]:
+    functions = [
+        code_interpreter,
+        google_search_and_scrape,
+        get_current_stock_price,
+        get_company_news,
+        get_company_profile,
+        get_stock_fundamentals,
+        get_financial_statements,
+        get_key_financial_ratios,
+        get_analyst_recommendations,
+        get_dividend_data,
+        get_technical_indicators
+    ]
+
+    tools = [convert_to_openai_tool(f) for f in functions]
+    return tools
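
Note: convert_to_openai_tool derives an OpenAI-style signature from each @tool's type hints and docstring; for get_current_stock_price the result is roughly (abridged):

    {
      "type": "function",
      "function": {
        "name": "get_current_stock_price",
        "description": "Get the current stock price for a given symbol. ...",
        "parameters": {
          "type": "object",
          "properties": {"symbol": {"type": "string"}},
          "required": ["symbol"]
        }
      }
    }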
prompt_assets/few_shot.json ADDED
@@ -0,0 +1,8 @@
+[
+    {
+        "example": "```\nSYSTEM: You are a helpful assistant who has access to functions. Use them if required\n<tools>[\n    {\n        \"name\": \"calculate_distance\",\n        \"description\": \"Calculate the distance between two locations\",\n        \"parameters\": {\n            \"type\": \"object\",\n            \"properties\": {\n                \"origin\": {\n                    \"type\": \"string\",\n                    \"description\": \"The starting location\"\n                },\n                \"destination\": {\n                    \"type\": \"string\",\n                    \"description\": \"The destination location\"\n                },\n                \"mode\": {\n                    \"type\": \"string\",\n                    \"description\": \"The mode of transportation\"\n                }\n            },\n            \"required\": [\n                \"origin\",\n                \"destination\",\n                \"mode\"\n            ]\n        }\n    },\n    {\n        \"name\": \"generate_password\",\n        \"description\": \"Generate a random password\",\n        \"parameters\": {\n            \"type\": \"object\",\n            \"properties\": {\n                \"length\": {\n                    \"type\": \"integer\",\n                    \"description\": \"The length of the password\"\n                }\n            },\n            \"required\": [\n                \"length\"\n            ]\n        }\n    }\n]\n\n</tools>\nUSER: Hi, I need to know the distance from New York to Los Angeles by car.\nASSISTANT:\n<tool_call>\n{\"arguments\": {\"origin\": \"New York\",\n    \"destination\": \"Los Angeles\", \"mode\": \"car\"}, \"name\": \"calculate_distance\"}\n</tool_call>\n```\n"
+    },
+    {
+        "example": "```\nSYSTEM: You are a helpful assistant with access to functions. Use them if required\n<tools>[\n    {\n        \"name\": \"calculate_distance\",\n        \"description\": \"Calculate the distance between two locations\",\n        \"parameters\": {\n            \"type\": \"object\",\n            \"properties\": {\n                \"origin\": {\n                    \"type\": \"string\",\n                    \"description\": \"The starting location\"\n                },\n                \"destination\": {\n                    \"type\": \"string\",\n                    \"description\": \"The destination location\"\n                },\n                \"mode\": {\n                    \"type\": \"string\",\n                    \"description\": \"The mode of transportation\"\n                }\n            },\n            \"required\": [\n                \"origin\",\n                \"destination\",\n                \"mode\"\n            ]\n        }\n    },\n    {\n        \"name\": \"generate_password\",\n        \"description\": \"Generate a random password\",\n        \"parameters\": {\n            \"type\": \"object\",\n            \"properties\": {\n                \"length\": {\n                    \"type\": \"integer\",\n                    \"description\": \"The length of the password\"\n                }\n            },\n            \"required\": [\n                \"length\"\n            ]\n        }\n    }\n]\n\n</tools>\nUSER: Can you help me generate a random password with a length of 8 characters?\nASSISTANT:\n<tool_call>\n{\"arguments\": {\"length\": 8}, \"name\": \"generate_password\"}\n</tool_call>\n```"
+    }
+]
prompt_assets/sys_prompt.yml ADDED
@@ -0,0 +1,43 @@
+Role: |
+  You are an expert financial advisor named IRAI. You have a comprehensive understanding of finance and investing with experience and expertise in all areas of finance.
+  You are a function calling AI agent with self-recursion.
+  You can call only one function at a time and analyse the data you get from function responses.
+  You are provided with function signatures within <tools></tools> XML tags.
+  The current date is: {date}.
+Objective: |
+  You may use agentic frameworks for reasoning and planning to help with the user query.
+  Please call a function and wait for function results to be provided to you in the next iteration.
+  Don't make assumptions about what values to plug into function arguments.
+  Once you have called a function, results will be fed back to you within <tool_response></tool_response> XML tags.
+  Don't make assumptions about tool results if <tool_response> XML tags are not present since the function hasn't been executed yet.
+  Analyze the data once you get the results and call another function.
+  At each iteration please continue adding your analysis to the previous summary.
+  Your final response should directly answer the user query with an analysis or summary of the results of function calls.
+Tools: |
+  Here are the available tools:
+  <tools> {tools} </tools>
+  If the provided function signatures don't include the function you must call, you may write executable python code in markdown syntax and call the code_interpreter() function as follows:
+  <tool_call>
+  {{"arguments": {{"code_markdown": <python-code>, "name": "code_interpreter"}}}}
+  </tool_call>
+  Make sure that the json object above with code markdown block is parseable with json.loads() and the XML block with XML ElementTree.
+Examples: |
+  Here are some example usages of functions:
+  {examples}
+Schema: |
+  Use the following pydantic model json schema for each tool call you will make:
+  {schema}
+Instructions: |
+  At the very first turn you don't have <tool_results> so you shouldn't make up the results.
+  Please keep a running summary with analysis of previous function results and summaries from previous iterations.
+  Do not stop calling functions until the task has been accomplished or you've reached the max iteration of 10.
+  Calling multiple functions at once can overload the system and increase cost so call one function at a time please.
+  If you plan to continue with analysis, always call another function.
+  For each function call return a valid json object (using double quotes) with function name and arguments within <tool_call></tool_call> XML tags as follows:
+  <tool_call>
+  {{"arguments": <args-dict>, "name": <function-name>}}
+  </tool_call>
+Style and tone: |
+  Answer in a friendly and engaging manner representing a top female investment professional working at a leading investment bank.
+Audience: |
+  The questions will be asked by top technology executives and CFOs of large fintech companies and successful startups.
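
Note: under these instructions, a well-formed assistant turn looks like this (hypothetical example using one of the tools from functions.py):

    <tool_call>
    {"arguments": {"symbol": "TSLA"}, "name": "get_current_stock_price"}
    </tool_call>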
prompter.py ADDED
@@ -0,0 +1,76 @@
+import datetime
+from pydantic import BaseModel
+from typing import Dict
+from schema import FunctionCall
+from utils import (
+    get_fewshot_examples
+)
+import yaml
+import json
+import os
+
+class PromptSchema(BaseModel):
+    Role: str
+    Objective: str
+    Tools: str
+    Examples: str
+    Schema: str
+    Instructions: str
+
+class PromptManager:
+    def __init__(self):
+        self.script_dir = os.path.dirname(os.path.abspath(__file__))
+
+    def format_yaml_prompt(self, prompt_schema: PromptSchema, variables: Dict) -> str:
+        formatted_prompt = ""
+        for field, value in prompt_schema.dict().items():
+            if field == "Examples" and variables.get("examples") is None:
+                continue
+            formatted_value = value.format(**variables)
+            if field == "Instructions":
+                formatted_prompt += f"{formatted_value}"
+            else:
+                formatted_value = formatted_value.replace("\n", " ")
+                formatted_prompt += f"{formatted_value}"
+        return formatted_prompt
+
+    def read_yaml_file(self, file_path: str) -> PromptSchema:
+        with open(file_path, 'r') as file:
+            yaml_content = yaml.safe_load(file)
+
+        prompt_schema = PromptSchema(
+            Role=yaml_content.get('Role', ''),
+            Objective=yaml_content.get('Objective', ''),
+            Tools=yaml_content.get('Tools', ''),
+            Examples=yaml_content.get('Examples', ''),
+            Schema=yaml_content.get('Schema', ''),
+            Instructions=yaml_content.get('Instructions', ''),
+        )
+        return prompt_schema
+
+    def generate_prompt(self, user_prompt, tools, num_fewshot=None):
+        prompt_path = os.path.join(self.script_dir, 'prompt_assets', 'sys_prompt.yml')
+        prompt_schema = self.read_yaml_file(prompt_path)
+
+        if num_fewshot is not None:
+            examples = get_fewshot_examples(num_fewshot)
+        else:
+            examples = None
+
+        schema_json = json.loads(FunctionCall.schema_json())
+
+        variables = {
+            "date": datetime.date.today(),
+            "tools": tools,
+            "examples": examples,
+            "schema": schema_json
+        }
+        sys_prompt = self.format_yaml_prompt(prompt_schema, variables)
+
+        prompt = [
+            {'content': sys_prompt, 'role': 'system'}
+        ]
+        prompt.extend(user_prompt)
+        return prompt
schema.py ADDED
@@ -0,0 +1,23 @@
+from pydantic import BaseModel
+from typing import List, Dict, Literal, Optional
+
+class FunctionCall(BaseModel):
+    arguments: dict
+    """
+    The arguments to call the function with, as generated by the model in JSON
+    format. Note that the model does not always generate valid JSON, and may
+    hallucinate parameters not defined by your function schema. Validate the
+    arguments in your code before calling your function.
+    """
+
+    name: str
+    """The name of the function to call."""
+
+class FunctionDefinition(BaseModel):
+    name: str
+    description: Optional[str] = None
+    parameters: Optional[Dict[str, object]] = None
+
+class FunctionSignature(BaseModel):
+    function: FunctionDefinition
+    type: Literal["function"]
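
Note: FunctionCall.schema_json() is what prompter.py substitutes into the {schema} slot; with this model it produces roughly:

    {
      "title": "FunctionCall",
      "type": "object",
      "properties": {
        "arguments": {"title": "Arguments", "type": "object"},
        "name": {"title": "Name", "type": "string"}
      },
      "required": ["arguments", "name"]
    }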
utils.py ADDED
@@ -0,0 +1,149 @@
+import ast
+import os
+import re
+import json
+import logging
+import datetime
+import xml.etree.ElementTree as ET
+
+from logging.handlers import RotatingFileHandler
+
+logging.basicConfig(
+    format="%(asctime)s,%(msecs)03d %(levelname)-8s [%(filename)s:%(lineno)d] %(message)s",
+    datefmt="%Y-%m-%d:%H:%M:%S",
+    level=logging.INFO,
+)
+script_dir = os.path.dirname(os.path.abspath(__file__))
+now = datetime.datetime.now()
+log_folder = os.path.join(script_dir, "inference_logs")
+os.makedirs(log_folder, exist_ok=True)
+log_file_path = os.path.join(
+    log_folder, f"function-calling-inference_{now.strftime('%Y-%m-%d_%H-%M-%S')}.log"
+)
+# Use RotatingFileHandler from the logging.handlers module
+file_handler = RotatingFileHandler(log_file_path, maxBytes=0, backupCount=0)
+file_handler.setLevel(logging.INFO)
+
+formatter = logging.Formatter("%(asctime)s,%(msecs)03d %(levelname)-8s [%(filename)s:%(lineno)d] %(message)s", datefmt="%Y-%m-%d:%H:%M:%S")
+file_handler.setFormatter(formatter)
+
+inference_logger = logging.getLogger("function-calling-inference")
+inference_logger.addHandler(file_handler)
+
+def get_fewshot_examples(num_fewshot):
+    """return a list of few shot examples"""
+    example_path = os.path.join(script_dir, 'prompt_assets', 'few_shot.json')
+    with open(example_path, 'r') as file:
+        examples = json.load(file)  # Use json.load with the file object, not the file path
+    if num_fewshot > len(examples):
+        raise ValueError(f"Not enough examples (got {num_fewshot}, but there are only {len(examples)} examples).")
+    return examples[:num_fewshot]
+
+def get_chat_template(chat_template):
+    """read chat template from jinja file"""
+    template_path = os.path.join(script_dir, 'chat_templates', f"{chat_template}.j2")
+
+    if not os.path.exists(template_path):
+        inference_logger.error(f"Template file not found: {chat_template}")
+        return None
+    try:
+        with open(template_path, 'r') as file:
+            template = file.read()
+        return template
+    except Exception as e:
+        print(f"Error loading template: {e}")
+        return None
+
+def get_assistant_message(completion, chat_template, eos_token):
+    """define and match pattern to find the assistant message"""
+    completion = completion.strip()
+
+    if chat_template == "zephyr":
+        assistant_pattern = re.compile(r'<\|assistant\|>((?:(?!<\|assistant\|>).)*)$', re.DOTALL)
+    elif chat_template == "chatml":
+        assistant_pattern = re.compile(r'<\|im_start\|>\s*assistant((?:(?!<\|im_start\|>\s*assistant).)*)$', re.DOTALL)
+    elif chat_template == "vicuna":
+        assistant_pattern = re.compile(r'ASSISTANT:\s*((?:(?!ASSISTANT:).)*)$', re.DOTALL)
+    else:
+        raise NotImplementedError(f"Handling for chat_template '{chat_template}' is not implemented.")
+
+    assistant_match = assistant_pattern.search(completion)
+    if assistant_match:
+        assistant_content = assistant_match.group(1).strip()
+        if chat_template == "vicuna":
+            eos_token = f"</s>{eos_token}"
+        return assistant_content.replace(eos_token, "")
+    else:
+        assistant_content = None
+        inference_logger.info("No match found for the assistant pattern")
+        return assistant_content
+
+def validate_and_extract_tool_calls(assistant_content):
+    validation_result = False
+    tool_calls = []
+    error_message = None
+
+    try:
+        # wrap content in root element
+        xml_root_element = f"<root>{assistant_content}</root>"
+        root = ET.fromstring(xml_root_element)
+
+        # extract JSON data
+        for element in root.findall(".//tool_call"):
+            json_data = None
+            try:
+                json_text = element.text.strip()
+
+                try:
+                    # Prioritize json.loads for better error handling
+                    json_data = json.loads(json_text)
+                except json.JSONDecodeError as json_err:
+                    try:
+                        # Fallback to ast.literal_eval if json.loads fails
+                        json_data = ast.literal_eval(json_text)
+                    except (SyntaxError, ValueError) as eval_err:
+                        error_message = (
+                            f"JSON parsing failed with both json.loads and ast.literal_eval:\n"
+                            f"- JSON Decode Error: {json_err}\n"
+                            f"- Fallback Syntax/Value Error: {eval_err}\n"
+                            f"- Problematic JSON text: {json_text}"
+                        )
+                        inference_logger.error(error_message)
+                        continue
+            except Exception as e:
+                error_message = f"Cannot strip text: {e}"
+                inference_logger.error(error_message)
+
+            if json_data is not None:
+                tool_calls.append(json_data)
+                validation_result = True
+
+    except ET.ParseError as err:
+        error_message = f"XML Parse Error: {err}"
+        inference_logger.error(f"XML Parse Error: {err}")
+
+    # Return default values if no valid data is extracted
+    return validation_result, tool_calls, error_message
+
+def extract_json_from_markdown(text):
+    """
+    Extracts the JSON string from the given text using a regular expression pattern.
+
+    Args:
+        text (str): The input text containing the JSON string.
+
+    Returns:
+        dict: The JSON data loaded from the extracted string, or None if the JSON string is not found.
+    """
+    json_pattern = r'```json\r?\n(.*?)\r?\n```'
+    match = re.search(json_pattern, text, re.DOTALL)
+    if match:
+        json_string = match.group(1)
+        try:
+            data = json.loads(json_string)
+            return data
+        except json.JSONDecodeError as e:
+            print(f"Error decoding JSON string: {e}")
+    else:
+        print("JSON string not found in the text.")
+    return None
@@ -0,0 +1,132 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import ast
2
+ import json
3
+ from jsonschema import validate
4
+ from pydantic import ValidationError
5
+ from utils import inference_logger, extract_json_from_markdown
6
+ from schema import FunctionCall, FunctionSignature
7
+
8
+ def validate_function_call_schema(call, signatures):
9
+ try:
10
+ call_data = FunctionCall(**call)
11
+ except ValidationError as e:
12
+ return False, str(e)
13
+
14
+ for signature in signatures:
15
+ try:
16
+ signature_data = FunctionSignature(**signature)
17
+ if signature_data.function.name == call_data.name:
18
+ # Validate types in function arguments
19
+ for arg_name, arg_schema in signature_data.function.parameters.get('properties', {}).items():
20
+ if arg_name in call_data.arguments:
21
+ call_arg_value = call_data.arguments[arg_name]
22
+ if call_arg_value:
23
+ try:
24
+ validate_argument_type(arg_name, call_arg_value, arg_schema)
25
+ except Exception as arg_validation_error:
26
+ return False, str(arg_validation_error)
27
+
28
+ # Check if all required arguments are present
29
+ required_arguments = signature_data.function.parameters.get('required', [])
30
+ result, missing_arguments = check_required_arguments(call_data.arguments, required_arguments)
31
+ if not result:
32
+ return False, f"Missing required arguments: {missing_arguments}"
33
+
34
+ return True, None
35
+ except Exception as e:
36
+ # Handle validation errors for the function signature
37
+ return False, str(e)
38
+
39
+ # No matching function signature found
40
+ return False, f"No matching function signature found for function: {call_data.name}"
41
+
42
+ def check_required_arguments(call_arguments, required_arguments):
43
+ missing_arguments = [arg for arg in required_arguments if arg not in call_arguments]
44
+ return not bool(missing_arguments), missing_arguments
45
+
46
+ def validate_enum_value(arg_name, arg_value, enum_values):
47
+ if arg_value not in enum_values:
48
+ raise Exception(
49
+ f"Invalid value '{arg_value}' for parameter {arg_name}. Expected one of {', '.join(map(str, enum_values))}"
50
+ )
51
+
52
+ def validate_argument_type(arg_name, arg_value, arg_schema):
53
+ arg_type = arg_schema.get('type', None)
54
+ if arg_type:
55
+ if arg_type == 'string' and 'enum' in arg_schema:
56
+ enum_values = arg_schema['enum']
57
+ if None not in enum_values and enum_values != []:
58
+ try:
59
+ validate_enum_value(arg_name, arg_value, enum_values)
60
+ except Exception as e:
61
+ # Propagate the validation error message
62
+ raise Exception(f"Error validating function call: {e}")
63
+
64
+ python_type = get_python_type(arg_type)
65
+ if not isinstance(arg_value, python_type):
66
+ raise Exception(f"Type mismatch for parameter {arg_name}. Expected: {arg_type}, Got: {type(arg_value)}")
67
+
68
+ def get_python_type(json_type):
69
+ type_mapping = {
70
+ 'string': str,
71
+ 'number': (int, float),
72
+ 'integer': int,
73
+ 'boolean': bool,
74
+ 'array': list,
75
+ 'object': dict,
76
+ 'null': type(None),
77
+ }
78
+ return type_mapping[json_type]
79
+
80
+ def validate_json_data(json_object, json_schema):
81
+ valid = False
82
+ error_message = None
83
+ result_json = None
84
+
85
+ try:
86
+ # Attempt to load JSON using json.loads
87
+ try:
88
+ result_json = json.loads(json_object)
89
+ except json.decoder.JSONDecodeError:
90
+ # If json.loads fails, try ast.literal_eval
91
+ try:
92
+ result_json = ast.literal_eval(json_object)
93
+ except (SyntaxError, ValueError) as e:
94
+ try:
95
+ result_json = extract_json_from_markdown(json_object)
96
+ except Exception as e:
97
+ error_message = f"JSON decoding error: {e}"
98
+ inference_logger.info(f"Validation failed for JSON data: {error_message}")
99
+ return valid, result_json, error_message
100
+
101
+ # Return early if both json.loads and ast.literal_eval fail
102
+ if result_json is None:
103
+ error_message = "Failed to decode JSON data"
104
+ inference_logger.info(f"Validation failed for JSON data: {error_message}")
105
+ return valid, result_json, error_message
106
+
107
+ # Validate each item in the list against schema if it's a list
108
+ if isinstance(result_json, list):
109
+ for index, item in enumerate(result_json):
110
+ try:
111
+ validate(instance=item, schema=json_schema)
112
+ inference_logger.info(f"Item {index+1} is valid against the schema.")
113
+ except ValidationError as e:
114
+ error_message = f"Validation failed for item {index+1}: {e}"
115
+ break
116
+ else:
117
+ # Default to validation without list
118
+ try:
119
+ validate(instance=result_json, schema=json_schema)
120
+ except ValidationError as e:
121
+ error_message = f"Validation failed: {e}"
122
+
123
+ except Exception as e:
124
+ error_message = f"Error occurred: {e}"
125
+
126
+ if error_message is None:
127
+ valid = True
128
+ inference_logger.info("JSON data is valid against the schema.")
129
+ else:
130
+ inference_logger.info(f"Validation failed for JSON data: {error_message}")
131
+
132
+ return valid, result_json, error_message
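
Note: a usage sketch tying the validator to the signatures from functions.get_openai_tools() (hypothetical call dict):

    from functions import get_openai_tools
    from validator import validate_function_call_schema

    tools = get_openai_tools()
    ok, err = validate_function_call_schema(
        {"name": "get_current_stock_price", "arguments": {"symbol": "TSLA"}},
        tools,
    )
    # ok is True when the call matches a signature; otherwise err describes the mismatch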