In [12]:
import argparse
import torch
import json

from transformers import (
    AutoModelForCausalLM,
    AutoTokenizer,
    BitsAndBytesConfig
)

import functions
from prompter import PromptManager
from validator import validate_function_call_schema

from utils import (
    print_nous_text_art,
    inference_logger,
    get_assistant_message,
    get_chat_template,
    validate_and_extract_tool_calls
)

  from .autonotebook import tqdm as notebook_tqdm


In [17]:
# --- Model / tokenizer setup -------------------------------------------------
# Loads the causal LM and its tokenizer, makes sure the tokenizer has a chat
# template, and logs the resulting configuration via inference_logger.
model_path = 'NousResearch/Hermes-2-Pro-Mistral-7B'

# Template name handed to get_chat_template() when the tokenizer has no chat
# template of its own. This name was previously never assigned in the notebook,
# so the fallback branch below raised NameError on a fresh kernel.
# NOTE(review): "chatml" is assumed to be a name get_chat_template accepts — confirm
# against utils.get_chat_template.
chat_template = "chatml"

# Kept as the *string* "True"/"False" (not a bool); the check below compares
# against the literal "True".
load_in_4bit = "False"
prompter = PromptManager()
bnb_config = None

# Only build a quantization config when 4-bit loading was requested; otherwise
# quantization_config=None is passed to from_pretrained.
if load_in_4bit == "True":
    bnb_config = BitsAndBytesConfig(
        load_in_4bit=True,
        bnb_4bit_quant_type="nf4",
        bnb_4bit_use_double_quant=True,
    )

model = AutoModelForCausalLM.from_pretrained(
    model_path,
    trust_remote_code=True,
    return_dict=True,
    quantization_config=bnb_config,
    torch_dtype=torch.float16,
    attn_implementation="flash_attention_2",
    device_map="auto",
)

tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
# Reuse the EOS token for padding and pad on the left.
tokenizer.pad_token = tokenizer.eos_token
tokenizer.padding_side = "left"

# Fallback: install a chat template only if the tokenizer does not define one.
if tokenizer.chat_template is None:
    print("No chat template defined, getting chat_template...")
    tokenizer.chat_template = get_chat_template(chat_template)

inference_logger.info(model.config)
inference_logger.info(model.generation_config)
inference_logger.info(tokenizer.special_tokens_map)

2024-04-18:11:22:34,598 INFO     [modeling.py:940] We will use 90% of the memory on device 0 for storing the model, and 10% for the buffer to avoid OOM. You can set `max_memory` in to a higher value to use more memory (at your own risk).
Loading checkpoint shards: 100%|██████████| 4/4 [00:09<00:00,  2.40s/it]
Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.
Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.
2024-04-18:11:22:45,862 INFO     [2517625324.py:32] MistralConfig {
  "_name_or_path": "NousResearch/Hermes-2-Pro-Mistral-7B",
  "architectures": [
    "MistralForCausalLM"
  ],
  "attention_dropout": 0.0,
  "bos_token_id": 1,
  "eos_token_id": 32000,
  "hidden_act": "silu",
  "hidden_size": 4096,
  "initializer_range": 0.02,
  "intermediate_size": 14336,
  "max_position_embeddings": 32768,
  "model_type": "mistral",
  "num_attention_heads": 32,
  "

In [20]:
# Build a single-turn chat for the stock-price question and render it into a
# prompt together with the tool signatures exposed by the `functions` module.
query = "I need the current stock price of Tesla (TSLA)"

# The user's question followed by a first-turn reminder on its own line.
user_message = query + "\nThis is the first turn and you don't have <tool_results> to analyze yet"

chat = [dict(role="user", content=user_message)]
tools = functions.get_openai_tools()
prompt = prompter.generate_prompt(
    chat,
    tools,
    num_fewshot=None,
)
# completion = run_inference(prompt)

In [28]:
from pprint import pprint

# Show the 'content' field of the first message in the generated prompt.
print(
    prompt[0]["content"]
)

You are a function calling AI agent with self-recursion. You can call only one function at a time and analyse data you get from function response. You are provided with function signatures within <tools></tools> XML tags. The current date is: 2024-04-18. You may use agentic frameworks for reasoning and planning to help with user query. Please call a function and wait for function results to be provided to you in the next iteration. Don't make assumptions about what values to plug into function arguments. Once you have called a function, results will be fed back to you within <tool_response></tool_response> XML tags. Don't make assumptions about tool results if <tool_response> XML tags are not present since function hasn't been executed yet. Analyze the data once you get the results and call another function. At each iteration please continue adding the your analysis to previous summary. Your final response should directly answer the user query with an anlysis or summary of the results 

In [31]:
# Prints a hard-coded, pasted copy of a system prompt as one triple-quoted
# literal. Nothing here is computed from `prompt` or `tools`: the date and the
# tool list are frozen in the text. Because the literal is not a raw string,
# the `\n` escape sequences inside the tool descriptions are emitted as real
# line breaks when printed.
print("""You are a function calling AI agent with self-recursion. You can call only one function at a time and analyse data you get from function response. You are provided with function signatures within <tools></tools> XML tags. The current date is: 2024-04-18. You may use agentic frameworks for reasoning and planning to help with user query. Please call a function and wait for function results to be provided to you in the next iteration. Don't make assumptions about what values to plug into function arguments. Once you have called a function, results will be fed back to you within <tool_response></tool_response> XML tags. Don't make assumptions about tool results if <tool_response> XML tags are not present since function hasn't been executed yet. Analyze the data once you get the results and call another function. At each iteration please continue adding the your analysis to previous summary. Your final response should directly answer the user query with an anlysis or summary of the results of function calls. 
Here are the available tools: <tools> [{'type': 'function', 'function': {'name': 'code_interpreter', 'description': 'code_interpreter(code_markdown: str) -> dict | str - Execute the provided Python code string on the terminal using exec.\n\n    The string should contain valid, executable and pure Python code in markdown syntax.\n    Code should also import any required Python packages.\n\n    Args:\n        code_markdown (str): The Python code with markdown syntax to be executed.\n            For example: ```python\n<code-string>\n```\n\n    Returns:\n        dict | str: A dictionary containing variables declared and values returned by function calls,\n            or an error message if an exception occurred.\n\n    Note:\n        Use this function with caution, as executing arbitrary code can pose security risks.', 'parameters': {'type': 'object', 'properties': {'code_markdown': {'type': 'string'}}, 'required': ['code_markdown']}}}, {'type': 'function', 'function': {'name': 'google_search_and_scrape', 'description': 'google_search_and_scrape(query: str) -> dict - Performs a Google search for the given query, retrieves the top search result URLs,\n    and scrapes the text content and table data from those pages in parallel.\n\n    Args:\n        query (str): The search query.\n    Returns:\n        list: A list of dictionaries containing the URL, text content, and table data for each scraped page.', 'parameters': {'type': 'object', 'properties': {'query': {'type': 'string'}}, 'required': ['query']}}}, {'type': 'function', 'function': {'name': 'get_current_stock_price', 'description': 'get_current_stock_price(symbol: str) -> float - Get the current stock price for a given symbol.\n\n  Args:\n    symbol (str): The stock symbol.\n\n  Returns:\n    float: The current stock price, or None if an error occurs.', 'parameters': {'type': 'object', 'properties': {'symbol': {'type': 'string'}}, 'required': ['symbol']}}}, {'type': 'function', 'function': {'name': 
'get_company_news', 'description': 'get_company_news(symbol: str) -> pandas.core.frame.DataFrame - Get company news and press releases for a given stock symbol.\n\n    Args:\n    symbol (str): The stock symbol.\n\n    Returns:\n    pd.DataFrame: DataFrame containing company news and press releases.', 'parameters': {'type': 'object', 'properties': {'symbol': {'type': 'string'}}, 'required': ['symbol']}}}, {'type': 'function', 'function': {'name': 'get_company_profile', 'description': 'get_company_profile(symbol: str) -> dict - Get company profile and overview for a given stock symbol.\n\n    Args:\n    symbol (str): The stock symbol.\n\n    Returns:\n    dict: Dictionary containing company profile and overview.', 'parameters': {'type': 'object', 'properties': {'symbol': {'type': 'string'}}, 'required': ['symbol']}}}, {'type': 'function', 'function': {'name': 'get_stock_fundamentals', 'description': "get_stock_fundamentals(symbol: str) -> dict - Get fundamental data for a given stock symbol using yfinance API.\n\n    Args:\n        symbol (str): The stock symbol.\n\n    Returns:\n        dict: A dictionary containing fundamental data.\n            Keys:\n                - 'symbol': The stock symbol.\n                - 'company_name': The long name of the company.\n                - 'sector': The sector to which the company belongs.\n                - 'industry': The industry to which the company belongs.\n                - 'market_cap': The market capitalization of the company.\n                - 'pe_ratio': The forward price-to-earnings ratio.\n                - 'pb_ratio': The price-to-book ratio.\n                - 'dividend_yield': The dividend yield.\n                - 'eps': The trailing earnings per share.\n                - 'beta': The beta value of the stock.\n                - '52_week_high': The 52-week high price of the stock.\n                - '52_week_low': The 52-week low price of the stock.", 'parameters': {'type': 'object', 'properties': {'symbol': 
{'type': 'string'}}, 'required': ['symbol']}}}, {'type': 'function', 'function': {'name': 'get_financial_statements', 'description': 'get_financial_statements(symbol: str) -> dict - Get financial statements for a given stock symbol.\n\n    Args:\n    symbol (str): The stock symbol.\n\n    Returns:\n    dict: Dictionary containing financial statements (income statement, balance sheet, cash flow statement).', 'parameters': {'type': 'object', 'properties': {'symbol': {'type': 'string'}}, 'required': ['symbol']}}}, {'type': 'function', 'function': {'name': 'get_key_financial_ratios', 'description': 'get_key_financial_ratios(symbol: str) -> dict - Get key financial ratios for a given stock symbol.\n\n    Args:\n    symbol (str): The stock symbol.\n\n    Returns:\n    dict: Dictionary containing key financial ratios.', 'parameters': {'type': 'object', 'properties': {'symbol': {'type': 'string'}}, 'required': ['symbol']}}}, {'type': 'function', 'function': {'name': 'get_analyst_recommendations', 'description': 'get_analyst_recommendations(symbol: str) -> pandas.core.frame.DataFrame - Get analyst recommendations for a given stock symbol.\n\n    Args:\n    symbol (str): The stock symbol.\n\n    Returns:\n    pd.DataFrame: DataFrame containing analyst recommendations.', 'parameters': {'type': 'object', 'properties': {'symbol': {'type': 'string'}}, 'required': ['symbol']}}}, {'type': 'function', 'function': {'name': 'get_dividend_data', 'description': 'get_dividend_data(symbol: str) -> pandas.core.frame.DataFrame - Get dividend data for a given stock symbol.\n\n    Args:\n    symbol (str): The stock symbol.\n\n    Returns:\n    pd.DataFrame: DataFrame containing dividend data.', 'parameters': {'type': 'object', 'properties': {'symbol': {'type': 'string'}}, 'required': ['symbol']}}}, {'type': 'function', 'function': {'name': 'get_technical_indicators', 'description': 'get_technical_indicators(symbol: str) -> pandas.core.frame.DataFrame - Get technical indicators for a given 
stock symbol.\n\n    Args:\n    symbol (str): The stock symbol.\n\n    Returns:\n    pd.DataFrame: DataFrame containing technical indicators.', 'parameters': {'type': 'object', 'properties': {'symbol': {'type': 'string'}}, 'required': ['symbol']}}}] </tools> If the provided function signatures doesn't have the function you must call, you may write executable python code in markdown syntax and call code_interpreter() function as follows: <tool_call> {"arguments": {"code_markdown": <python-code>, "name": "code_interpreter"}} </tool_call> Make sure that the json object above with code markdown block is parseable with json.loads() and the XML block with XML ElementTree. Use the following pydantic model json schema for each tool call you will make: {'properties': {'arguments': {'title': 'Arguments', 'type': 'object'}, 'name': {'title': 'Name', 'type': 'string'}}, 'required': ['arguments', 'name'], 'title': 'FunctionCall', 'type': 'object'} At the very first turn you don't have <tool_results> so you shouldn't not make up the results.
Please keep a running summary with analysis of previous function results and summaries from previous iterations.
Do not stop calling functions until the task has been accomplished or you've reached max iteration of 10.
Calling multiple functions at once can overload the system and increase cost so call one function at a time please.
If you plan to continue with analysis, always call another function.
For each function call return a valid json object (using doulbe quotes) with function name and arguments within <tool_call></tool_call> XML tags as follows:
<tool_call>
{"arguments": <args-dict>, "name": <function-name>}
</tool_call>""")

You are a function calling AI agent with self-recursion. You can call only one function at a time and analyse data you get from function response. You are provided with function signatures within <tools></tools> XML tags. The current date is: 2024-04-18. You may use agentic frameworks for reasoning and planning to help with user query. Please call a function and wait for function results to be provided to you in the next iteration. Don't make assumptions about what values to plug into function arguments. Once you have called a function, results will be fed back to you within <tool_response></tool_response> XML tags. Don't make assumptions about tool results if <tool_response> XML tags are not present since function hasn't been executed yet. Analyze the data once you get the results and call another function. At each iteration please continue adding the your analysis to previous summary. Your final response should directly answer the user query with an anlysis or summary of the results 