In [2]:
import sys

from smolagents.models import Model

In [9]:
from smolagents.models import OpenAIServerModel
import os
from dotenv import load_dotenv
load_dotenv()

# Chat model reached through the NVIDIA endpoint via smolagents' OpenAI-style client.
# The API key is read from the NV_DEV_API_KEY environment variable; if the
# variable is missing, the lookup below raises KeyError.
model_id = "nvdev/meta/llama-3.1-405b-instruct"
base_url = "https://integrate.api.nvidia.com/v1"

model = OpenAIServerModel(
    model_id=model_id,
    api_base=base_url,
    api_key=os.environ["NV_DEV_API_KEY"],
    temperature=0.1,
)

In [4]:
from smolagents import CodeAgent

# Bare agent: no custom tools, and the library's base tools are switched off.
agent = CodeAgent(model=model, tools=[], add_base_tools=False)

agent.run("Could you give me the 11th number in the Fibonacci sequence?")

55

---
## Modifying the system prompt of the CodeAgent


Default system prompt:

```
You are an expert assistant who can solve any task using code blobs. You will be given a task to solve as best you can.
To do so, you have been given access to a list of tools: these tools are basically Python functions which you can call with code.
To solve the task, you must plan forward to proceed in a series of steps, in a cycle of 'Thought:', 'Code:', and 'Observation:' sequences.

At each step, in the 'Thought:' sequence, you should first explain your reasoning towards solving the task and the tools that you want to use.
Then in the 'Code:' sequence, you should write the code in simple Python. The code sequence must end with '<end_code>' sequence.
During each intermediate step, you can use 'print()' to save whatever important information you will then need.
These print outputs will then appear in the 'Observation:' field, which will be available as input for the next step.
In the end you have to return a final answer using the `final_answer` tool.

Here are a few examples using notional tools:
---

{examples}

Above example were using notional tools that might not exist for you. On top of performing computations in the Python code snippets that you create, you only have access to these tools:

{{tool_descriptions}}

{{managed_agents_descriptions}}

Here are the rules you should always follow to solve your task:
1. Always provide a 'Thought:' sequence, and a 'Code:\n```py' sequence ending with '```<end_code>' sequence, else you will fail.
2. Use only variables that you have defined!
3. Always use the right arguments for the tools. DO NOT pass the arguments as a dict as in 'answer = wiki({'query': "What is the place where James Bond lives?"})', but use the arguments directly as in 'answer = wiki(query="What is the place where James Bond lives?")'.
4. Take care to not chain too many sequential tool calls in the same code block, especially when the output format is unpredictable. For instance, a call to search has an unpredictable return format, so do not have another tool call that depends on its output in the same block: rather output results with print() to use them in the next block.
5. Call a tool only when needed, and never re-do a tool call that you previously did with the exact same parameters.
6. Don't name any new variable with the same name as a tool: for instance don't name a variable 'final_answer'.
7. Never create any notional variables in our code, as having these in your logs might derail you from the true variables.
8. You can use imports in your code, but only from the following list of modules: {{authorized_imports}}
9. The state persists between code executions: so if in one step you've created variables or imported modules, these will all persist.
10. Don't give up! You're in charge of solving the task, not providing directions to solve it.

Now Begin! If you solve the task correctly, you will receive a reward of $1,000,000.
```

As you can see, there are placeholders like "{{tool_descriptions}}": these will be used upon agent initialization to insert certain automatically generated descriptions of tools or managed agents.

So while you can overwrite this system prompt template by passing your custom prompt as an argument to the system_prompt parameter, your new system prompt must contain the following placeholders:

* "{{tool_descriptions}}" to insert tool descriptions.
* "{{managed_agents_descriptions}}" to insert the description for managed agents if there are any.
* For CodeAgent only: "{{authorized_imports}}" to insert the list of authorized imports.


In [11]:
# Show the system prompt template currently attached to the agent.
agent.system_prompt_template

'You are an expert assistant who can solve any task using code blobs. You will be given a task to solve as best you can.\nTo do so, you have been given access to a list of tools: these tools are basically Python functions which you can call with code.\nTo solve the task, you must plan forward to proceed in a series of steps, in a cycle of \'Thought:\', \'Code:\', and \'Observation:\' sequences.\n\nAt each step, in the \'Thought:\' sequence, you should first explain your reasoning towards solving the task and the tools that you want to use.\nThen in the \'Code:\' sequence, you should write the code in simple Python. The code sequence must end with \'<end_code>\' sequence.\nDuring each intermediate step, you can use \'print()\' to save whatever important information you will then need.\nThese print outputs will then appear in the \'Observation:\' field, which will be available as input for the next step.\nIn the end you have to return a final answer using the `final_answer` tool.\n\nHere

In [6]:
from smolagents import CodeAgent, HfApiModel, tool
# NOTE: the docstring below is kept verbatim because smolagents' @tool builds
# the tool description shown to the model from the docstring and type hints.
# A later cell defines query_google again; whichever cell ran last wins.
@tool
def query_google(user_query: str) -> str:
    """query google search engine per input user query

    Args:
        user_query: the user input
    """
    # All HTTP and HTML work lives in parse_google_search. Imports placed in
    # this function would be local to it and invisible to that helper, so
    # none are made here.
    return parse_google_search(user_query)
def parse_google_search(query, top_n=1):
    """Fetch a Google results page and return the leading hits as text.

    Args:
        query: Search terms, sent to Google as the ``q`` parameter.
        top_n: Maximum number of hits to return (defaults to 1).

    Returns:
        One line per hit in the form ``"<url> <title>"``, joined with
        newlines; an empty string when no hit could be extracted.
    """
    # Imported locally so the helper works on its own: imports made inside
    # query_google are local to that function and never reach this scope.
    import requests
    from bs4 import BeautifulSoup

    headers = {'User-Agent': "Mozilla/5.0 (Windows NT 6.1; rv:109.0) Gecko/20100101 Firefox/113.0"}
    # Let requests build the query string so spaces, '&', '#', '?' etc. are
    # percent-encoded instead of corrupting the URL.
    response = requests.get(
        'https://www.google.com/search',
        params={'q': query},
        headers=headers,
        timeout=30,  # never hang the agent on an unresponsive connection
    )
    soup = BeautifulSoup(response.content, "html.parser")

    results = []
    # Result entries are looked up as <div class="g"> elements.
    for block in soup.find_all('div', {'class': 'g'}):
        if len(results) >= top_n:
            break
        link = block.find('a')
        heading = block.find('h3')
        # Skip blocks that are not ordinary hits (no anchor or no title)
        # rather than swallowing the resulting exception.
        if link is None or heading is None:
            continue
        url = link.get("href")
        if not url:
            continue
        # Store plain strings so the final join cannot fail on nested lists.
        results.append(f"{url} {heading.text}")

    return '\n'.join(results)




In [18]:
from typing import Optional
from smolagents import CodeAgent, tool
from langchain.document_loaders import WebBaseLoader
# NOTE: the docstring below is kept verbatim because smolagents' @tool builds
# the tool description shown to the model from the docstring and type hints.
@tool
def query_google(user_query: str) -> str:
    """query google search engine per input user query

    Args:
        user_query: the user input
    """
    # The helpers import what they need themselves, so no imports are
    # repeated here.
    url = parse_google_search(user_query)
    # Echo the chosen link so the notebook output shows which page was read.
    print(url)
    return fetch_text_from_url(url)
def parse_google_search(query):
    """Return the URL of the first usable hit on a Google results page.

    Args:
        query: Search terms, sent to Google as the ``q`` parameter.

    Returns:
        The ``href`` of the first result block that has both a link and an
        ``<h3>`` title.

    Raises:
        LookupError: If the page contains no such result block (for example
            when the response is not a normal results page).
    """
    import requests
    from bs4 import BeautifulSoup

    headers = {'User-Agent': "Mozilla/5.0 (Windows NT 6.1; rv:109.0) Gecko/20100101 Firefox/113.0"}
    # Let requests build the query string so spaces, '&', '#', '?' etc. are
    # percent-encoded instead of corrupting the URL.
    response = requests.get(
        'https://www.google.com/search',
        params={'q': query},
        headers=headers,
        timeout=30,  # never hang the agent on an unresponsive connection
    )
    soup = BeautifulSoup(response.content, "html.parser")

    # Result entries are looked up as <div class="g"> elements.
    for block in soup.find_all('div', {'class': 'g'}):
        link = block.find('a')
        heading = block.find('h3')
        # Skip blocks without an anchor or a title instead of hiding the
        # failure behind a bare except.
        if link is None or heading is None:
            continue
        url = link.get("href")
        if url:
            return url

    # Fail with an explicit message rather than an UnboundLocalError on an
    # unassigned local.
    raise LookupError(f"No Google search result found for query: {query!r}")
def fetch_text_from_url(url):
    """Download a web page and return its text as a single line.

    Args:
        url: Address of the page to load with LangChain's ``WebBaseLoader``.

    Returns:
        The ``page_content`` of the first loaded document with every run of
        whitespace (newlines included) collapsed to one space, or an empty
        string if the loader returned no documents.
    """
    from langchain.document_loaders import WebBaseLoader

    documents = WebBaseLoader(url).load()
    if not documents:
        return ""
    # Deleting newlines outright would glue the last word of one line to the
    # first word of the next; split()/join keeps words separated while still
    # flattening the text.
    return " ".join(documents[0].page_content.split())
# Rebuild the agent with the query_google tool, and let the code it writes
# import langchain, requests and bs4.
agent = CodeAgent(
    tools=[query_google],
    model=model,
    additional_authorized_imports=["langchain", "requests", "bs4"],
)
agent.run("how do I update submodule with a specific cherry-picked commit in VScode?")

https://miroslav-slapka.medium.com/handle-git-submodules-with-ease-55621afdb7bb


https://miroslav-slapka.medium.com/handle-git-submodules-with-ease-55621afdb7bb


'To update a submodule with a specific cherry-picked commit in VSCode, click on the synchronization icon next to the branch name in the Source Control panel or use the command `git submodule update --remote --merge`.'

In [10]:
# Request a function that base64-encodes the image at /workspace/sample.png.
agent.run("write a python function to convert image at this path '/workspace/sample.png' to base64 string")

'Cannot convert image to base64 string without permission to read files'

In [14]:
# Ask for a scraping snippet for the NVIDIA blog URL; the prompt tells the
# agent to show the code without executing it.
agent.run("Can you write python code for webpage scraping, use this url: https://developer.nvidia.com/blog/build-your-first-human-in-the-loop-ai-agent-with-nvidia-nim/, do NOT execute the code, I just want to see the python code snippet.")

'Code snippet successfully printed'