In [1]:
from langchain_chroma import Chroma
from langchain_openai import OpenAIEmbeddings

# Directory (relative to the current working directory) handed to Chroma as its
# persistence location.
vectorstore_path = "./chroma"

# Embedding model handed to the store, built on its own line so the Chroma call stays short.
# NOTE(review): OpenAIEmbeddings presumably needs OPENAI_API_KEY to be available
# here — confirm it is set before this cell runs.
embedding_function = OpenAIEmbeddings(model="text-embedding-3-small")
db = Chroma(persist_directory=vectorstore_path, embedding_function=embedding_function)

In [7]:
# Ask the vector store for up to k=5 documents matching the question, then
# print the text of each returned document.
question = "Does knowing how to build RAGs helpful for getting a job in Machine Learning"
retriever = db.as_retriever(search_kwargs=dict(k=5))
documents = retriever.invoke(question)
for hit in documents:
    print(hit.page_content)

**Responsibilities**

*   Work closely with stakeholders to understand user requirements and translate them into scalable AI solutions.
*   Continuously monitor and refine LLM systems to ensure optimal performance and alignment with evolving business needs.
*   Experiment with and implement state-of-the-art methodologies to improve AI model performance and reliability.
*   Collaborate with the broader team to prioritize and deliver impactful features on time.

**Skillset & Experience**

*   Proven experience deploying and optimizing large language models in production environments.
*   Hands-on expertise in designing and implementing retrieval-augmented generation (RAG) systems.
*   A strong background in building evaluation frameworks and improving AI systems iteratively.
*   Familiarity with cloud platforms such as Google Cloud Platform (GCP) or similar environments.
*   Adaptability and a problem-solving mindset to thrive in fast-paced, high-ambiguity situations.
**We're interested 

In [2]:
import os
import getpass
from langchain_community.tools.tavily_search import TavilySearchResults

def _set_env(var: str):
    """Ensure the environment variable ``var`` holds a non-empty value.

    If ``os.environ`` already has a truthy value for ``var`` nothing happens.
    Otherwise the value is read with ``getpass.getpass`` (prompt ``"<var>: "``)
    and stored in ``os.environ``.

    Args:
        var: Name of the environment variable to check and, if needed, fill in.
    """
    if os.environ.get(var):
        # Already set to something non-empty; keep it and skip the prompt.
        return
    os.environ[var] = getpass.getpass(f"{var}: ")

# Prompt for any service credential that is not yet in the environment,
# before the search tool below is created.
for required_key in ("OPENAI_API_KEY", "TAVILY_API_KEY"):
    _set_env(required_key)
os.environ["TOKENIZERS_PARALLELISM"] = "true"

# Search tool configured with max_results=4. The bare call on the last line is
# left as an expression so the notebook renders its return value as cell output.
web_search_tool = TavilySearchResults(max_results=4)
web_search_tool.invoke({"query": "What is deepseek"})

[{'url': 'https://ai.nd.edu/news/deepseek-explained-what-is-it-and-is-it-safe-to-use/',
  'content': 'DeepSeek refers to a new set of frontier AI models from a Chinese startup of the same name. DeepSeek has caused quite a stir in the AI world this week by demonstrating capabilities competitive with – or in some cases, better than – the latest models from OpenAI, while purportedly costing only a fraction of the money and compute power to create. DeepSeek models and their derivatives are all available for public download on Hugging Face, a prominent site for sharing AI/ML models. Did DeepSeek steal data to build its models? OpenAI recently accused DeepSeek of inappropriately using data pulled from one of its models to train DeepSeek. More About the DeepSeek Models'},
 {'url': 'https://www.techtarget.com/WhatIs/feature/DeepSeek-explained-Everything-you-need-to-know',
  'content': "DeepSeek, a Chinese AI firm, is disrupting the industry with its low-cost, open source large language models,