In [None]:
import os

# Switch this kernel process to debug-level logging via the LOG_LEVEL
# environment variable.
# NOTE(review): presumably tt_bot's logger reads LOG_LEVEL, which would be
# why this cell sits ahead of the tt_bot imports -- confirm.
os.environ.update(LOG_LEVEL="debug")

In [None]:
from tt_bot.retrievals import WebRetrieval
from tt_bot.search_engines import GoogleSearchEngine
from tt_bot.text_encoders import OpenAIEncoder
from tt_bot.web_extractors import (
    HTMLExtractor,
    WikiExtractor,
    LinkedinExtractor,
)

from tt_bot.logger import get_logger
from tt_bot.utils.json_data import get_pretty

In [None]:
# Notebook-wide logger, obtained from the project's get_logger helper and
# named after the current module (__name__ is "__main__" inside a kernel).
logger = get_logger(__name__)

In [None]:
# Build the three collaborators WebRetrieval is wired with: a search engine,
# a text encoder and a set of web extractors. All are constructed with their
# default arguments.
search_engine = GoogleSearchEngine()
text_encoder = OpenAIEncoder()

# Extractors are registered under string keys ("html", "wikipedia",
# "linkedin").
# NOTE(review): presumably WebRetrieval picks an extractor by these keys --
# confirm against its implementation.
extractors = dict(
    html=HTMLExtractor(),
    wikipedia=WikiExtractor(),
    linkedin=LinkedinExtractor(),
)

# Assemble the retrieval object used by the query cell below.
web_retrieval = WebRetrieval(
    search_engine=search_engine, text_encoder=text_encoder, extractors=extractors
)

In [None]:
query_text = "who is Julián Ansaldo?"
retrieval_responses = await web_retrieval.retrieve(query_text=query_text)
logger.info(get_pretty(list(map(dict, retrieval_responses))))