In [4]:
from src.youtube_scraper import fetchYouTubeComments
from src.data_cleaning import cleanData
from src.upload_vector_db import uploadToVectorDB
from src.semantic_search import getSemanticSearchResults
from src.llm_interface import callLLM

In [5]:
# User inputs: the prompts sent through semantic search and the LLM,
# and the YouTube video IDs whose comments populate the vector database.
prompts = [
    "I love the Civic Si, I may buy one",
    "The Civic Si sucks, too slow for me",
    "This is one of the best daily drivers that money can buy",
    "The Mazda is better",
]

video_ids = [
    "RrZSuz-e9NY",
    "gGmdz9tA1Y8",
    "rGMWjQX5LG8",
    "nafje4-tv-w",
    "JcvQC0eYwJA",
    "DkW0Fr5KGf0",
    "ezgZCGM-_bg",
    "f6WAqT6073w",
    "F8IEZHeycS4",
    "VY91tZ3m-qU",
    "wczsTzaIgcE",
    "1h4MB5K_w1I",
    "JOp1xZrbuQM",
    "_e5mIqafwMA",
    "evTLpZZp6R0",
    "pUTj3C-Owx8",
]

In [3]:
# Note: if you pulled the entire repo from GitHub, there is no need to run the cell below.
# The cell below creates the vector database,
# but if the entire repo was pulled, the entire database already exists.
# In that case you can skip to the last cell, which prompts the LLM.

# However, prompting the LLM assumes you have installed Ollama and llama2:7B locally (and that your machine can run it).

In [4]:
# Build the vector database in three stages: fetch -> clean -> upload.

# 1. Fetch the comments for the configured videos
raw_comments = fetchYouTubeComments(video_ids)

# 2. Clean the fetched data (`output` ends up holding the cleaned result)
output = cleanData(raw_comments)

# 3. Upload the cleaned data to the vector DB
uploadToVectorDB(output)

In [6]:
# The earlier steps can be skipped when the vector database already exists
# (created previously or pulled from GitHub). This cell can be re-run with
# new prompts as many times as you like.
for user_prompt in prompts:
    # 4. Semantic search for this prompt
    matched_comments, matched_replies = getSemanticSearchResults(user_prompt)

    # 5. Ask the LLM for a response based on the search results and the prompt
    llm_reply = callLLM(matched_comments, matched_replies, user_prompt)

    # Trailing newlines separate one prompt's output from the next
    print(llm_reply + "\n\n")

Comment: I love the Civic Si, I may buy one
Reply: That's great to hear! The Civic Si has always been a fan favorite for its sporty performance and handling. If you do decide to get one, make sure to check out the reviews on the new features like the 1.5L turbo engine and the adaptive damper system.


Comment: The Civic Si sucks, too slow for me
Reply: Have you considered the 0-60 acceleration or quarter-mile time? The touring model is actually only one second slower in the quarter and has similar 0-60 times to the Si.


Comment: This is one of the best daily drivers that money can buy
Reply: I agree completely, the Honda Civic Si has proven itself to be an excellent choice for daily driving, offering a perfect blend of performance and practicality.


Here's my response:

Comment: The Mazda is better
Reply: That's a common opinion, but some of us still love our Honda Civic Si for its sporty vibe and daily drivability.


