In [None]:
import openai
from qdrant_client import QdrantClient

### Embedding function

In [None]:
def get_embedding(text, model="text-embedding-3-small"):
    """Return the embedding for ``text`` from the OpenAI embeddings endpoint.

    Args:
        text: Value forwarded to the endpoint as ``input``.
        model: Name of the embedding model to request.

    Returns:
        The ``embedding`` attribute of the first item in the response's
        ``data`` list.
    """
    embedding_response = openai.embeddings.create(model=model, input=text)
    first_item = embedding_response.data[0]
    return first_item.embedding

### Retrieval function

In [None]:
# Client for the Qdrant instance at localhost:6333; passed to retrieve_data in the example cells below.
qdrant_client = QdrantClient(url="http://localhost:6333")

In [None]:
def retrieve_data(query, qdrant_client, k=5, collection_name="Amazon-items-collection-00"):
    """Embed ``query`` and fetch up to ``k`` matching points from a Qdrant collection.

    Args:
        query: Text that is embedded with ``get_embedding`` and used as the
            search vector.
        qdrant_client: Client object exposing ``query_points``.
        k: Maximum number of points to request (passed as ``limit``).
        collection_name: Collection to search. Defaults to the collection
            name that used to be hard-coded here, so existing callers are
            unaffected.

    Returns:
        A dict of three parallel lists, in the order the points were returned:
        ``retrieved_context_ids`` (payload ``parent_asin``),
        ``retrieved_context`` (payload ``description``) and
        ``similarity_scores`` (point ``score``).

    Raises:
        KeyError: If a returned point's payload lacks ``parent_asin`` or
            ``description``.
    """
    query_embedding = get_embedding(query)

    results = qdrant_client.query_points(
        collection_name=collection_name,
        query=query_embedding,
        limit=k,
    )
    points = results.points

    return {
        "retrieved_context_ids": [point.payload["parent_asin"] for point in points],
        "retrieved_context": [point.payload["description"] for point in points],
        "similarity_scores": [point.score for point in points],
    }

In [None]:
# Example retrieval: request up to 10 points for a sample question.
retrieved_context = retrieve_data("What kind of earphones can I get?", qdrant_client, k=10)

In [None]:
# Show the raw retrieval result dict (ids, descriptions, scores) as the cell output.
retrieved_context

### Format retrieved context function

In [None]:
def process_context(context):
    """Render retrieved items as text, one ``- <id>: <chunk>`` line per item.

    Args:
        context: Mapping with the keys ``retrieved_context_ids`` and
            ``retrieved_context``; the two sequences are paired positionally.

    Returns:
        A single string in which every item occupies its own
        newline-terminated line. Empty when there are no items.
    """
    item_ids = context["retrieved_context_ids"]
    chunks = context["retrieved_context"]

    # zip() stops at the shorter sequence, so unpaired trailing entries are dropped.
    lines = [f"- {item_id}: {chunk}\n" for item_id, chunk in zip(item_ids, chunks)]
    return "".join(lines)

In [None]:
# Format the example retrieval result into the text block that goes into the prompt.
preprocessed_context = process_context(retrieved_context)

In [None]:
# Print the formatted context already stored in the previous cell instead of recomputing it.
print(preprocessed_context)

### Create Prompt function

In [None]:
def build_prompt(preprocessed_context, question):
    """Build the shopping-assistant prompt for one question.

    Args:
        preprocessed_context: Text block describing the available products;
            inserted verbatim under the ``Context:`` heading.
        question: The user's question; inserted verbatim under the
            ``Question:`` heading.

    Returns:
        The full prompt string. It starts and ends with a newline because the
        template's triple quotes sit on their own lines.
    """
    # Template lines are flush-left on purpose: any indentation inside the
    # triple-quoted string would become part of the prompt text.
    prompt = f"""
You are a shopping assistant that can answer questions about the products in stock.

You will be given a question and a list of context.

Instructions:
- You need to answer the question based on the provided context only.
- Never use word context and refer to it as the available products.

Context:
{preprocessed_context}

Question:
{question}
"""

    return prompt

In [None]:
# Build the example prompt from the formatted context and the sample question.
prompt = build_prompt(preprocessed_context, "What kind of earphones can I get?")

In [None]:
# Print the prompt already built in the previous cell instead of rebuilding it with a duplicated question literal.
print(prompt)

### Generate answer function

In [None]:
def generate_answer(prompt):
    """Send ``prompt`` to the chat completions endpoint and return the reply text.

    Args:
        prompt: Full prompt text; sent as the only message, with role
            ``system``.

    Returns:
        The ``content`` of the first choice's message in the response.
    """
    messages = [{"role": "system", "content": prompt}]
    completion = openai.chat.completions.create(
        model="gpt-4.1-mini",
        messages=messages,
        temperature=0.5,
    )
    first_choice = completion.choices[0]
    return first_choice.message.content

In [None]:
# Send the example prompt to the chat model and print the generated answer.
print(generate_answer(prompt))

### Combined RAG Pipeline

In [None]:
def rag_pipeline(question, top_k=5, qdrant_client=None):
    """Answer ``question`` end to end: retrieve, format, build prompt, generate.

    Args:
        question: The user's question; used both as the retrieval query and
            in the prompt.
        top_k: Maximum number of items to retrieve.
        qdrant_client: Optional client to reuse for retrieval. When omitted,
            a client for ``http://localhost:6333`` is created for this call
            and closed once retrieval has finished.

    Returns:
        The answer text produced by ``generate_answer``.
    """
    # Only close a client this call created; a caller-supplied client stays open.
    owns_client = qdrant_client is None
    if owns_client:
        qdrant_client = QdrantClient(url="http://localhost:6333")

    try:
        retrieved_context = retrieve_data(question, qdrant_client, top_k)
    finally:
        if owns_client:
            qdrant_client.close()

    preprocessed_context = process_context(retrieved_context)
    prompt = build_prompt(preprocessed_context, question)
    answer = generate_answer(prompt)

    return answer


In [None]:
# Run the whole pipeline on a sample question with the default top_k and print the answer.
print(rag_pipeline("Can I get some cool stuff for kids?"))