In [None]:
import faiss
import numpy as np
from sentence_transformers import SentenceTransformer

# Sentence-embedding model shared by the documents and the query
embed_model = SentenceTransformer("all-MiniLM-L6-v2")

# Toy knowledge base: each string is one retrievable fact
documents = [
    "Cornell University was founded in 1865.",
    "LLMs require large datasets for training.",
]
doc_embeddings = embed_model.encode(documents)

# Flat L2 index sized to the embedding width, then filled with the documents
embedding_dim = doc_embeddings.shape[1]
index = faiss.IndexFlatL2(embedding_dim)
index.add(np.array(doc_embeddings))

# Embed the question; it is passed as a single-item list, like the documents
query = "When was Cornell University founded?"
query_embedding = embed_model.encode([query])

# Ask the index for the single nearest document (k=1); distances are unused
_, closest_doc_index = index.search(np.array(query_embedding), 1)
top_hit = closest_doc_index[0][0]  # first (only) query, first (best) neighbour
best_match = documents[top_hit]

print(f"Retrieved Fact: {best_match}")