In [None]:
"""
Example usage of the optimized LLM Model class.

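This notebook demonstrates how to use the Model class for text generation
with different configurations, including chat-based generation. It then
queries the model's `messages` table and runs a small VectorDB
similarity-search example.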
"""


from llm import Model


In [None]:

# Model identifier handed to Model(); kept in one constant so it is easy to swap.
MODEL_ID = "meta-llama/Llama-3.2-3B-Instruct"
model = Model(MODEL_ID)


In [None]:
# The user request sent to the model.
user_prompt = "Explain to me a brand new take on the classic trolly problem."

# Chat context: a single system-role message describing the assistant persona.
system_message = {
    "role": "system",
    "content": "You are an assistant. You are skilled in philosophy, and love to play devils advocate.",
}

# Generation settings forwarded to model.generate() as keyword arguments.
# Not passed (disabled): top_p=.95, top_k=50.
generation_settings = dict(
    max_new_tokens=450,
    temperature=0.7,
    typical_p=0.9,
    length_penalty=0.8,
    no_repeat_ngram_size=3,
    repetition_penalty=1.2,
)

response = model.generate(
    prompt=user_prompt,
    **generation_settings,
    messages=[system_message],
)

print(response)


In [None]:
# Select every row of the `messages` table through the model's database
# connection and load the result into `df` for display.
messages_query = """
SELECT * FROM messages
"""
conn = model.db_conn
conn.execute(messages_query)
df = conn.fetch_df()
df

In [2]:
from vector_db import VectorDB

# Instantiate the vector store and clear it before adding any documents.
db = VectorDB()
db.clear_db()

# Insert two documents one call at a time, keeping each call's return value.
doc1_id = db.add_document("This is a document about artificial intelligence.")
doc2_id = db.add_document("Vector databases are useful for similarity search.")

# Insert several documents with a single call.
batch_texts = [
    "Python is a popular programming language.",
    "Embedding models convert text to vectors.",
    "FAISS is a library for efficient similarity search.",
]
ids = db.add_documents(batch_texts)

print(f"Database now contains {db.get_document_count()} documents")

# Run each query with k=3 and print every (document, score) pair returned.
for query in ("How do AI systems work?", "pink unicorn"):
    print(f"\nSearch: {query}")
    results = db.search(query, k=3)
    for doc, score in results:
        print(f"Score: {score:.4f}, Document: {doc}")

Created new vector database
Database cleared
Database now contains 5 documents

Search: How do AI systems work?
Score: 0.7732, Document: This is a document about artificial intelligence.
Score: 0.6081, Document: Python is a popular programming language.
Score: 0.5993, Document: Embedding models convert text to vectors.

Search: pink unicorn
Score: 0.5702, Document: Python is a popular programming language.
Score: 0.5423, Document: This is a document about artificial intelligence.
Score: 0.5270, Document: Vector databases are useful for similarity search.
