In [1]:
import chromadb

In [2]:
# Create a Chroma client with default settings (no arguments are passed).
# NOTE(review): no storage path is configured here, so the data presumably lives
# only in memory for this session — confirm against the installed chromadb version.
client = chromadb.Client()

In [3]:
# Open the "toyota_cars" collection, creating it only if it does not exist yet.
# create_collection() raises when the name is already taken, which breaks a
# re-run of this cell in the same session; get_or_create_collection() can be
# executed repeatedly without error.
collection = client.get_or_create_collection(name="toyota_cars")

In [4]:
# Report the collection's name and its current document count, one per line.
print(
    f"Collection created: {collection.name}",
    f"Documents: {collection.count()}",
    sep="\n",
)

Collection created: toyota_cars
Documents: 0


In [5]:
# Insert a single record: the Corolla description plus its id and metadata.
corolla_description = "Toyota Corolla: Affordable sedan, excellent fuel efficiency, perfect for daily commuting"
corolla_metadata = {"model": "Corolla", "type": "Sedan", "price": 22000}

# Every argument is a list, even for one record; position 0 of each list
# describes the same entry.
collection.add(
    ids=["corolla_2024"],
    documents=[corolla_description],
    metadatas=[corolla_metadata],
)

In [6]:
# Re-check the document count now that the Corolla record has been added.
print(f"Documents: {collection.count()}")

Documents: 1


In [7]:
# Add the RAV4 and the Camry in one batched call.
# Each tuple is (id, document text, metadata) for one car.
new_cars = [
    (
        "rav4_2024",
        "Toyota RAV4: Versatile SUV, hybrid available, great for families",
        {"model": "RAV4", "type": "SUV", "price": 28000},
    ),
    (
        "camry_2024",
        "Toyota Camry: Premium sedan, powerful engine, ideal for professionals",
        {"model": "Camry", "type": "Sedan", "price": 26000},
    ),
]

# Transpose the per-car tuples into the three parallel lists that add() takes.
car_ids, car_documents, car_metadatas = (list(column) for column in zip(*new_cars))

collection.add(ids=car_ids, documents=car_documents, metadatas=car_metadatas)

In [8]:
# Re-check the document count after the batched add of the RAV4 and Camry.
print(f"Documents: {collection.count()}")

Documents: 3


In [9]:
# Search the collection with the free-text phrase "family car" and ask for
# two results back.
search_phrases = ["family car"]
results = collection.query(query_texts=search_phrases, n_results=2)


In [10]:
# Display the raw query response. As the output shows, 'ids', 'documents',
# 'metadatas' and 'distances' are each a list holding one inner list per query text.
results

{'ids': [['rav4_2024', 'corolla_2024']],
 'embeddings': None,
 'documents': [['Toyota RAV4: Versatile SUV, hybrid available, great for families',
   'Toyota Corolla: Affordable sedan, excellent fuel efficiency, perfect for daily commuting']],
 'uris': None,
 'included': ['metadatas', 'documents', 'distances'],
 'data': None,
 'metadatas': [[{'type': 'SUV', 'price': 28000, 'model': 'RAV4'},
   {'type': 'Sedan', 'price': 22000, 'model': 'Corolla'}]],
 'distances': [[1.1892693042755127, 1.2542636394500732]]}

In [11]:
# Index 0 selects the hits for the first (and here only) query text.
results['documents'][0]

['Toyota RAV4: Versatile SUV, hybrid available, great for families',
 'Toyota Corolla: Affordable sedan, excellent fuel efficiency, perfect for daily commuting']

In [12]:
# Second hit (index 1) for the first query text: its document text.
results['documents'][0][1]

'Toyota Corolla: Affordable sedan, excellent fuel efficiency, perfect for daily commuting'

In [13]:
# Metadata dict at the same position (first query, index 1) as the document above.
results['metadatas'][0][1]

{'type': 'Sedan', 'price': 22000, 'model': 'Corolla'}

In [14]:
# ID at the same position (first query, index 1); the fields are index-aligned.
results['ids'][0][1]

'corolla_2024'

In [15]:
# Print a numbered summary (model, body type, price) for every hit of the
# first query. Only metadata is needed, so the loop walks the metadata list
# directly and numbers from 1, with no index arithmetic or unused document lookup.
for rank, metadata in enumerate(results['metadatas'][0], start=1):
    print(f"{rank}. {metadata['model']} ({metadata['type']})")
    # ":," adds a thousands separator, e.g. 28000 -> 28,000
    print(f"   Price: ${metadata['price']:,}\n")

1. RAV4 (SUV)
   Price: $28,000

2. Corolla (Sedan)
   Price: $22,000



In [16]:
# Fetch the collection's records with get(); no ids or filters are passed,
# and the output below lists all three stored ids.
all_docs = collection.get()

In [17]:
# IDs of the fetched records. Unlike the query() response, this is a flat list
# (no extra per-query nesting), as the output shows.
all_docs['ids']

['corolla_2024', 'rav4_2024', 'camry_2024']

In [18]:

# List every stored record with its id, model, body type and price.
print("Collection contents:\n")

# 'ids' and 'metadatas' are index-aligned, so walk them in parallel.
record_pairs = zip(all_docs['ids'], all_docs['metadatas'])
for i, (doc_id, metadata) in enumerate(record_pairs):
    print(f"{i+1}. {doc_id}")
    print(f"   Model: {metadata['model']}")
    print(f"   Type: {metadata['type']}")
    print(f"   Price: ${metadata['price']:,}\n")


Collection contents:

1. corolla_2024
   Model: Corolla
   Type: Sedan
   Price: $22,000

2. rav4_2024
   Model: RAV4
   Type: SUV
   Price: $28,000

3. camry_2024
   Model: Camry
   Type: Sedan
   Price: $26,000

