Skip to content

Commit 8f24419

Browse files
committed
The starter code is ready to roll.
1 parent 7429f53 commit 8f24419

File tree

12 files changed

+477
-0
lines changed

12 files changed

+477
-0
lines changed

.gitignore

+1
Original file line numberDiff line numberDiff line change
@@ -107,3 +107,4 @@ src/07_mongoengine/service_central/.idea/modules.xml
107107
src/07_mongoengine/service_central/.idea/service_central.iml
108108
src/07_mongoengine/service_central/.idea/inspectionProfiles/profiles_settings.xml
109109
screencaster.xml
110+
.idea

src/08_perf/setup_steps.md

+16
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,16 @@
1+
This section on performance is best performed with a large database of cars and owners.
2+
3+
There is a `load_data` part of the app which will generate this database, but it takes a long time (roughly 30 minutes).
4+
5+
To make things faster, I have included a DB which can be imported in `REPO/data/dealership_db_250k.zip`
6+
7+
To use this database, you simply need to unzip it and then restore it with the following command:
8+
9+
In the terminal / command line, change into the extracted folder containing the `*.bson` and `*.json` files, then type:
10+
11+
`mongorestore --drop --db dealership ./`
12+
13+
On Windows, use `.\` rather than `./`
14+
15+
Now you should have a dealership db in MongoDB. Be sure to check the indexes. You may need to drop them (other than `_id` indexes).
16+
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
from nosql import mongo_setup
2+
from nosql.car import Car
3+
from nosql.owner import Owner
4+
5+
6+
def main():
    """Print summary statistics about the cars and owners in the database.

    Connects via ``mongo_setup.init()``, loads every ``Car`` and ``Owner``
    document into memory, and prints the totals together with the average
    number of cars per owner and service records per car.
    """
    mongo_setup.init()

    print("Computing stats, this WILL take awhile...", flush=True)

    # Every document is materialized as a list before anything is counted.
    cars = list(Car.objects())
    print("There are {:,} cars.".format(len(cars)))

    owners = list(Owner.objects())
    print("There are {:,} owners.".format(len(owners)))
    owned_cars = sum(len(o.car_ids) for o in owners)
    # Guard the division: an empty owners collection reports 0.00 instead of
    # raising ZeroDivisionError.
    cars_per_owner = owned_cars / len(owners) if owners else 0.0
    print("Each owner owns an average of {:.2f} cars.".format(cars_per_owner))

    service_histories = sum(len(c.service_history) for c in cars)
    print("There are {:,} service histories.".format(service_histories))
    # Same guard for an empty cars collection.
    records_per_car = service_histories / len(cars) if cars else 0.0
    print("Each car has an average of {:.2f} service records.".format(records_per_car))
22+
23+
24+
# Run the report only when executed as a script, so importing this module
# does not connect to the database as a side effect.
if __name__ == '__main__':
    main()
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,169 @@
1+
import nosql.mongo_setup as mongo_setup
2+
import services.car_service as car_service
3+
from nosql.car import Car
4+
from nosql.engine import Engine
5+
from nosql.owner import Owner
6+
7+
from datetime import datetime
8+
import random
9+
from faker import Faker
10+
11+
from nosql.service_record import ServiceRecord
12+
13+
14+
def main():
    """Rebuild the database with generated owners, cars, and service records.

    Drops the existing car and owner collections, creates fresh data, and
    prints how long the whole run took.
    """
    # large data DB example
    car_count = 250_000
    owner_count = 100_000

    # simple DB example
    # car_count = 200
    # owner_count = 100

    mongo_setup.init()
    clear_db()

    started_at = datetime.now()

    fake = create_faker_and_seed()

    owners = create_owners(fake, count=owner_count)
    print("Created {:,.0f} owners".format(len(owners)))

    cars = create_cars(count=car_count)
    print("Created {:,.0f} cars".format(len(cars)))

    # Linking and service records only make sense when both lists are non-empty.
    if owners and cars:
        add_cars_to_owners(owners, cars)
        create_service_records(cars, fake)

    elapsed = datetime.now() - started_at
    print("Done in {} sec".format(elapsed.total_seconds()))
39+
40+
41+
# Model names that create_cars() picks from at random.
models = [
    'Ferrari 488 GTB', 'Ferrari 360 modena', 'F430',
    '599 GTB Fiorano', '458 Italia', 'LaFerrari',
    'Testarossa', 'F12 Berlinetta', '308 GTB/GTS',
    'F355', 'California', '575M Maranello',
    'F50', 'F40', 'Enzo Ferrari',
]
58+
59+
# (description, base price) pairs; create_service_records() picks one at random
# and varies the price around the base value.
service_operations = [
    ('Oil change', 200), ('New tires', 1000),
    ('New engine', 15000), ('Body repair', 4000),
    ('New seat', 5000), ('Tune up', 1500),
    ('Air filter', 100), ('Flat tire', 200),
]
69+
70+
71+
def create_faker_and_seed():
    """Create a Faker generator and seed it and ``random`` with 42.

    Returns:
        The seeded ``Faker`` instance.
    """
    fake = Faker()
    # Calling ``fake.seed()`` on an instance raises TypeError on current Faker
    # releases; ``seed_instance`` seeds this generator's own random source.
    fake.seed_instance(42)
    random.seed(42)
    return fake
76+
77+
78+
def clear_db():
    """Drop the car and owner collections."""
    for document_type in (Car, Owner):
        document_type.drop_collection()
81+
82+
83+
def create_owners(fake, count=100):
    """Generate ``count`` owners with fake names and bulk-insert them.

    Args:
        fake: Faker instance used for names and creation dates.
        count: Number of owners to create.

    Returns:
        A list of every owner in the collection after the insert.
    """
    # Creation dates fall between 2000-01-01 and January 1st of the current year.
    earliest = datetime(year=2000, month=1, day=1)
    latest = datetime(year=datetime.now().year, month=1, day=1)

    def build_owner():
        # Name is drawn before the date so the sequence of fake calls is stable.
        new_owner = Owner()
        new_owner.name = fake.name()
        new_owner.created = fake.date_time_between_dates(
            datetime_start=earliest,
            datetime_end=latest,
            tzinfo=None,
        )
        return new_owner

    print("Building owners")
    owners = [build_owner() for _ in range(count)]

    print("Saving owners")
    Owner.objects().insert(owners, load_bulk=True)

    # Re-read from the database instead of returning the in-memory objects.
    return list(Owner.objects())
101+
102+
103+
def create_cars(count=200):
    """Top the cars collection up to ``count`` randomly generated Ferraris.

    Args:
        count: Desired total number of cars in the collection.

    Returns:
        A list of every car in the collection after the insert, or an empty
        list when the collection already holds at least ``count`` cars.
    """
    current_car_count = Car.objects().count()
    if current_car_count >= count:
        # The count is now passed to format(); previously the raw "{:,}"
        # placeholder was printed.
        print("There are currently {:,} cars. Skipping create.".format(current_car_count))
        return []

    # Only create the cars that are missing.
    count = count - current_car_count

    # Baseline engine specs; each car gets a random increase on top of these.
    hp_factor = 660
    mpg_factor = 21
    liters_factor = 4

    cars = []
    print("Building cars...")
    for _ in range(count):
        model = random.choice(models)
        make = 'Ferrari'
        year = random.randint(1985, datetime.now().year)
        mileage = random.randint(0, 150000)

        # mpg is truncated to one decimal place, liters to two.
        mpg = int((mpg_factor + mpg_factor * random.random() / 4) * 10) / 10.0
        horsepower = int(hp_factor + hp_factor * random.random() / 2)
        liters = int((liters_factor + liters_factor * random.random() / 2) * 100) / 100.0

        engine = Engine(horsepower=horsepower, liters=liters, mpg=mpg)
        car = Car(model=model, make=make, year=year, engine=engine, mileage=mileage)
        cars.append(car)

    print("Saving cars...")
    Car.objects().insert(cars)

    # Re-read from the database instead of returning the in-memory objects.
    return list(Car.objects())
135+
136+
137+
def add_cars_to_owners(owners: list, cars: list):
    """Link each owner to between zero and five randomly chosen cars.

    Cars are drawn independently with ``random.choice``, so the same car can
    be picked more than once for an owner.
    """
    for owner in owners:
        cars_to_assign = random.randint(0, 5)
        for _ in range(cars_to_assign):
            chosen_car = random.choice(cars)
            car_service.add_owner(owner.id, chosen_car.id)
143+
144+
145+
def create_service_records(cars, fake):
    """Attach zero to ten random service records to each car and save it.

    Args:
        cars: Car documents to update; each one is saved after its records
            have been appended.
        fake: Faker instance used to generate the service dates.
    """
    # Service dates fall between 2000-01-01 and January 1st of the current year.
    earliest = datetime(year=2000, month=1, day=1)
    latest = datetime(year=datetime.now().year, month=1, day=1)

    for car in cars:
        record_count = random.randint(0, 10)
        # Decided once per car: all of its ratings are either high (4-5) or low (1-3).
        is_positive = random.randint(0, 1) == 1

        for _ in range(record_count):
            description, base_price = random.choice(service_operations)

            record = ServiceRecord()
            record.description = description
            record.date = fake.date_time_between_dates(
                datetime_start=earliest,
                datetime_end=latest,
                tzinfo=None,
            )
            # Price varies by up to an eighth of the base price in either direction.
            record.price = int(base_price + (random.random() - .5) * base_price / 4)
            record.customer_rating = (
                random.randint(4, 5) if is_positive else random.randint(1, 3)
            )
            car.service_history.append(record)

        car.save()
166+
167+
168+
# Generate the data only when this file is executed as a script.
if __name__ == "__main__":
    main()
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
import uuid
2+
import mongoengine
3+
4+
from nosql.engine import Engine
5+
from nosql.service_record import ServiceRecord
6+
7+
8+
class Car(mongoengine.Document):
    """A car document stored in the ``cars`` collection of the ``core`` connection."""

    model = mongoengine.StringField(required=True)
    make = mongoengine.StringField(required=True)
    year = mongoengine.IntField(required=True)
    mileage = mongoengine.IntField(default=0)
    # Defaults to a random UUID rendered as hex digits without dashes.
    vi_number = mongoengine.StringField(default=lambda: uuid.uuid4().hex)

    # The engine and the service records are embedded inside the car document.
    engine = mongoengine.EmbeddedDocumentField(Engine, required=True)
    service_history = mongoengine.EmbeddedDocumentListField(ServiceRecord)

    # no need to reference owners here, that is entirely contained in owner class

    meta = {
        'db_alias': 'core',
        'collection': 'cars',
        'indexes': [],
    }
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,10 @@
1+
import uuid
2+
3+
import mongoengine
4+
5+
6+
class Engine(mongoengine.EmbeddedDocument):
    """Engine specification declared as an embedded document."""

    horsepower = mongoengine.IntField(required=True)
    liters = mongoengine.FloatField(required=True)
    mpg = mongoengine.FloatField(required=True)
    # Defaults to a freshly generated random UUID string.
    serial_number = mongoengine.StringField(
        default=lambda: str(uuid.uuid4()),
    )
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,9 @@
1+
import mongoengine
2+
3+
# Alias under which the database connection is registered with mongoengine.
alias_core = 'core'


def init():
    """Register the ``dealership`` database under the ``alias_core`` alias."""
    # Other connection options here (server, port, username, etc.)
    mongoengine.register_connection(alias=alias_core, name='dealership')
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
from datetime import datetime
2+
3+
import mongoengine
4+
5+
6+
class Owner(mongoengine.Document):
    """A car owner stored in the ``owners`` collection of the ``core`` connection."""

    # show off required (not available in mongo or pymongo directly)
    name = mongoengine.StringField(required=True)

    # show off default
    created = mongoengine.DateTimeField(default=datetime.now)

    # allows us to use $set and $inc
    number_of_visits = mongoengine.IntField(default=0)

    # show off many-to-many modeling with one sided list field
    # cars can have multiple owners and an owner can own multiple cars
    car_ids = mongoengine.ListField(mongoengine.ObjectIdField())

    meta = {
        'db_alias': 'core',
        'collection': 'owners',
        'indexes': [],
    }
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,9 @@
1+
import datetime
2+
import mongoengine
3+
4+
5+
class ServiceRecord(mongoengine.EmbeddedDocument):
    """A single service visit, declared as an embedded document."""

    # Defaults to the time the record is created.
    date = mongoengine.DateTimeField(default=datetime.datetime.now)
    description = mongoengine.StringField()
    price = mongoengine.FloatField(required=True)
    # 1 - 5 satisfaction level.
    customer_rating = mongoengine.IntField(required=True)

0 commit comments

Comments
 (0)