In [1]:
# Import dependencies
from pymongo import MongoClient
from pprint import pprint


In [2]:
# Create an instance of MongoClient
mongo = MongoClient(port=27017)


In [3]:
# confirm that the "project_3" database is in MongoDB
print(mongo.list_database_names())

['admin', 'config', 'local', 'project_3', 'uk_food']


In [4]:
# assign the database to a variable name
db = mongo['project_3']

In [5]:
# review the collections in our database
print(db.list_collection_names())

['tsunami_data', 'earthquake_data', 'cleaned_volcanos', 'cleaned_tsunami', 'volcano_data', 'cleaned_earthquake']


In [6]:
# Assign each collection to a variable
volcano = db["volcano_data"]
earthquake = db["earthquake_data"]
tsunami = db["tsunami_data"]
cleaned_earthquake = db["cleaned_earthquake"]
cleaned_volcano = db["cleaned_volcanos"]
cleaned_tsunami = db["cleaned_tsunami"]


In [7]:
pprint(volcano.find_one())

{'_id': ObjectId('66a19ccc5a4773fdb47c0e7b'),
 'country': 'New Zealand',
 'day': 17,
 'deaths': 1,
 'deathsAmountOrder': 1,
 'deathsAmountOrderTotal': 1,
 'deathsTotal': 1,
 'elevation': 516,
 'id': 4521,
 'latitude': -29.27,
 'location': 'Kermadec Is',
 'longitude': -177.92,
 'month': 3,
 'morphology': 'Stratovolcano',
 'name': 'Raoul Island',
 'publish': False,
 'significant': True,
 'status': 'Historical',
 'timeErupt': 'D1',
 'volcanoLocationId': 40203,
 'volcanoLocationNewNum': 242030,
 'volcanoLocationNum': '0402-03=',
 'year': 2006}


In [8]:
# Select useable volcano fields from volcano collection
query = {}
fields = {'year': 1, 'month': 1, 'day': 1, 'location': 1, 'country': 1,
          'latitude': 1, 'longitude': 1, 'elevation': 1, 'morphology': 1,
          'vei': 1, 'deathsTotal': 1, 'damageAmountOrderTotal': 1,
          'housesDestroyedAmountOrderTotal': 1}
v_results = volcano.find(query, fields)
for i in range(2):
    pprint(v_results[i])

{'_id': ObjectId('66a19ccc5a4773fdb47c0e7b'),
 'country': 'New Zealand',
 'day': 17,
 'deathsTotal': 1,
 'elevation': 516,
 'latitude': -29.27,
 'location': 'Kermadec Is',
 'longitude': -177.92,
 'month': 3,
 'morphology': 'Stratovolcano',
 'year': 2006}
{'_id': ObjectId('66a19ccc5a4773fdb47c0e7c'),
 'country': 'Chile',
 'day': 2,
 'deathsTotal': 1,
 'elevation': 1122,
 'latitude': -42.833,
 'location': 'Chile-S',
 'longitude': -72.646,
 'month': 5,
 'morphology': 'Caldera',
 'year': 2008}


In [9]:
# Select useable earthquake fields from earthquake collection
query1 = {}
fields1 = {'year': 1, 'month': 1, 'day': 1, 'locationName': 1, 'country': 1,
          'latitude': 1, 'longitude': 1, 'elevation': 1, 'morphology': 1,
          'eqDepth': 1, 'eqMagnitude': 1, 'deathsTotal': 1, 'damageAmountOrderTotal': 1,
          'housesDestroyedAmountOrderTotal': 1}
e_results = earthquake.find(query1, fields1)
for i in range(2):
    pprint(e_results[i])

{'_id': ObjectId('66a19d0049e2bf6624a72644'),
 'country': 'CHINA',
 'damageAmountOrderTotal': 1,
 'day': 7,
 'eqDepth': 33,
 'eqMagnitude': 6.3,
 'housesDestroyedAmountOrderTotal': 2,
 'latitude': 26.856,
 'locationName': 'CHINA:  YUNNAN PROVINCE:  LIUKU; MYANMAR',
 'longitude': 97.238,
 'month': 6,
 'year': 2000}
{'_id': ObjectId('66a19d0049e2bf6624a72645'),
 'country': 'INDIA',
 'damageAmountOrderTotal': 1,
 'day': 3,
 'eqDepth': 33,
 'eqMagnitude': 4.6,
 'latitude': 22.132,
 'locationName': 'INDIA-BANGLADESH BORDER:  MAHESHKHALI',
 'longitude': 92.771,
 'month': 1,
 'year': 2000}


In [10]:
# Select useable tsunami fields from tsunami collection
query2 = {}
fields2 = {'year': 1, 'month': 1, 'day': 1, 'locationName': 1, 'country': 1,
          'latitude': 1, 'longitude': 1, 'elevation': 1, 'morphology': 1,
          'maxWaterHeight': 1, 'numRunups': 1, 'deathsTotal': 1, 'damageAmountOrderTotal': 1,
          'housesDestroyedAmountOrderTotal': 1}
t_results = tsunami.find(query2, fields2)
for i in range(2):
    pprint(t_results[i])

{'_id': ObjectId('66a19d12b6b79ae31b0d88f1'),
 'country': 'JAPAN',
 'damageAmountOrderTotal': 1,
 'day': 1,
 'deathsTotal': 1,
 'latitude': 34.221,
 'locationName': 'KOZU-SHIMA ISLAND, HONSHU',
 'longitude': 139.131,
 'maxWaterHeight': 0.07,
 'month': 7,
 'numRunups': 4,
 'year': 2000}
{'_id': ObjectId('66a19d12b6b79ae31b0d88f2'),
 'country': 'AUSTRALIA',
 'day': 18,
 'latitude': -13.802,
 'locationName': 'SOUTH INDIAN OCEAN',
 'longitude': 97.453,
 'maxWaterHeight': 0.3,
 'month': 6,
 'numRunups': 1,
 'year': 2000}


In [11]:
# Insert cleaned data into a new collection
cleaned_earthquake.insert_many(e_results)

InsertManyResult([ObjectId('66a19d0049e2bf6624a72644'), ObjectId('66a19d0049e2bf6624a72645'), ObjectId('66a19d0049e2bf6624a72646'), ObjectId('66a19d0049e2bf6624a72647'), ObjectId('66a19d0049e2bf6624a72648'), ObjectId('66a19d0049e2bf6624a72649'), ObjectId('66a19d0049e2bf6624a7264a'), ObjectId('66a19d0049e2bf6624a7264b'), ObjectId('66a19d0049e2bf6624a7264c'), ObjectId('66a19d0049e2bf6624a7264d'), ObjectId('66a19d0049e2bf6624a7264e'), ObjectId('66a19d0049e2bf6624a7264f'), ObjectId('66a19d0049e2bf6624a72650'), ObjectId('66a19d0049e2bf6624a72651'), ObjectId('66a19d0049e2bf6624a72652'), ObjectId('66a19d0049e2bf6624a72653'), ObjectId('66a19d0049e2bf6624a72654'), ObjectId('66a19d0049e2bf6624a72655'), ObjectId('66a19d0049e2bf6624a72656'), ObjectId('66a19d0049e2bf6624a72657'), ObjectId('66a19d0049e2bf6624a72658'), ObjectId('66a19d0049e2bf6624a72659'), ObjectId('66a19d0049e2bf6624a7265a'), ObjectId('66a19d0049e2bf6624a7265b'), ObjectId('66a19d0049e2bf6624a7265c'), ObjectId('66a19d0049e2bf6624a726

In [12]:
cleaned_volcano.insert_many(v_results)

InsertManyResult([ObjectId('66a19ccc5a4773fdb47c0e7b'), ObjectId('66a19ccc5a4773fdb47c0e7c'), ObjectId('66a19ccc5a4773fdb47c0e7d'), ObjectId('66a19ccc5a4773fdb47c0e7e'), ObjectId('66a19ccc5a4773fdb47c0e7f'), ObjectId('66a19ccc5a4773fdb47c0e80'), ObjectId('66a19ccc5a4773fdb47c0e81'), ObjectId('66a19ccc5a4773fdb47c0e82'), ObjectId('66a19ccc5a4773fdb47c0e83'), ObjectId('66a19ccc5a4773fdb47c0e84'), ObjectId('66a19ccc5a4773fdb47c0e85'), ObjectId('66a19ccc5a4773fdb47c0e86'), ObjectId('66a19ccc5a4773fdb47c0e87'), ObjectId('66a19ccc5a4773fdb47c0e88'), ObjectId('66a19ccc5a4773fdb47c0e89'), ObjectId('66a19ccc5a4773fdb47c0e8a'), ObjectId('66a19ccc5a4773fdb47c0e8b'), ObjectId('66a19ccc5a4773fdb47c0e8c'), ObjectId('66a19ccc5a4773fdb47c0e8d'), ObjectId('66a19ccc5a4773fdb47c0e8e'), ObjectId('66a19ccc5a4773fdb47c0e8f'), ObjectId('66a19ccc5a4773fdb47c0e90'), ObjectId('66a19ccc5a4773fdb47c0e91'), ObjectId('66a19ccc5a4773fdb47c0e92'), ObjectId('66a19ccc5a4773fdb47c0e93'), ObjectId('66a19ccc5a4773fdb47c0e

In [13]:
cleaned_tsunami.insert_many(t_results)

InsertManyResult([ObjectId('66a19d12b6b79ae31b0d88f1'), ObjectId('66a19d12b6b79ae31b0d88f2'), ObjectId('66a19d12b6b79ae31b0d88f3'), ObjectId('66a19d12b6b79ae31b0d88f4'), ObjectId('66a19d12b6b79ae31b0d88f5'), ObjectId('66a19d12b6b79ae31b0d88f6'), ObjectId('66a19d12b6b79ae31b0d88f7'), ObjectId('66a19d12b6b79ae31b0d88f8'), ObjectId('66a19d12b6b79ae31b0d88f9'), ObjectId('66a19d12b6b79ae31b0d88fa'), ObjectId('66a19d12b6b79ae31b0d88fb'), ObjectId('66a19d12b6b79ae31b0d88fc'), ObjectId('66a19d12b6b79ae31b0d88fd'), ObjectId('66a19d12b6b79ae31b0d88fe'), ObjectId('66a19d12b6b79ae31b0d88ff'), ObjectId('66a19d12b6b79ae31b0d8900'), ObjectId('66a19d12b6b79ae31b0d8901'), ObjectId('66a19d12b6b79ae31b0d8902'), ObjectId('66a19d12b6b79ae31b0d8903'), ObjectId('66a19d12b6b79ae31b0d8904'), ObjectId('66a19d12b6b79ae31b0d8905'), ObjectId('66a19d12b6b79ae31b0d8906'), ObjectId('66a19d12b6b79ae31b0d8907'), ObjectId('66a19d12b6b79ae31b0d8908'), ObjectId('66a19d12b6b79ae31b0d8909'), ObjectId('66a19d12b6b79ae31b0d89