# Extract UFO JSON Data

### Source: Data.World.com
### URL: https://data.world/timothyrenner/ufo-sightings/workspace/file?filename=nuforc_reports.json

In [2]:
# Use pandas and SQLAlchemy to extract data
import pandas as pd
from sqlalchemy import create_engine
import numpy as np

In [3]:
# Establish path for extracting UFO json file
json_path = "nuforc_reports.json"


In [5]:
# Extract UFO json data into pandas dataframe using above path
ufo_df = pd.read_json(json_path, lines=True)
ufo_df.head()

Unnamed: 0,text,stats,date_time,report_link,city,state,shape,duration,summary,posted
0,My wife was driving southeast on a fairly popu...,Occurred : 12/12/2019 18:43 (Entered as : 12/...,12/12/19 18:43,http://www.nuforc.org/webreports/151/S151739.html,Chester,VA,Light,5 seconds,My wife was driving southeast on a fairly popu...,12/22/19
1,I think that I may caught a UFO on the NBC Nig...,Occurred : 3/22/2019 18:30 (Entered as : 03/2...,3/22/19 18:30,http://www.nuforc.org/webreports/145/S145297.html,Rocky Hill,CT,Circle,3-5 seconds,I think that I may caught a UFO on the NBC Nig...,3/29/19
2,I woke up late in the afternoon 3:30-4pm. I w...,Occurred : 4/1/2019 15:45 (Entered as : April...,April01.19,http://www.nuforc.org/webreports/145/S145556.html,,,,,I woke up late in the afternoon 3:30-4pm. I we...,4/12/19
3,I was driving towards the intersection of fall...,Occurred : 4/17/2019 02:00 (Entered as : 04-1...,4/17/19 02:00,http://www.nuforc.org/webreports/145/S145697.html,Ottawa (Carleton) (Canada),ON,Teardrop,10 seconds,I was driving towards the intersection of fall...,4/18/19
4,"In Peoria, Arizona, I saw a cigar shaped craft...",Occurred : 3/15/2009 18:00 (Entered as : 03/1...,3/15/09 18:00,http://www.nuforc.org/webreports/145/S145723.html,Peoria,NY,Cigar,2 minutes,"In Peoria Arizona, I saw a cigar shaped craft ...",4/18/19


# Clean UFO Data

In [7]:
new_ufo_df = ufo_df

#Remove any data rows that have any empty values
new_ufo_df.dropna(how="any", inplace=True)
new_ufo_df = new_ufo_df.fillna("", inplace=False)

#create new date column to rearrange

new_ufo_df['Updated Date'] = new_ufo_df['date_time']
new_ufo_df['Updated Date'] = new_ufo_df['Updated Date'].map(lambda x: str(x)[:-6])

new_ufo_df




Unnamed: 0,text,stats,date_time,report_link,city,state,shape,duration,summary,posted,Updated Date
0,My wife was driving southeast on a fairly popu...,Occurred : 12/12/2019 18:43 (Entered as : 12/...,12/12/19 18:43,http://www.nuforc.org/webreports/151/S151739.html,Chester,VA,Light,5 seconds,My wife was driving southeast on a fairly popu...,12/22/19,12/12/19
1,I think that I may caught a UFO on the NBC Nig...,Occurred : 3/22/2019 18:30 (Entered as : 03/2...,3/22/19 18:30,http://www.nuforc.org/webreports/145/S145297.html,Rocky Hill,CT,Circle,3-5 seconds,I think that I may caught a UFO on the NBC Nig...,3/29/19,3/22/19
3,I was driving towards the intersection of fall...,Occurred : 4/17/2019 02:00 (Entered as : 04-1...,4/17/19 02:00,http://www.nuforc.org/webreports/145/S145697.html,Ottawa (Carleton) (Canada),ON,Teardrop,10 seconds,I was driving towards the intersection of fall...,4/18/19,4/17/19
4,"In Peoria, Arizona, I saw a cigar shaped craft...",Occurred : 3/15/2009 18:00 (Entered as : 03/1...,3/15/09 18:00,http://www.nuforc.org/webreports/145/S145723.html,Peoria,NY,Cigar,2 minutes,"In Peoria Arizona, I saw a cigar shaped craft ...",4/18/19,3/15/09
5,"The object has flashing lights that are green,...",Occurred : 4/2/2019 20:25 (Entered as : 04/02...,4/2/19 20:25,http://www.nuforc.org/webreports/145/S145476.html,Kirbyville,TX,Disk,15 minutes,"The object has flashing lights that are green,...",4/8/19,4/2/19
...,...,...,...,...,...,...,...,...,...,...,...
88120,4 lights in formation over Tempe appear while ...,Occurred : 10/2/2019 20:00 (Entered as : 10/2...,10/2/19 20:00,http://www.nuforc.org/webreports/149/S149463.html,Tempe,AZ,Formation,3 minutes,4 lights in formation over Tempe appear while ...,10/4/19,10/2/19
88121,2 bright star like lights in the NNW sky two b...,Occurred : 10/2/2019 20:00 (Entered as : 10/0...,10/2/19 20:00,http://www.nuforc.org/webreports/149/S149405.html,Bolivar,MO,Light,20 seconds,"2 bright star like lights in the NNW skys, ((...",10/4/19,10/2/19
88122,10/2/19 @ 8:03PM EST UFO SIGHTING in the 3428...,Occurred : 10/2/2019 20:03 (Entered as : 10/0...,10/2/19 20:03,http://www.nuforc.org/webreports/149/S149424.html,North Port,FL,Formation,20 seconds,I just witnessed a ‘Phoenix Lights’ type of fo...,10/4/19,10/2/19
88123,"Witnessed an orange, slow moving light. Was lo...",Occurred : 10/2/2019 22:00 (Entered as : 10/0...,10/2/19 22:00,http://www.nuforc.org/webreports/149/S149447.html,Black Mountain,NC,Fireball,2 minutes,"Witnessed an orange, slow moving light. Was lo...",10/4/19,10/2/19


In [31]:
#update new date column so that it is in yyyy-mm-dd form
date_list = new_ufo_df['Updated Date'].tolist()
date_list_length = len(date_list)
new_date_list = list()
i=0

while i < (date_list_length-1):
    string = date_list[i] 
    newstr = []
    newstr.append('20')
    newstr.append(string[6])
    new_date_list.insert(i, newstr)
    i = i+1


str_new_date_list = str(new_date_list)[1:-1] 
print(str_new_date_list)

IndexError: string index out of range