## UFO Countries that need cleaned up:

In [1]:
%%capture
import sys
DATA_PATH = '../data/'

In [2]:
# Imports:
import numpy as np
import pandas as pd
import warnings
warnings.filterwarnings('ignore')

In [3]:
# Read in my data:
data = 'https://raw.githubusercontent.com/jmmiddour/Projects/master/UFOs/ufos_countries_to_clean.csv'
ufo = pd.read_csv(data)

# Look at the first 5 rows:
ufo.head()

Unnamed: 0,Id,year,month,dow,hour,durations_in_secs,city,0,1,2,...,state,country,latitude,longitude,color,movement,elevation,sound,hoax,shape_class
0,58,1994,10,Mon,15,3600.0,Mercedies,mercedies,0,0,...,TX,0,26.149798,-97.913611,0,0,0,0,0,Non-Geometric
1,59,1994,10,Mon,18,120.0,Burnt Hills,burnt,hills,0,...,NY,USA,42.909722,-73.895556,0,0,1,0,0,Geometric
2,60,1994,10,Mon,22,5.0,Pinebergen,pinebergen,0,0,...,AR,USA,34.102778,-91.992222,0,1,1,1,0,Type of Light
3,61,1994,10,Mon,23,3600.0,Toronto (Greater Toronto Area) (Canada),toronto,(greater,toronto,...,ON,Canada,43.666667,-79.416667,0,0,0,0,0,Circular
4,62,1995,10,Tue,19,120.0,Milwaukee,milwaukee,0,0,...,WI,USA,43.038889,-87.906389,1,0,0,0,0,Other


In [4]:
# Look at all the columns in dataframe:
ufo.columns

Index(['Id', 'year', 'month', 'dow', 'hour', 'durations_in_secs', 'city', '0',
       '1', '2', '3', '4', '5', '6', '7', '8', '9', '10', 'state', 'country',
       'latitude', 'longitude', 'color', 'movement', 'elevation', 'sound',
       'hoax', 'shape_class'],
      dtype='object')

In [5]:
# Look at all country rows with 0 and 10 is not 0:
ufo[(ufo['10'] != 0) & (ufo['country'] == 0)]

# Drop column 10, no useful information:
ufo = ufo.drop(columns='10')

# Check my work:
ufo.columns

Index(['Id', 'year', 'month', 'dow', 'hour', 'durations_in_secs', 'city', '0',
       '1', '2', '3', '4', '5', '6', '7', '8', '9', 'state', 'country',
       'latitude', 'longitude', 'color', 'movement', 'elevation', 'sound',
       'hoax', 'shape_class'],
      dtype='object')

In [6]:
# Show all rows and columns:
pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)

# Look at the value counts in the 9 column:
ufo['9'].value_counts()

0            72398
of               2
woods)           2
of)              2
utsalady         1
chico)           1
n)               1
proba            1
(france)         1
c.               1
l.               1
airport)         1
10)              1
15)              1
exit)            1
i-5              1
lasal            1
osage)           1
44)              1
(mexico)         1
to)              1
miles            1
flats)           1
21)              1
i-10             1
)                1
west             1
sd               1
30)              1
5)               1
borde            1
paradise)        1
towards          1
hyw              1
to               1
s.               1
322w)            1
15               1
summit)          1
road)            1
Name: 9, dtype: int64

In [7]:
# Replace country value based on value in 9 column:
ufo.loc[ufo['9'] == '(france)', 'country'] = 'France'
ufo.loc[ufo['9'] == '(mexico)', 'country'] = 'Mexico'

# Drop column 9, no more useful information:
ufo.drop(columns='9', inplace=True)

# Check my work:
ufo['country'].value_counts()

USA            58474
0               7768
Canada          3280
UK              1733
Australia        483
Hawaii           314
Alaska           300
Germany           84
Puerto Rico        3
Mexico             1
France             1
Name: country, dtype: int64

In [8]:
# Look at the value counts of the 8 column:
ufo['8'].value_counts()

0               72348
of                  5
on                  2
(canada)            2
the                 2
of)                 1
se                  1
the)                1
ocean               1
crossing            1
bahama)             1
7                   1
highway)            1
cutoff              1
35&#44              1
&amp;               1
60449               1
island)             1
89)                 1
aprox.)             1
rapids)             1
i81)                1
2)                  1
center              1
laramie)            1
u.                  1
254)                1
(uk/england)        1
01)                 1
interstate          1
highway             1
fl)                 1
10                  1
rocky               1
737                 1
park)               1
rica)               1
memphis)            1
rt                  1
east                1
su                  1
st)                 1
north               1
denmark)            1
tayl)               1
it        

In [9]:
# Look at rows with specific values in column 8:
ufo[(ufo['8'] == '(canada)') | (ufo['8'] == 'canadian') | (ufo['8'] == 'rica)') | (ufo['8'] == '(guatamala)') | (ufo['8'] == '(ecuador)') | (ufo['8'] == 'arabia)') | (ufo['8'] == 'island)') | (ufo['8'] == '(uk/england)') | (ufo['8'] == 'bahama)') | (ufo['8'] == 'ocean') | (ufo['8'] == 'denmark)') | (ufo['8'] == 'cozumel)')]

# Change country values based on values in column 8:
ufo.loc[(ufo['8'] == 'denmark)') | (ufo['8'] == 'cozumel)'), 'country'] = 'Open Water'
ufo.loc[ufo['8'] == 'arabia)', 'country'] = 'Saudi Arabia'
ufo.loc[ufo['8'] == '(guatamala)', 'country'] = 'Guatamala'
ufo.loc[ufo['8'] == 'rica)', 'country'] = 'Costa Rica'
ufo.loc[ufo['8'] == '(ecuador)', 'country'] = 'Ecuador'

# Drop column 8, no more useful information:
ufo.drop(columns='8', inplace=True)

# Check my work:
ufo['country'].value_counts()

USA             58474
0                7762
Canada           3280
UK               1733
Australia         483
Hawaii            314
Alaska            300
Germany            84
Puerto Rico         3
Open Water          2
Ecuador             1
Mexico              1
Saudi Arabia        1
Guatamala           1
France              1
Costa Rica          1
Name: country, dtype: int64

In [10]:
# Look at the value counts of the 7 column:
ufo['7'].value_counts()

0               72225
of                  9
of)                 6
(canada)            5
hwy                 5
on                  4
miles               3
airport)            3
exit)               3
over                2
border)             2
to                  2
river)              2
from                2
the                 2
near                2
&amp;               2
west)               2
south)              2
i-80)               2
highway)            2
5)                  2
25)                 2
i-8)                2
e                   2
and                 2
road)               2
between)            1
drive)              1
hrs                 1
sacramento)         1
76                  1
locan               1
baker               1
an                  1
93)                 1
up)                 1
hill                1
westbound           1
76)                 1
area-               1
cedar               1
nw                  1
dark                1
mm77                1
was       

In [11]:
# Look at rows with specific values in column 7:
ufo[(ufo['7'] == '(canada)') | (ufo['7'] == '(uk/england)') | (ufo['7'] == '(brazil)') | (ufo['7'] == 'honolulu)') | (ufo['7'] == '(costa') | (ufo['7'] == 'ocean)') | (ufo['7'] == '(saudi') | (ufo['7'] == 'australia)') | (ufo['7'] == 'island') | (ufo['7'] == 'manitowoc)')]

# Change country values based on values in column 7:
ufo.loc[(ufo['7'] == '(canada)') & (ufo['state'] == 'NV'),  'country'] = 'Open Water'
ufo.loc[(ufo['7'] == 'honolulu)') | (ufo['7'] == 'ocean)'), 'country'] = 'Open Water'
ufo.loc[ufo['7'] == '(brazil)', 'country'] = 'Brazil'
ufo.loc[ufo['7'] == '(uk/england)', 'country'] = 'UK'

# Drop column 7, no more useful information:
ufo.drop(columns='7', inplace=True)

# Check my work:
ufo['country'].value_counts()

USA             58474
0                7758
Canada           3280
UK               1734
Australia         483
Hawaii            314
Alaska            300
Germany            84
Open Water          5
Puerto Rico         3
Ecuador             1
Mexico              1
Saudi Arabia        1
France              1
Brazil              1
Costa Rica          1
Name: country, dtype: int64

In [12]:
# Look at country and state rows with 0 and 6 is not 0:
ufo[(ufo['6'] != '0') & (ufo['country'] == '0') & (ufo['state'] == '0')]

Unnamed: 0,Id,year,month,dow,hour,durations_in_secs,city,0,1,2,3,4,5,6,state,country,latitude,longitude,color,movement,elevation,sound,hoax,shape_class
1485,1905,1994,10,Sat,22,120.0,Bry Sur Marne (Near Paris) (France),bry,sur,marne,,(near,paris),(france),0,0,48.834913,2.523649,1,0,0,0,0,Other
1576,1999,2000,10,Sun,1,45.0,Los Americas (Laguna Park 1 Hotel) (Tenerife),los,americas,(laguna,park,1,hotel),(tenerife),0,0,4.52572,-75.6976,0,1,0,0,0,Circular
3885,4447,1995,10,Wed,22,3.0,Sandals Royal Jamaican Resort&#44 Montego Bay ...,sandals,royal,jamaican,resort&#44,montego,bay,(jamaica),0,0,18.466667,-77.916667,1,1,0,1,0,Geometric
8325,9187,2008,11,Fri,19,10.0,Aland Islands (Forty Miles South Of) (Finland),aland,islands,(forty,miles,south,of),(finland),0,0,60.178525,19.91561,0,1,0,0,0,Type of Light
16173,17582,2012,1,Sat,3,600.0,El Tanque De La Fortuna (Costa Rica),el,tanque,de,la,fortuna,(costa,rica),0,0,10.477465,-84.580681,1,0,1,0,0,Other
18496,20033,2007,12,Sun,4,3600.0,San Jose Del Cabo (Baja California) (Mexico),san,jose,del,cabo,(baja,california),(mexico),0,0,23.063656,-109.702438,0,1,1,0,0,Other
19800,21394,2012,12,Sun,19,600.0,Suwon (30 Miles South Of) (South Korea),suwon,(30,miles,south,of),(south,korea),0,0,37.263573,127.028601,0,1,0,0,0,Type of Light
20577,22202,2002,12,Wed,1,600.0,Monterrey (Mexico) (Outside City&#44 On Large ...,monterrey,(mexico),(outside,city&#44,on,large,highway),0,0,25.686614,-100.316113,0,0,0,0,0,Other
21260,22908,2003,1,Sun,19,30.0,Dun Laoghaire (County Dublin (Republic Of Irel...,dun,laoghaire,(county,dublin,(republic,of,ireland),0,0,53.29279,-6.141937,1,1,0,0,0,Type of Light
28695,30729,2009,3,Sun,22,3600.0,Iraq (Above A U. S. Military Camp),iraq,(above,a,u.,s.,military,camp),0,0,33.223191,43.679291,0,1,0,1,0,Geometric


In [13]:
# Look at country and state rows with 0 and 5 is not 0:
ufo[(ufo['5'] != '0') & (ufo['country'] == '0') & (ufo['state'] == '0')]

Unnamed: 0,Id,year,month,dow,hour,durations_in_secs,city,0,1,2,3,4,5,6,state,country,latitude,longitude,color,movement,elevation,sound,hoax,shape_class
821,1028,2000,10,Thr,11,7620.0,La Serena (Vi&Ntilde;A Del Mar) (Chile),la,serena,(vi&ntilde;a,del,mar),(chile),0,0,0,-29.906301,-71.250204,0,0,1,0,0,Multiple
1270,1496,1998,10,Wed,1,300.0,South Eastern Coast (Republic Of Ireland),south,eastern,coast,(republic,of,ireland),0,0,0,22.564254,114.229432,0,1,1,0,0,Geometric
1485,1905,1994,10,Sat,22,120.0,Bry Sur Marne (Near Paris) (France),bry,sur,marne,,(near,paris),(france),0,0,48.834913,2.523649,1,0,0,0,0,Other
1576,1999,2000,10,Sun,1,45.0,Los Americas (Laguna Park 1 Hotel) (Tenerife),los,americas,(laguna,park,1,hotel),(tenerife),0,0,4.52572,-75.6976,0,1,0,0,0,Circular
3885,4447,1995,10,Wed,22,3.0,Sandals Royal Jamaican Resort&#44 Montego Bay ...,sandals,royal,jamaican,resort&#44,montego,bay,(jamaica),0,0,18.466667,-77.916667,1,1,0,1,0,Geometric
3975,4540,2008,10,Sat,19,900.0,San Jose Del Cabo (Baja&#44 Mexico),san,jose,del,cabo,(baja&#44,mexico),0,0,0,23.063656,-109.702438,1,1,0,0,0,Type of Light
4183,4752,2008,10,Sun,20,240.0,Buenos Aires (Almagro Pale&#44 Belgrano) (Brazil),buenos,aires,(almagro,pale&#44,belgrano),(brazil),0,0,0,-34.603723,-58.381593,0,0,0,0,0,Circular
5841,6506,2007,10,Fri,9,20.0,St. Helier (Jersey Channel Islands) (Uk/England),st.,helier,(jersey,channel,islands),(uk/england),0,0,0,49.186823,-2.106568,0,1,0,0,0,Type of Light
7164,7925,2002,11,Mon,3,72.0,Paris Airport (Near Open Field) (France),paris,airport,(near,open,field),(france),0,0,0,35.296832,-93.685778,0,1,0,0,0,Circular
7348,8179,1997,11,Sat,23,15.0,Hua Hin&#44 Prachuap Kirikan (Thailand) (Near),hua,hin&#44,prachuap,kirikan,(thailand),(near),0,0,0,12.568375,99.957689,0,0,1,0,0,Geometric


In [14]:
# Look at country and state rows with 0 and 4 is not 0:
ufo[(ufo['4'] != '0') & (ufo['country'] == '0') & (ufo['state'] == '0')]

Unnamed: 0,Id,year,month,dow,hour,durations_in_secs,city,0,1,2,3,4,5,6,state,country,latitude,longitude,color,movement,elevation,sound,hoax,shape_class
821,1028,2000,10,Thr,11,7620.0,La Serena (Vi&Ntilde;A Del Mar) (Chile),la,serena,(vi&ntilde;a,del,mar),(chile),0,0,0,-29.906301,-71.250204,0,0,1,0,0,Multiple
1270,1496,1998,10,Wed,1,300.0,South Eastern Coast (Republic Of Ireland),south,eastern,coast,(republic,of,ireland),0,0,0,22.564254,114.229432,0,1,1,0,0,Geometric
1323,1549,2002,10,Mon,19,300.0,Cagayan De Oro City (Philippines),cagayan,de,oro,city,(philippines),0,0,0,0,8.454236,124.631898,0,0,0,0,0,Circular
1485,1905,1994,10,Sat,22,120.0,Bry Sur Marne (Near Paris) (France),bry,sur,marne,,(near,paris),(france),0,0,48.834913,2.523649,1,0,0,0,0,Other
1576,1999,2000,10,Sun,1,45.0,Los Americas (Laguna Park 1 Hotel) (Tenerife),los,americas,(laguna,park,1,hotel),(tenerife),0,0,4.52572,-75.6976,0,1,0,0,0,Circular
3026,3540,2011,10,Fri,22,120.0,San Jose Del Cabo (Mexico),san,jose,del,cabo,(mexico),0,0,0,0,23.063656,-109.702438,0,0,0,0,0,Type of Light
3885,4447,1995,10,Wed,22,3.0,Sandals Royal Jamaican Resort&#44 Montego Bay ...,sandals,royal,jamaican,resort&#44,montego,bay,(jamaica),0,0,18.466667,-77.916667,1,1,0,1,0,Geometric
3975,4540,2008,10,Sat,19,900.0,San Jose Del Cabo (Baja&#44 Mexico),san,jose,del,cabo,(baja&#44,mexico),0,0,0,23.063656,-109.702438,1,1,0,0,0,Type of Light
4183,4752,2008,10,Sun,20,240.0,Buenos Aires (Almagro Pale&#44 Belgrano) (Brazil),buenos,aires,(almagro,pale&#44,belgrano),(brazil),0,0,0,-34.603723,-58.381593,0,0,0,0,0,Circular
5841,6506,2007,10,Fri,9,20.0,St. Helier (Jersey Channel Islands) (Uk/England),st.,helier,(jersey,channel,islands),(uk/england),0,0,0,49.186823,-2.106568,0,1,0,0,0,Type of Light


In [15]:
# Look at country state rows with 0 and 3 is not 0:
ufo[(ufo['3'] != '0') & (ufo['country'] == '0') & (ufo['state'] == '0')]

Unnamed: 0,Id,year,month,dow,hour,durations_in_secs,city,0,1,2,3,4,5,6,state,country,latitude,longitude,color,movement,elevation,sound,hoax,shape_class
7,65,1996,10,Thr,20,300.0,Lake Macquarie (Nsw&#44 Australia),lake,macquarie,(nsw&#44,australia),0,0,0,0,0,-33.093373,151.588982,1,0,0,0,0,Type of Light
67,125,2003,10,Fri,23,2700.0,Bickerton (Near Wetherby) (Uk/England),bickerton,(near,wetherby),(uk/england),0,0,0,0,0,53.070884,-2.736506,1,1,0,0,0,Other
738,930,2011,10,Sat,17,180.0,Carrieres Sous Poissy (France),carrieres,sous,poissy,(france),0,0,0,0,0,48.945484,2.037356,1,1,1,1,0,Non-Geometric
821,1028,2000,10,Thr,11,7620.0,La Serena (Vi&Ntilde;A Del Mar) (Chile),la,serena,(vi&ntilde;a,del,mar),(chile),0,0,0,-29.906301,-71.250204,0,0,1,0,0,Multiple
835,1042,2001,10,Fri,19,2.0,Sainte-Suzanne (Near Switzerland) (France),sainte-suzanne,(near,switzerland),(france),0,0,0,0,0,48.097456,-0.349277,1,0,0,0,0,Other
1270,1496,1998,10,Wed,1,300.0,South Eastern Coast (Republic Of Ireland),south,eastern,coast,(republic,of,ireland),0,0,0,22.564254,114.229432,0,1,1,0,0,Geometric
1323,1549,2002,10,Mon,19,300.0,Cagayan De Oro City (Philippines),cagayan,de,oro,city,(philippines),0,0,0,0,8.454236,124.631898,0,0,0,0,0,Circular
1485,1905,1994,10,Sat,22,120.0,Bry Sur Marne (Near Paris) (France),bry,sur,marne,,(near,paris),(france),0,0,48.834913,2.523649,1,0,0,0,0,Other
1500,1920,1995,10,Sun,23,15.0,Split (In Former Yugoslavia),split,(in,former,yugoslavia),0,0,0,0,0,43.508132,16.440193,0,0,0,0,0,Type of Light
1576,1999,2000,10,Sun,1,45.0,Los Americas (Laguna Park 1 Hotel) (Tenerife),los,americas,(laguna,park,1,hotel),(tenerife),0,0,4.52572,-75.6976,0,1,0,0,0,Circular


In [16]:
# Look at country and state rows with 0 and 2 is not 0:
ufo[(ufo['2'] != '0') & (ufo['country'] == '0') & (ufo['state'] == '0')]

Unnamed: 0,Id,year,month,dow,hour,durations_in_secs,city,0,1,2,3,4,5,6,state,country,latitude,longitude,color,movement,elevation,sound,hoax,shape_class
7,65,1996,10,Thr,20,300.0,Lake Macquarie (Nsw&#44 Australia),lake,macquarie,(nsw&#44,australia),0,0,0,0,0,-33.093373,151.588982,1,0,0,0,0,Type of Light
67,125,2003,10,Fri,23,2700.0,Bickerton (Near Wetherby) (Uk/England),bickerton,(near,wetherby),(uk/england),0,0,0,0,0,53.070884,-2.736506,1,1,0,0,0,Other
286,352,2004,10,Mon,10,1200.0,Nuevo Laredo (Mexico),nuevo,laredo,(mexico),0,0,0,0,0,0,27.477936,-99.549573,1,1,0,0,0,Type of Light
480,671,2000,10,Sun,13,900.0,Yangtzee River (China),yangtzee,river,(china),0,0,0,0,0,0,31.84694,120.872862,0,0,0,0,0,Circular
491,682,2000,10,Sun,22,40.0,Healesville. Victoria (Australia),healesville.,victoria,(australia),0,0,0,0,0,0,-37.653829,145.517006,0,0,0,0,0,Type of Light
677,869,2008,10,Wed,0,300.0,Kuala Lumpur (Malaysia),kuala,lumpur,(malaysia),0,0,0,0,0,0,3.139003,101.686855,1,0,0,0,0,Circular
738,930,2011,10,Sat,17,180.0,Carrieres Sous Poissy (France),carrieres,sous,poissy,(france),0,0,0,0,0,48.945484,2.037356,1,1,1,1,0,Non-Geometric
821,1028,2000,10,Thr,11,7620.0,La Serena (Vi&Ntilde;A Del Mar) (Chile),la,serena,(vi&ntilde;a,del,mar),(chile),0,0,0,-29.906301,-71.250204,0,0,1,0,0,Multiple
829,1036,2000,10,Thr,20,600.0,Brixham&#44 Devon (Uk/England),brixham&#44,devon,(uk/england),0,0,0,0,0,0,50.39514,-3.513924,0,1,1,0,0,Type of Light
835,1042,2001,10,Fri,19,2.0,Sainte-Suzanne (Near Switzerland) (France),sainte-suzanne,(near,switzerland),(france),0,0,0,0,0,48.097456,-0.349277,1,0,0,0,0,Other


In [17]:
# Create lists for each country value that needs to be replaced:
Afghanistan = [43626, 49146]
Africa = [58666, 8407, 28509, 29077, 35682, 37338, 42215, 53767, 64707, 2090, 2349, 7885, 9757, 9765, 11293, 
          15350, 16229, 17875, 18045, 19022, 23699, 21845, 25255, 25404, 25971, 27275, 28264, 30457, 30849, 
          31662, 31982, 32160, 35052, 32322, 40880, 42882, 52543, 62745, 64290, 70762, 70766, 2346, 2347, 
          2791, 3477, 4275, 6261, 7781, 10002, 10244, 13337, 17517, 18254, 18725, 18841, 18969, 19791, 19897, 
          20075, 21863, 22401, 24522, 25401, 25489, 25636, 27191, 28766, 31450, 33944, 34626, 34648, 34850, 
          35010, 35197, 35761, 35847, 36750, 38465, 41848, 41910, 41923, 41924, 42784, 42815, 47239, 47285, 
          47462, 48795, 49035, 49631, 54162, 56598, 61391, 62800, 66250, 66375, 67669, 68371, 68623, 69286, 
          69533, 70503, 70763]
Antarctica = [39507]
Argentina = [12522, 15493, 18456, 58462, 3495, 13170, 22996, 26598, 28461, 37374, 37830, 39563, 39635, 
             46997]
Australia = [7, 7817, 10268, 11434, 13489, 16043, 19723, 19852, 34492, 40126, 59703, 64791, 66824, 40824, 
             491, 2960, 8448, 9839, 9879, 11932, 12467, 13554, 19905, 20727, 20946, 21347, 22807, 23732, 24036, 
             24772, 27920, 28462, 29432, 31184, 37534, 37545, 39453, 41118, 41573, 41813, 42506, 46213, 47786, 
             47790, 47798, 52568, 60079, 66413, 69235, 70587]
Bahamas = [49401, 47080, 48121, 54700, 62661]
Bahrain = [40105]
Barbados = [9796]
Belarus = [20208]
Belgium = [54061, 26852, 40864, 26428, 45467, 51055, 16556, 50855]
Belize = [35240, 4766, 31413]
Bolivia = [31384]
Brazil = [33358, 52168, 57630, 4183, 31606, 14078, 47955, 15001, 15858, 17761, 23029, 27863, 29474, 
          32412, 36524, 40075, 41287, 53312, 46966, 7240, 14775, 14777, 15349, 17021, 17031, 18600, 19940, 
          27325, 31134, 32277, 35408, 42702, 43075, 45645, 57496, 67651, 69264]
BritishVI = [25585, 26354, 12236, 12817, 45490]
Brunei = [28237, 31649, 10064]
Bulgaria = [44212]
Cambodia = [29519]
Canada = [67951]
Caribbean = [16748]
Chile = [821, 21980, 40618, 48144]
China = [51796, 19469, 19544, 62637, 480, 1558, 7196, 10180, 15540, 28253, 28452, 40775, 48078, 51207, 
         66700]
Colombia = [17834, 44328, 19839]
CostaRica = [16173, 21748, 7506, 30200, 65690, 2513, 6344, 15340, 18631, 23412, 27022, 34090, 37671, 
             46253, 70730]
Croatia = [61029, 66688, 47141, 60279, 71052]
Cuba = [10872, 17332, 47950]
Cyprus = [3511, 37950]
CzechRep = [18375, 32882]
Denmark = [39278, 23047, 25520]
DomRep = [35685, 19436, 34798, 3206, 21045, 45286]
EastTimor = [35383]
Ecuador = [62353, 50117]
Egypt = [13935, 36743, 68163]
ElSalvador = [23663]
Finland = [8325, 22799, 37384]
France = [1485, 7164, 59332, 59547, 65071, 69834, 738, 835, 7193, 29791, 34221, 43243, 50295, 64394, 
          71569, 8949, 17809, 19760, 39902, 42609, 44423]
Germany = [16004, 44774, 19261, 32697]
Greece = [52880, 60767, 71461, 44466, 47035, 52425, 58441, 59226, 60419, 61235, 68406, 69345]
Grenadine = [9878]
Guatamala = [17308, 22930, 65447]
Guyana = [25867]
Honduras = [2595, 69197, 57730]
Hungary = [31547]
InSpace = [68126, 15459, 32480, 43589, 48479]
India = [10053, 18916, 28740, 40956, 41809, 65411, 5338, 5911, 11441, 29224, 54056, 64849, 2879, 3075, 
         4211, 4466, 5421, 7971, 11614, 12094, 12383, 12651, 18907, 20353, 32831, 33923, 34358, 36939, 38590, 
         41743, 52642, 54200, 59483, 59992, 65375, 66581, 68374, 70140]
Indonesia = [4048, 11343, 17546]
Ireland = [21260, 1270, 52349, 64807, 67137, 10133, 16808, 16827, 26215, 32405, 48053, 65753, 2452, 3098, 
           3884, 7397, 8610, 11160, 18625, 21558, 24462, 26301, 31251, 37905, 27490, 32734, 50096, 63428, 
           64260, 65140, 67233, 10059, 12057, 14014, 16345, 19946, 24662, 29652, 32445, 33137, 39350, 51840, 
           52631, 58879, 68776, 68778]
Israel = [62780, 6339, 7810, 15351, 16875, 27801, 29729, 34305, 38598, 41077, 43502, 43829, 52962, 56904, 
          60630, 64347, 65560]
Iraq = [28695, 35622, 59741, 34558, 51359, 16042, 16923, 20339, 44940]
Italy = [52148, 61356, 61825, 38361, 51195, 27407, 40295, 48155, 53552, 60703]
Jamaica = [3885, 16412, 16868, 27057]
Japan = [16882, 16284, 68357, 15063, 23088, 39882, 48236, 57677]
Korea = [19800, 2565, 11486, 61779, 71676, 5711, 5944, 10851, 12131, 22639, 23430, 24189, 25641, 71070]
Kosovo = [47811]
Kuwait = [4773, 53397, 24682]
Lebanon = [17797, 52469]
Luxembourg = [13796, 24203]
Malaysia = [38226, 27773, 41115, 677, 4463, 5771, 6348, 13074, 14242, 14494, 18048, 19384, 21071, 21078, 
            21129, 22458, 24091, 24556, 25964, 34463, 38225, 40567, 42050, 43470, 44734, 46654, 53408, 58113, 
            61905, 66648, 68350, 68787]
Maldives = [36527]
Malta = [57774, 22755, 23494, 52607]
Mexico = [67032, 52407, 18496, 20577, 41982, 3975, 14796, 29072, 29418, 36754, 56892, 3026, 8444, 
          9482, 11344, 21781, 24603, 32654, 33916, 43016, 44447, 61850, 68333, 51719, 12966, 15113, 16060, 
          17502, 19903, 20861, 25994, 27472, 28145, 29556, 29618, 30107, 30144, 28276, 32743, 33291, 34446, 
          35765, 36134, 37137, 38437, 42973, 46268, 48899, 43687, 50495, 56888, 58456, 61526, 62848, 67588, 
          67964, 286, 3479, 4044, 8505, 9004, 9997, 10041, 10083, 10513, 10518, 10750, 11420, 11668, 12237, 
          14325, 15060, 16187, 17076, 18120, 18444, 20544, 21433, 23169, 24131, 24299, 24567, 25984, 27239, 
          27977, 28166, 28174, 29153, 29209, 30370, 30443, 31446, 32109, 32110, 32400, 32548, 33456, 35298, 
          36450, 38097, 38098, 38848, 39522, 39739, 39961, 40230, 43060, 44761, 46077, 46186, 47265, 47322, 
          52506, 58674, 59904, 60527, 61894, 66098, 69018, 71290]
Mongolia = [58192, 70868]
Myanmar = [8970]
Netherlands = [44712, 14337, 38036, 67230, 27209, 40607, 48082, 62704, 72303, 10185, 10867, 24673, 28953, 
               33039, 36741, 38691, 39389, 43832, 50369, 53375, 53799, 59774, 61772, 63254, 63780, 71295]
NewZealand = [25794, 14585, 27755, 31730, 20938, 21844, 23958, 24312, 24582, 27666, 28485, 46304, 54014, 
              1150, 2262, 7873, 8559, 9179, 9866, 13125, 13610, 13744, 14841, 15538, 15912, 16767, 17323, 17963, 
              18708, 18965, 19185, 19238, 21513, 22680, 23140, 26631, 27297, 27298, 28175, 28513, 28640, 28744, 
              28902, 29356, 29664, 30828, 31081, 31437, 34240, 34312, 34907, 39909, 42269, 42706, 42994, 43555, 
              43693, 43907, 46468, 46682, 48100, 50602, 52366, 52635, 53597, 53893, 55102, 56570, 57558, 57908,
              61250, 61939, 62177, 62376, 67288, 67454, 68647, 69296]
Nigeria = [36190]
Norway = [33427, 47877]
Oman = [48206]
OpenWater = [40044, 72008, 72240, 48326, 48390, 56749, 59284, 3161, 3311, 15470, 17390, 
             24254, 29031, 29032, 29134, 40098, 48195, 60991, 5291, 12028, 17114, 29437, 32626, 
             37020, 37347, 39491, 39521, 41282, 59765, 44861, 62670, 63355, 66689, 16444, 17566, 
             19772, 20960, 36139, 38089, 43231, 63487, 68659]
Pakistan = [35614, 4328, 45135]
Panama = [29396, 17653, 61445, 43235]
PapuaNewGuinea = [50243]
Peru = [57697]
Philippines = [1323, 39674, 17409, 29935, 39151, 42931, 47612, 10098, 14863, 24575, 26093, 28583, 29792, 
               35743, 35774, 37212, 38062, 38363, 47373, 54632, 57399, 58806, 66514]
Poland = [61691, 43976, 52378]
Portugal = [43562, 8051, 16866, 24643, 37003, 46487, 9949, 38439]
PR = [46002, 16237, 44849, 59395, 3202, 10267, 12490]
Romania = [39471, 6684, 41574, 58390]
Russia = [37812, 48103, 53877]
SaudiArabia = [71033, 54536, 11885, 23381, 62688]
Slovakia = [5248, 10270, 57451]
Slovenia = [50544]
Spain = [1576, 27342, 42302, 42468, 13181, 34552, 44367, 51192, 5610, 21417, 33450, 33562, 41988, 46738, 
         51513, 51706, 51933, 54786, 63049, 60638, 4886, 16332, 21063, 22104, 39545, 46480, 49650, 52245, 
         63496, 63510, 67836]
SriLanka = [13933, 18199, 20576, 25084, 25326, 28876, 32894, 41567, 44304, 44798, 49186, 49386, 49387]
Sweden = [65683, 18391, 70093]
Switzerland = [31170, 32450]
Taiwan = [60318]
Thailand = [7348, 19139, 30852, 8041, 997, 2619, 5921, 5922, 8085, 10497, 22361, 32825, 44933, 55538, 65573]
Trinidad = [10167, 31063, 35741]
Turkey = [13088, 66857]
UAE = [38491, 46017, 4045, 10849, 14575, 25529, 26867, 42831, 59879, 12317, 17234, 22549, 32464]
Ukraine = [22007, 54446]
UK = [5841, 8746, 10006, 11135, 22065, 22741, 30053, 40987, 56914, 6929, 30882, 31033, 53161, 
      53730, 58741, 60695, 64446, 65997, 66194, 70433, 69469, 67, 2081, 2941, 4066, 4261, 6215, 7016, 7902, 
      8418, 8428, 8503, 15072, 15508, 15527, 15635, 15382, 15881, 16196, 16272, 16833, 17925, 18292, 23463, 
      24159, 22400, 24367, 27075, 28517, 31546, 32033, 32034, 33224, 34135, 34524, 37932, 37615, 38131, 
      40397, 43583, 43607, 48088, 48156, 48778, 49265, 49715, 53522, 56865, 58271, 60656, 61321, 60540, 
      61534, 63348, 63537, 63895, 64395, 64560, 65477, 67685, 69881, 70090, 71330, 69434, 829, 1528, 1608, 
      1972, 1975, 2080, 2217, 3176, 3355, 3517, 3743, 3782, 3812, 4830, 5082, 5492, 6208, 6577, 6799, 6821, 
      6946, 7131, 7821, 8058, 8094, 8320, 8330, 8459, 9358, 9524, 9983, 10139, 10433, 11230, 11258, 11566, 
      12189, 12249, 12470, 12738, 13477, 13728, 13735, 13972, 14276, 14291, 15572, 16052, 16095, 16124, 
      16441, 16871, 16897, 17664, 18348, 18697, 18920, 18936, 18939, 19247, 20273, 20966, 21491, 22534, 
      22699, 23138, 23242, 23404, 23445, 23451, 23545, 23778, 24337, 24666, 25166, 25503, 25762, 25774, 
      27009, 28404, 28888, 29056, 29701, 29722, 30033, 30219, 30241, 30338, 30670, 31800, 32138, 32305, 
      32815, 32869, 33383, 33730, 34179, 34437, 34667, 35129, 35452, 35846, 36077, 36989, 37483, 37639, 
      37711, 37898, 38797, 39062, 39873, 39923, 39969, 40450, 40451, 41151, 41160, 41757, 42020, 42438, 
      43080, 44075, 44297, 45330, 46618, 47101, 47144, 47517, 47642, 47770, 47949, 48014, 48212, 48394, 
      48544, 49445, 49570, 51077, 51546, 51902, 51990, 53664, 53746, 53849, 54124, 54288, 54758, 54907, 
      55017, 55189, 57097, 57186, 58443, 59266, 59503, 59620, 60094, 60432, 60535, 60759, 61721, 62841, 
      63028, 63228, 63249, 63413, 63508, 64211, 64450, 65181, 65494, 65751, 66431, 66797, 66881, 66887, 
      68155, 68465, 68487, 69762, 70074, 70262, 72034]
Uruguay = [44634]
USA = [18334, 20432, 32628, 34679, 65731, 67784, 8041, 20312, 27449, 35746, 53307, 53940, 12445, 13562, 
       13626, 32427]
Venezuela = [50356, 9863, 30652, 1777, 15893, 18866, 20853, 48993, 70280]
VietNam = [56977, 31232]
Yugoslavia = [1500]
Zimbabwe = [67395]

# Replace country value for some rows based on values in new columns split from city column:
ufo.loc[Afghanistan, 'country'] = 'Afghanistan'
ufo.loc[Africa, 'country'] = 'Africa'
ufo.loc[Antarctica, 'country'] = 'Antarctica'
ufo.loc[Argentina, 'country'] = 'Argentina'
ufo.loc[Australia, 'country'] = 'Australia'
ufo.loc[Bahamas, 'country'] = 'Bahamas'
ufo.loc[Bahrain, 'country'] = 'Bahrain'
ufo.loc[Belarus, 'country'] = 'Europe'
ufo.loc[Bulgaria, 'country'] = 'Europe'
ufo.loc[Belgium, 'country'] = 'Belgium'
ufo.loc[Belize, 'country'] = 'Belize'
ufo.loc[Bolivia, 'country'] = 'Bolivia'
ufo.loc[Brazil, 'country'] = 'Brazil'
ufo.loc[BritishVI, 'country'] = 'British VI'
ufo.loc[Brunei, 'country'] = 'Brunei'
ufo.loc[Cambodia, 'country'] = 'Asia'
ufo.loc[Canada, 'country'] = 'Canada'
ufo.loc[Barbados, 'country'] = 'Caribbean'
ufo.loc[Caribbean, 'country'] = 'Caribbean'
ufo.loc[Chile, 'country'] = 'Chile'
ufo.loc[China, 'country'] = 'China'
ufo.loc[Colombia, 'country'] = 'Colombia'
ufo.loc[CostaRica, 'country'] = 'Costa Rica'
ufo.loc[Croatia, 'country'] = 'Croatia'
ufo.loc[Cuba, 'country'] = 'Cuba'
ufo.loc[Cyprus, 'country'] = 'Cyprus'
ufo.loc[CzechRep, 'country'] = 'Czech Republic'
ufo.loc[Denmark, 'country'] = 'Denmark'
ufo.loc[DomRep, 'country'] = 'Dominican Republic'
ufo.loc[EastTimor, 'country'] = 'East Timor'
ufo.loc[Ecuador, 'country'] = 'Ecuador'
ufo.loc[Egypt, 'country'] = 'Egypt'
ufo.loc[ElSalvador, 'country'] = 'El Salvador'
ufo.loc[Finland, 'country'] = 'Finland'
ufo.loc[France, 'country'] = 'France'
ufo.loc[Germany, 'country'] = 'Germany'
ufo.loc[Greece, 'country'] = 'Greece'
ufo.loc[Grenadine, 'country'] = 'Grenadine Island'
ufo.loc[Guatamala, 'country'] = 'Guatamala'
ufo.loc[Guyana, 'country'] = 'Guyana'
ufo.loc[Honduras, 'country'] = 'Honduras'
ufo.loc[Hungary, 'country'] = 'Hungary'
ufo.loc[InSpace, 'country'] = 'In Space'
ufo.loc[India, 'country'] = 'India'
ufo.loc[Indonesia, 'country'] = 'Indonesia'
ufo.loc[Iraq, 'country'] = 'Iraq'
ufo.loc[Ireland, 'country'] = 'Ireland'
ufo.loc[Israel, 'country'] = 'Israel'
ufo.loc[Italy, 'country'] = 'Italy'
ufo.loc[Jamaica, 'country'] = 'Jamaica'
ufo.loc[Japan, 'country'] = 'Japan'
ufo.loc[Korea, 'country'] = 'Korea'
ufo.loc[Kosovo, 'country'] = 'Kosovo'
ufo.loc[Kuwait, 'country'] = 'Kuwait'
ufo.loc[Lebanon, 'country'] = 'Lebanon'
ufo.loc[Luxembourg, 'country'] = 'Luxembourg'
ufo.loc[Malaysia, 'country'] = 'Malaysia'
ufo.loc[Maldives, 'country'] = 'Maldives'
ufo.loc[Malta, 'country'] = 'Malta'
ufo.loc[Mexico, 'country'] = 'Mexico'
ufo.loc[Mongolia, 'country'] = 'Mongolia'
ufo.loc[Myanmar, 'country'] = 'Myanmar'
ufo.loc[Netherlands, 'country'] = 'Netherlands'
ufo.loc[NewZealand, 'country'] = 'New Zealand'
ufo.loc[Nigeria, 'country'] = 'Nigeria'
ufo.loc[Norway, 'country'] = 'Norway'
ufo.loc[Oman, 'country'] = 'Oman'
ufo.loc[OpenWater, 'country'] = 'Open Water'
ufo.loc[Pakistan, 'country'] = 'Pakistan'
ufo.loc[Panama, 'country'] = 'Panama'
ufo.loc[PapuaNewGuinea, 'country'] = 'Papua - New Guinea'
ufo.loc[Peru, 'country'] = 'Peru'
ufo.loc[Philippines, 'country'] = 'Philippines'
ufo.loc[Poland, 'country'] = 'Poland'
ufo.loc[Portugal, 'country'] = 'Portugal'
ufo.loc[PR, 'country'] = 'Puerto Rico'
ufo.loc[Romania, 'country'] = 'Romania'
ufo.loc[Russia, 'country'] = 'Russia'
ufo.loc[SaudiArabia, 'country'] = 'Saudi Arabia'
ufo.loc[Slovakia, 'country'] = 'Slovakia'
ufo.loc[Slovenia, 'country'] = 'Slovenia'
ufo.loc[Spain, 'country'] = 'Spain'
ufo.loc[SriLanka, 'country'] = 'Sri Lanka'
ufo.loc[Sweden, 'country'] = 'Sweden'
ufo.loc[Switzerland, 'country'] = 'Switzerland'
ufo.loc[Taiwan, 'country'] = 'Taiwan'
ufo.loc[Thailand, 'country'] = 'Thailand'
ufo.loc[Trinidad, 'country'] = 'Trinidad'
ufo.loc[Turkey, 'country'] = 'Turkey'
ufo.loc[UAE, 'country'] = 'UAE'
ufo.loc[Ukraine, 'country'] = 'Ukraine'
ufo.loc[UK, 'country'] = 'UK'
ufo.loc[Uruguay, 'country'] = 'Uruguay'
ufo.loc[USA, 'country'] = 'USA'
ufo.loc[Venezuela, 'country'] = 'Venezuela'
ufo.loc[VietNam, 'country'] = 'Viet Nam'
ufo.loc[Yugoslavia, 'country'] = 'Yugoslavia'
ufo.loc[Zimbabwe, 'country'] = 'Zimbabwe'


# Drop split columns with no more useful information:
ufo = ufo.drop(columns=['2', '3', '4', '5', '6'])

# Check my work:
ufo['country'].value_counts(sort=False)

Ukraine                   2
Denmark                   3
Pakistan                  3
Hawaii                  314
Costa Rica               16
Uruguay                   1
Alaska                  300
Portugal                  8
Russia                    3
Australia               533
Netherlands              26
Switzerland               2
Maldives                  1
Brazil                   38
East Timor                1
Antarctica                1
Luxembourg                2
Oman                      1
Egypt                     3
Lebanon                   2
Slovakia                  3
Trinidad                  3
Yugoslavia                1
France                   22
Panama                    4
Nigeria                   1
Ireland                  46
Taiwan                    1
Sweden                    3
British VI                5
Africa                  103
Open Water               47
UAE                      13
India                    38
Mongolia                  2
Finland             

In [18]:
# Change all country = 0 to USA if the state does not = 0:
ufo.loc[(ufo['state'] != '0') & (ufo['country'] == '0'), 'country'] = 'USA'

# Change country name to Puerto Rico for state = PR:
ufo.loc[ufo['state'] == 'PR', 'country'] = 'Puerto Rico'

# Check my work:
ufo['country'].value_counts()

USA                   63383
Canada                 3280
UK                     2001
0                      1578
Australia               533
Hawaii                  314
Alaska                  300
Mexico                  121
Africa                  103
Germany                  88
New Zealand              78
Open Water               47
Ireland                  46
India                    38
Brazil                   38
Malaysia                 32
Spain                    31
Netherlands              26
Puerto Rico              26
Philippines              23
France                   22
Israel                   17
Costa Rica               16
China                    15
Korea                    14
Thailand                 14
Argentina                14
UAE                      13
Sri Lanka                13
Greece                   12
Italy                    10
Iraq                      9
Venezuela                 9
Japan                     8
Belgium                   8
Portugal            

In [19]:
# Look at the value counts of 1:
ufo['1'].value_counts()

0                               43384
(canada)                         2479
(uk/england)                     1372
city                             1311
beach                            1094
park                              602
springs                           566
lake                              538
york                              462
valley                            456
angeles                           392
vegas                             382
falls                             373
diego                             337
island                            301
(australia)                       244
hills                             211
grove                             209
bay                               209
hill                              203
creek                             194
jose                              184
francisco                         184
river                             184
heights                           179
(near)                            162
louis       

In [20]:
# Look at rows with specific values in column 1 with 5 or more value counts:
# ufo[(ufo['1'] == '(uk/england)') & (ufo['country'] == '0')].shape  #<--- 65 rows
# ufo[(ufo['1'] == '(australia)') & (ufo['country'] == '0')].shape  #<--- 19 rows
# ufo[(ufo['1'] == '(india)') & (ufo['country'] == '0')].shape  #<--- 147 rows
# ufo[(ufo['1'] == '(uk/scotland)') & (ufo['country'] == '0')].shape  #<--- 8 rows
# ufo[(ufo['1'] == '(mexico)') & (ufo['country'] == '0')].shape  #<--- 87 rows
# ufo[(ufo['1'] == '(germany)') & (ufo['country'] == '0')].shape  #<--- 12 rows
# ufo[(ufo['1'] == '(netherlands)') & (ufo['country'] == '0')].shape  #<--- 84 rows
# ufo[(ufo['1'] == '(uk/wales)') & (ufo['country'] == '0')]  #<--- 2 rows
# ufo[(ufo['1'] == '(spain)') & (ufo['country'] == '0')].shape  #<--- 33 rows
# ufo[(ufo['1'] == '(norway)') & (ufo['country'] == '0')].shape  #<--- 32 rows
# ufo[(ufo['1'] == '(japan)') & (ufo['country'] == '0')].shape  #<--- 29 rows
# ufo[(ufo['1'] == '(belgium)') & (ufo['country'] == '0')].shape  #<--- 29 rows
# ufo[(ufo['1'] == '(sweden)') & (ufo['country'] == '0')].shape  #<--- 28 rows
# ufo[(ufo['1'] == '(france)') & (ufo['country'] == '0')].shape  #<--- 26 rows
# ufo[(ufo['1'] == '(pakistan)') & (ufo['country'] == '0')].shape  #<--- 24 rows
# ufo[(ufo['1'] == '(greece)') & (ufo['country'] == '0')].shape  #<--- 22 rows
# ufo[(ufo['1'] == '(portugal)') & (ufo['country'] == '0')].shape  #<--- 23 rows
# ufo[(ufo['1'] == '(finland)') & (ufo['country'] == '0')].shape  #<--- 22 rows
# ufo[(ufo['1'] == '(turkey)') & (ufo['country'] == '0')].shape  #<--- 22 rows
# ufo[(ufo['1'] == '(china)') & (ufo['country'] == '0')].shape  #<--- 22 rows
# ufo[(ufo['1'] == '(brazil)') & (ufo['country'] == '0')].shape  #<--- 19 rows
# ufo[(ufo['1'] == '(iran)') & (ufo['country'] == '0')].shape  #<--- 19 rows
# ufo[(ufo['1'] == '(romania)') & (ufo['country'] == '0')].shape  #<--- 19 rows
# ufo[(ufo['1'] == '(malaysia)') & (ufo['country'] == '0')].shape  #<--- 18 rows
# ufo[(ufo['1'] == '(cyprus)') & (ufo['country'] == '0')].shape  #<--- 17 rows
# ufo[(ufo['1'] == '(ireland)') & (ufo['country'] == '0')].shape  #<--- 17 rows
# ufo[(ufo['1'] == '(croatia)') & (ufo['country'] == '0')].shape  #<--- 16 rows
# ufo[(ufo['1'] == '(italy)') & (ufo['country'] == '0')].shape  #<--- 16 rows
# ufo[(ufo['1'] == '(denmark)') & (ufo['country'] == '0')].shape  #<--- 15 rows
# ufo[(ufo['1'] == '(israel)') & (ufo['country'] == '0')].shape  #<--- 14 rows
# ufo[(ufo['1'] == '(hungary)') & (ufo['country'] == '0')].shape  #<--- 14 rows
# ufo[(ufo['1'] == '(venezuela)') & (ufo['country'] == '0')].shape  #<--- 12 rows
# ufo[(ufo['1'] == '(poland)') & (ufo['country'] == '0')].shape  #<--- 13 rows
# ufo[(ufo['1'] == '(switzerland)') & (ufo['country'] == '0')].shape  #<--- 13 rows
# ufo[(ufo['1'] == '(iraq)') & (ufo['country'] == '0')].shape  #<--- 12 rows
# ufo[(ufo['1'] == '(bulgaria)') & (ufo['country'] == '0')].shape  #<--- 11 rows
# ufo[(ufo['1'] == '(philippines)') & (ufo['country'] == '0')].shape  #<--- 11 rows
# ufo[(ufo['1'] == '(bangladesh)') & (ufo['country'] == '0')].shape  #<--- 11 rows
# ufo[(ufo['1'] == '(estonia)') & (ufo['country'] == '0')].shape  #<--- 10 rows
# ufo[(ufo['1'] == '(iceland)') & (ufo['country'] == '0')].shape  #<--- 10 rows
# ufo[(ufo['1'] == '(lithuania)') & (ufo['country'] == '0')].shape  #<--- 10 rows
# ufo[(ufo['1'] == '(indonesia)') & (ufo['country'] == '0')].shape  #<--- 10 rows
# ufo[(ufo['1'] == '(lebanon)') & (ufo['country'] == '0')].shape  #<--- 10 rows
# ufo[(ufo['1'] == '(jordan)') & (ufo['country'] == '0')].shape  #<--- 8 rows
# ufo[(ufo['1'] == '(chile)') & (ufo['country'] == '0')].shape  #<--- 8 rows
# ufo[(ufo['1'] == '(ecuador)') & (ufo['country'] == '0')].shape  #<--- 8 rows
# ufo[(ufo['1'] == 'kong') & (ufo['country'] == '0')]  #<--- Only 1 row
# ufo[(ufo['1'] == '(slovenia)') & (ufo['country'] == '0)].shape  #<--- 8 rows
# ufo[(ufo['1'] == '(ukraine)') & (ufo['country'] == '0')].shape  #<--- 7 rows
# ufo[(ufo['1'] == '(colombia)') & (ufo['country'] == '0')].shape  #<--- 7 rows
# ufo[(ufo['1'] == '(thailand)') & (ufo['country'] == '0')].shape  #<--- 7 rows
# ufo[(ufo['1'] == '(afghanistan)') & (ufo['country'] == '0')].shape  #<--- 7 rows
# ufo[(ufo['1'] == '(jamaica)') & (ufo['country'] == '0')].shape  #<--- 6 rows
# ufo[(ufo['1'] == 'republic') & (ufo['country'] == '0')]  #<--- Only 1 row
# ufo[(ufo['1'] == '(trinidad/tobago)') & (ufo['country'] == '0')].shape  #<--- 4 rows
# ufo[(ufo['1'] == '(austria)') & (ufo['country'] == '0')].shape  #<--- 5 rows
# ufo[(ufo['1'] == '(uk/england') & (ufo['country'] == '0')]  #<--- 4 rows
# ufo[(ufo['1'] == '(yugoslavia)') & (ufo['country'] == '0')]  #<--- 5 rows
# ufo[(ufo['1'] == 'zealand') & (ufo['country'] == '0')]  #<--- 5 rows
# ufo[(ufo['1'] == '(kosovo)') & (ufo['country'] == '0')]  #<--- 5rows
# ufo[(ufo['1'] == '(uae)') & (ufo['country'] == '0')]  #<--- 5 rows
# ufo[(ufo['1'] != '0') & (ufo['country'] == '0')]  #<--- Nothing left now.

# Change country values based on values in column 1:
ufo.loc[(ufo['1'] == '(uk/england)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(uk/scotland)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(uk/wales)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(australia)') & (ufo['country'] == '0'), 'country'] = 'Australia'
ufo.loc[(ufo['1'] == '(india)') & (ufo['country'] == '0'), 'country'] = 'India'
ufo.loc[(ufo['1'] == '(mexico)') & (ufo['country'] == '0'), 'country'] = 'Mexico'
ufo.loc[(ufo['1'] == '(germany)') & (ufo['country'] == '0'), 'country'] = 'Germany'
ufo.loc[(ufo['1'] == '(netherlands)') & (ufo['country'] == '0'), 'country'] = 'Netherlands'
ufo.loc[(ufo['1'] == '(norway)') & (ufo['country'] == '0'), 'country'] = 'Norway'
ufo.loc[(ufo['1'] == '(japan)') & (ufo['country'] == '0'), 'country'] = 'Japan'
ufo.loc[(ufo['1'] == '(belgium)') & (ufo['country'] == '0'), 'country'] = 'Belgium'
ufo.loc[(ufo['1'] == '(sweden)') & (ufo['country'] == '0'), 'country'] = 'Sweden'
ufo.loc[(ufo['1'] == '(france)') & (ufo['country'] == '0'), 'country'] = 'France'
ufo.loc[(ufo['1'] == '(pakistan)') & (ufo['country'] == '0'), 'country'] = 'Pakistan'
ufo.loc[(ufo['1'] == '(greece)') & (ufo['country'] == '0'), 'country'] = 'Greece'
ufo.loc[(ufo['1'] == '(portugal)') & (ufo['country'] == '0'), 'country'] = 'Portugal'
ufo.loc[(ufo['1'] == '(finland)') & (ufo['country'] == '0'), 'country'] = 'Finland'
ufo.loc[(ufo['1'] == '(turkey)') & (ufo['country'] == '0'), 'country'] = 'Turkey'
ufo.loc[(ufo['1'] == '(china)') & (ufo['country'] == '0'), 'country'] = 'China'
ufo.loc[(ufo['1'] == '(brazil)') & (ufo['country'] == '0'), 'country'] = 'Brazil'
ufo.loc[(ufo['1'] == '(iran)') & (ufo['country'] == '0'), 'country'] = 'Iran'
ufo.loc[(ufo['1'] == '(romania)') & (ufo['country'] == '0'), 'country'] = 'Romania'
ufo.loc[(ufo['1'] == '(malaysia)') & (ufo['country'] == '0'), 'country'] = 'Malaysia'
ufo.loc[(ufo['1'] == '(cyprus)') & (ufo['country'] == '0'), 'country'] = 'Cyprus'
ufo.loc[(ufo['1'] == '(ireland)	') & (ufo['country'] == '0'), 'country'] = 'Ireland'
ufo.loc[(ufo['1'] == '(croatia)') & (ufo['country'] == '0'), 'country'] = 'Croatia'
ufo.loc[(ufo['1'] == '(italy)') & (ufo['country'] == '0'), 'country'] = 'Italy'
ufo.loc[(ufo['1'] == '(denmark)') & (ufo['country'] == '0'), 'country'] = 'Denmark'
ufo.loc[(ufo['1'] == '(israel)') & (ufo['country'] == '0'), 'country'] = 'Israel'
ufo.loc[(ufo['1'] == '(hungary)') & (ufo['country'] == '0'), 'country'] = 'Hungary'
ufo.loc[(ufo['1'] == '(venezuela)') & (ufo['country'] == '0'), 'country'] = 'Venezuela'
ufo.loc[(ufo['1'] == '(poland)') & (ufo['country'] == '0'), 'country'] = 'Poland'
ufo.loc[(ufo['1'] == '(switzerland)') & (ufo['country'] == '0'), 'country'] = 'Switzerland'
ufo.loc[(ufo['1'] == '(iraq)') & (ufo['country'] == '0'), 'country'] = 'Iraq'
ufo.loc[(ufo['1'] == '(bulgaria)') & (ufo['country'] == '0'), 'country'] = 'Bulgaria'
ufo.loc[(ufo['1'] == '(philippines)') & (ufo['country'] == '0'), 'country'] = 'Philippines'
ufo.loc[(ufo['1'] == '(bangladesh)') & (ufo['country'] == '0'), 'country'] = 'Bangladesh'
ufo.loc[(ufo['1'] == '(estonia)') & (ufo['country'] == '0'), 'country'] = 'Estonia'
ufo.loc[(ufo['1'] == '(iceland)') & (ufo['country'] == '0'), 'country'] = 'Iceland'
ufo.loc[(ufo['1'] == '(lithuania)') & (ufo['country'] == '0'), 'country'] = 'Lithuania'
ufo.loc[(ufo['1'] == '(indonesia)') & (ufo['country'] == '0'), 'country'] = 'Indonesia'
ufo.loc[(ufo['1'] == '(lebanon)') & (ufo['country'] == '0'), 'country'] = 'Lebanon'
ufo.loc[(ufo['1'] == '(jordan)') & (ufo['country'] == '0'), 'country'] = 'Jordan'
ufo.loc[(ufo['1'] == '(chile)') & (ufo['country'] == '0'), 'country'] = 'Chile'
ufo.loc[(ufo['1'] == '(ecuador)') & (ufo['country'] == '0'), 'country'] = 'Ecuador'
ufo.loc[(ufo['1'] == 'kong') & (ufo['country'] == '0'), 'country'] = 'Hong Kong'
ufo.loc[(ufo['1'] == '(slovenia)') & (ufo['country'] == '0'), 'country'] = 'Slovenia'
ufo.loc[(ufo['1'] == '(ukraine)') & (ufo['country'] == '0'), 'country'] = 'Ukraine'
ufo.loc[(ufo['1'] == '(colombia)') & (ufo['country'] == '0'), 'country'] = 'Colombia'
ufo.loc[(ufo['1'] == '(thailand)') & (ufo['country'] == '0'), 'country'] = 'Thailand'
ufo.loc[(ufo['1'] == '(afghanistan)') & (ufo['country'] == '0'), 'country'] = 'Afghanistan'
ufo.loc[(ufo['1'] == '(jamaica)') & (ufo['country'] == '0'), 'country'] = 'Jamaica'
ufo.loc[(ufo['1'] == 'republic') & (ufo['country'] == '0'), 'country'] = 'Czech Republic'
ufo.loc[(ufo['1'] == '(trinidad/tobago)') & (ufo['country'] == '0'), 'country'] = 'Trinidad'
ufo.loc[(ufo['1'] == '(austria)') & (ufo['country'] == '0'), 'country'] = 'Austria'
ufo.loc[(ufo['1'] == '(uk/england') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(yugoslavia)') & (ufo['country'] == '0'), 'country'] = 'Yugoslavia'
ufo.loc[(ufo['1'] == 'zealand') & (ufo['country'] == '0'), 'country'] = 'New Zealand'
ufo.loc[(ufo['1'] == '(kosovo)') & (ufo['country'] == '0'), 'country'] = 'Kosovo'
ufo.loc[(ufo['1'] == '(uae)') & (ufo['country'] == '0'), 'country'] = 'UAE'
ufo.loc[(ufo['1'] == '(armenia)') & (ufo['country'] == '0'), 'country'] = 'Armenia'
ufo.loc[(ufo['1'] == 'sinaloa') & (ufo['country'] == '0'), 'country'] = 'Mexico'
ufo.loc[(ufo['1'] == '(spain)') & (ufo['country'] == '0'), 'country'] = 'Spain'
ufo.loc[(ufo['1'] == '(egypt)') & (ufo['country'] == '0'), 'country'] = 'Egypt'
ufo.loc[(ufo['1'] == '(ireland)') & (ufo['country'] == '0'), 'country'] = 'Ireland'
ufo.loc[(ufo['1'] == 'ocean') & (ufo['country'] == '0'), 'country'] = 'Open Water'
ufo.loc[(ufo['1'] == 'sea') & (ufo['country'] == '0'), 'country'] = 'Open Water'
ufo.loc[(ufo['1'] == 'fokani/hims') & (ufo['country'] == '0'), 'country'] = 'Syria'
ufo.loc[(ufo['1'] == '(algeria)') & (ufo['country'] == '0'), 'country'] = 'Algeria'
ufo.loc[(ufo['1'] == '(morocco)') & (ufo['country'] == '0'), 'country'] = 'Morocco'
ufo.loc[(ufo['1'] == '(bosnia)') & (ufo['country'] == '0'), 'country'] = 'Bosnia'
ufo.loc[(ufo['1'] == '(latvia)') & (ufo['country'] == '0'), 'country'] = 'Latvia'
ufo.loc[(ufo['1'] == '(suriname)') & (ufo['country'] == '0'), 'country'] = 'Suriname'
ufo.loc[(ufo['1'] == '(uzbekistan)') & (ufo['country'] == '0'), 'country'] = 'Uzbekistan'
ufo.loc[(ufo['1'] == '(ghana)') & (ufo['country'] == '0'), 'country'] = 'Ghana'
ufo.loc[(ufo['1'] == '(nepal)') & (ufo['country'] == '0'), 'country'] = 'Nepal'
ufo.loc[(ufo['1'] == '(bolivia)') & (ufo['country'] == '0'), 'country'] = 'Bolivia'
ufo.loc[(ufo['1'] == '(bahrain)') & (ufo['country'] == '0'), 'country'] = 'Bahrain'
ufo.loc[(ufo['1'] == '(caribbean)') & (ufo['country'] == '0'), 'country'] = 'Caribbean'
ufo.loc[(ufo['1'] == '(korea)') & (ufo['country'] == '0'), 'country'] = 'Korea'
ufo.loc[(ufo['1'] == 'ireland') & (ufo['country'] == '0'), 'country'] = 'Ireland'
ufo.loc[(ufo['1'] == '(malta)') & (ufo['country'] == '0'), 'country'] = 'Malta'
ufo.loc[(ufo['1'] == '(slovakia)') & (ufo['country'] == '0'), 'country'] = 'Slovakia'
ufo.loc[(ufo['1'] == '(luxemburg)') & (ufo['country'] == '0'), 'country'] = 'Luxembourg'
ufo.loc[(ufo['1'] == '(azerbaijan)') & (ufo['country'] == '0'), 'country'] = 'Azerbaijan'
ufo.loc[(ufo['1'] == '(fiji)') & (ufo['country'] == '0'), 'country'] = 'Fiji'
ufo.loc[(ufo['1'] == '(dubai)') & (ufo['country'] == '0'), 'country'] = 'Dubai'
ufo.loc[(ufo['1'] == 'piedras') & (ufo['country'] == '0'), 'country'] = 'Puerto Rico'
ufo.loc[(ufo['1'] == '(merseyside)(uk/wales)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(maldives)') & (ufo['country'] == '0'), 'country'] = 'Maldives'
ufo.loc[(ufo['1'] == '(honduras)') & (ufo['country'] == '0'), 'country'] = 'Honduras'
ufo.loc[(ufo['1'] == '(paraguay)') & (ufo['country'] == '0'), 'country'] = 'Paraguay'
ufo.loc[(ufo['1'] == 'rico') & (ufo['country'] == '0'), 'country'] = 'Puerto Rico'
ufo.loc[(ufo['1'] == 'mumbai') & (ufo['country'] == '0'), 'country'] = 'India'
ufo.loc[(ufo['1'] == '(palau)') & (ufo['country'] == '0'), 'country'] = 'Palau'
ufo.loc[(ufo['1'] == '(lesotho)') & (ufo['country'] == '0'), 'country'] = 'Lesotho'
ufo.loc[(ufo['1'] == '(uk/scotland') & (ufo['country'] == '0'), 'country'] = 'Scotland'
ufo.loc[(ufo['1'] == '(kenya)') & (ufo['country'] == '0'), 'country'] = 'Kenya'
ufo.loc[(ufo['1'] == 'africa') & (ufo['country'] == '0'), 'country'] = 'Africa'
ufo.loc[(ufo['1'] == '(bermuda)') & (ufo['country'] == '0'), 'country'] = 'Bermuda'
ufo.loc[(ufo['1'] == 'kennedy') & (ufo['country'] == '0'), 'country'] = 'Australia'
ufo.loc[(ufo['1'] == '(nigeria)') & (ufo['country'] == '0'), 'country'] = 'Nigeria'
ufo.loc[(ufo['1'] == '(brasil)') & (ufo['country'] == '0'), 'country'] = 'Brazil'
ufo.loc[(ufo['1'] == '(cancun)') & (ufo['country'] == '0'), 'country'] = 'Mexico'
ufo.loc[(ufo['1'] == 'manchester') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(taiwan)') & (ufo['country'] == '0'), 'country'] = 'Taiwan'
ufo.loc[(ufo['1'] == '(crimea)') & (ufo['country'] == '0'), 'country'] = 'Ukraine'
ufo.loc[(ufo['1'] == '(kyrgyzistan)') & (ufo['country'] == '0'), 'country'] = 'Kyrgyzstan'
ufo.loc[(ufo['1'] == '(serbia)') & (ufo['country'] == '0'), 'country'] = 'Serbia'
ufo.loc[(ufo['1'] == '(luxembourge)') & (ufo['country'] == '0'), 'country'] = 'Luxembourg'
ufo.loc[(ufo['1'] == '(u.a.r.)') & (ufo['country'] == '0'), 'country'] = 'UAR'
ufo.loc[(ufo['1'] == '(u.a.e.)') & (ufo['country'] == '0'), 'country'] = 'UAE'
ufo.loc[(ufo['1'] == 'amsterdam') & (ufo['country'] == '0'), 'country'] = 'Netherlands'
ufo.loc[(ufo['1'] == '(barbados)') & (ufo['country'] == '0'), 'country'] = 'Barbados'
ufo.loc[(ufo['1'] == '(namibia)') & (ufo['country'] == '0'), 'country'] = 'Namibia'
ufo.loc[(ufo['1'] == 'cruise') & (ufo['country'] == '0'), 'country'] = 'Open Water'
ufo.loc[(ufo['1'] == '(peru)') & (ufo['country'] == '0'), 'country'] = 'Peru'
ufo.loc[(ufo['1'] == '(zambia)') & (ufo['country'] == '0'), 'country'] = 'Zambia'
ufo.loc[(ufo['1'] == 'kingdom') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(argentina)') & (ufo['country'] == '0'), 'country'] = 'Argentina'
ufo.loc[(ufo['1'] == '(guatamala)') & (ufo['country'] == '0'), 'country'] = 'Guatamala'
ufo.loc[(ufo['1'] == '(brunei)') & (ufo['country'] == '0'), 'country'] = 'Brunei'
ufo.loc[(ufo['1'] == '(tunisia)') & (ufo['country'] == '0'), 'country'] = 'Africa'
ufo.loc[(ufo['1'] == 'paz/cochabamba/potosi') & (ufo['country'] == '0'), 'country'] = 'Bolivia'
ufo.loc[(ufo['1'] == '(syria)') & (ufo['country'] == '0'), 'country'] = 'Syria'
ufo.loc[(ufo['1'] == '(milano)') & (ufo['country'] == '0'), 'country'] = 'Italy'
ufo.loc[(ufo['1'] == '(midlothian)(uk/scotland)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(natherlands)') & (ufo['country'] == '0'), 'country'] = 'Netherlands'
ufo.loc[(ufo['1'] == '(guatemala)') & (ufo['country'] == '0'), 'country'] = 'Guatemala'
ufo.loc[(ufo['1'] == '(yorkshire)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(cameroon)') & (ufo['country'] == '0'), 'country'] = 'Cameroon'
ufo.loc[(ufo['1'] == '(macedonia)') & (ufo['country'] == '0'), 'country'] = 'Macedonia'
ufo.loc[(ufo['1'] == '(albania)') & (ufo['country'] == '0'), 'country'] = 'Albania'
ufo.loc[(ufo['1'] == '(senegal)') & (ufo['country'] == '0'), 'country'] = 'Senegal'
ufo.loc[(ufo['1'] == '(uar)') & (ufo['country'] == '0'), 'country'] = 'UAR'
ufo.loc[(ufo['1'] == '(botswana)') & (ufo['country'] == '0'), 'country'] = 'Botswana'
ufo.loc[(ufo['1'] == '(uruguay)') & (ufo['country'] == '0'), 'country'] = 'Uruguay'
ufo.loc[(ufo['1'] == '(zimbabwe)') & (ufo['country'] == '0'), 'country'] = 'Zimbabwe'
ufo.loc[(ufo['1'] == '(georgia)') & (ufo['country'] == '0'), 'country'] = 'Georgia'
ufo.loc[(ufo['1'] == 'flight') & (ufo['country'] == '0'), 'country'] = 'Open Water'
ufo.loc[(ufo['1'] == '(uk/england?)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(bosnia/herzegovina)') & (ufo['country'] == '0'), 'country'] = 'Bosnia'
ufo.loc[(ufo['1'] == 'gulf') & (ufo['country'] == '0'), 'country'] = 'Open Water'
ufo.loc[(ufo['1'] == '(australi)') & (ufo['country'] == '0'), 'country'] = 'Australia'
ufo.loc[(ufo['1'] == '(boxnia)') & (ufo['country'] == '0'), 'country'] = 'Bosnia'
ufo.loc[(ufo['1'] == '(kazakstan)') & (ufo['country'] == '0'), 'country'] = 'Kazakhstan'
ufo.loc[(ufo['1'] == '(bosnia/herzogovina)') & (ufo['country'] == '0'), 'country'] = 'Bosnia'
ufo.loc[(ufo['1'] == '(netherland)') & (ufo['country'] == '0'), 'country'] = 'Netherlands'
ufo.loc[(ufo['1'] == '(belize)') & (ufo['country'] == '0'), 'country'] = 'Belize'
ufo.loc[(ufo['1'] == '(wales)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(russia)') & (ufo['country'] == '0'), 'country'] = 'Russia'
ufo.loc[(ufo['1'] == '(antibes)') & (ufo['country'] == '0'), 'country'] = 'France'
ufo.loc[(ufo['1'] == '(rhodes)') & (ufo['country'] == '0'), 'country'] = 'Greece'
ufo.loc[(ufo['1'] == '(manchester)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(india') & (ufo['country'] == '0'), 'country'] = 'India'
ufo.loc[(ufo['1'] == '(panama)') & (ufo['country'] == '0'), 'country'] = 'Panama'
ufo.loc[(ufo['1'] == '(botswama)') & (ufo['country'] == '0'), 'country'] = 'Botswana'
ufo.loc[(ufo['1'] == '(mauritius)') & (ufo['country'] == '0'), 'country'] = 'Mauritius'
ufo.loc[(ufo['1'] == '(mongolia)') & (ufo['country'] == '0'), 'country'] = 'Mongolia'
ufo.loc[(ufo['1'] == '(selangor)(malaysia)') & (ufo['country'] == '0'), 'country'] = 'Malaysia'
ufo.loc[(ufo['1'] == '(scotland)') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == 'australia') & (ufo['country'] == '0'), 'country'] = 'Australia'
ufo.loc[(ufo['1'] == 'popocatapetl') & (ufo['country'] == '0'), 'country'] = 'Mexico'
ufo.loc[(ufo['1'] == 'midlands') & (ufo['country'] == '0'), 'country'] = 'England'
ufo.loc[(ufo['1'] == '(trinidad)') & (ufo['country'] == '0'), 'country'] = 'Trinidad'
ufo.loc[(ufo['1'] == '(myanmar)') & (ufo['country'] == '0'), 'country'] = 'Myanmar'
ufo.loc[(ufo['1'] == '(inflight)') & (ufo['country'] == '0'), 'country'] = 'Open Water'
ufo.loc[(ufo['1'] == 'states') & (ufo['country'] == '0'), 'country'] = 'USA'
ufo.loc[(ufo['1'] == '(uk/england)k') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == '(qatar)') & (ufo['country'] == '0'), 'country'] = 'Qatar'
ufo.loc[(ufo['1'] == '(sinai)') & (ufo['country'] == '0'), 'country'] = 'Egypt'
ufo.loc[(ufo['1'] == 'sp&aring;nga') & (ufo['country'] == '0'), 'country'] = 'Sweden'
ufo.loc[(ufo['1'] == 'somerset') & (ufo['country'] == '0'), 'country'] = 'England'
ufo.loc[(ufo['0'] == 'australia') & (ufo['1'] == '(rural)') & (ufo['country'] == '0'), 'country'] = 'Australia'
ufo.loc[(ufo['0'] == 'croatia') & (ufo['1'] == '(rural)') & (ufo['country'] == '0'), 'country'] = 'Croatia'
ufo.loc[(ufo['1'] == 'fort') & (ufo['country'] == '0'), 'country'] = 'Caribbean'
ufo.loc[(ufo['1'] == 'hill') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['1'] == 'town') & (ufo['country'] == '0'), 'country'] = 'Africa'
ufo.loc[(ufo['1'] == 'rivers') & (ufo['country'] == '0'), 'country'] = 'USA'
ufo.loc[(ufo['1'] == 'keys') & (ufo['country'] == '0'), 'country'] = 'USA'
ufo.loc[(ufo['1'] == 'north') & (ufo['country'] == '0'), 'country'] = 'New Zealand'
ufo.loc[(ufo['1'] == '(southern)') & (ufo['country'] == '0'), 'country'] = 'Iraq'
ufo.loc[(ufo['1'] == 'beach') & (ufo['country'] == '0'), 'country'] = 'USA'
ufo.loc[(ufo['0'] == 'australia') & (ufo['1'] == '(northeast)') & (ufo['country'] == '0'), 'country'] = 'Australia'
ufo.loc[(ufo['0'] == 'thailand') & (ufo['1'] == '(northeast)') & (ufo['country'] == '0'), 'country'] = 'Thailand'


# Drop column 1, no more useful information:
ufo.drop(columns='1', inplace=True)

# Check my work:
ufo['country'].value_counts()

USA                   63387
Canada                 3280
UK                     2090
Australia               558
Hawaii                  314
Alaska                  300
0                       232
Mexico                  211
India                   187
Netherlands             113
Africa                  106
Germany                 100
New Zealand              84
Ireland                  65
Open Water               64
Spain                    64
Brazil                   59
Malaysia                 51
France                   49
China                    37
Japan                    37
Belgium                  37
Greece                   35
Philippines              34
Norway                   34
Sweden                   32
Portugal                 31
Israel                   31
Puerto Rico              31
Italy                    27
Pakistan                 27
Finland                  25
Turkey                   24
Romania                  23
Thailand                 22
Croatia             

In [21]:
# Change country values based on values in column 0:
ufo.loc[(ufo['0'] == 'iraq') & (ufo['country'] == '0'), 'country'] = 'Iraq'
ufo.loc[(ufo['0'] == 'gaia') & (ufo['country'] == '0'), 'country'] = 'Portugal'
ufo.loc[(ufo['0'] == 'uk/england') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'cali') & (ufo['country'] == '0'), 'country'] = 'Colombia'
ufo.loc[(ufo['0'] == 'philippines') & (ufo['country'] == '0'), 'country'] = 'Philippines'
ufo.loc[(ufo['0'] == 'australia') & (ufo['country'] == '0'), 'country'] = 'Australia'
ufo.loc[(ufo['0'] == 'japan') & (ufo['country'] == '0'), 'country'] = 'Japan'
ufo.loc[(ufo['0'] == 'malmesbury') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'gillingham') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'guatemala') & (ufo['country'] == '0'), 'country'] = 'Guatemala'
ufo.loc[(ufo['0'] == 'seoul') & (ufo['country'] == '0'), 'country'] = 'Korea'
ufo.loc[(ufo['0'] == 'paphos') & (ufo['country'] == '0'), 'country'] = 'Paphos'
ufo.loc[(ufo['0'] == 'luxembourg') & (ufo['country'] == '0'), 'country'] = 'Luxembourg'
ufo.loc[(ufo['0'] == 'kosovo') & (ufo['country'] == '0'), 'country'] = 'Kosovo'
ufo.loc[(ufo['0'] == 'zimbabwe') & (ufo['country'] == '0'), 'country'] = 'Zimbabwe'
ufo.loc[(ufo['0'] == 'kuwait') & (ufo['country'] == '0'), 'country'] = 'Kuwait'
ufo.loc[(ufo['0'] == 'afghanistan') & (ufo['country'] == '0'), 'country'] = 'Afghanistan'
ufo.loc[(ufo['0'] == 'amed') & (ufo['country'] == '0'), 'country'] = 'Indonesia'
ufo.loc[(ufo['0'] == 'estonia') & (ufo['country'] == '0'), 'country'] = 'Estonia'
ufo.loc[(ufo['0'] == 'singapore') & (ufo['country'] == '0'), 'country'] = 'Singapore'
ufo.loc[(ufo['0'] == 'bilbao')& (ufo['country'] == '0'), 'country'] = 'Spain'
ufo.loc[(ufo['0'] == 'tabriz') & (ufo['country'] == '0'), 'country'] = 'Iran'
ufo.loc[(ufo['0'] == 'sharjah') & (ufo['country'] == '0'), 'country'] = 'UAE'
ufo.loc[(ufo['0'] == 'bogor') & (ufo['country'] == '0'), 'country'] = 'Indonesia'
ufo.loc[(ufo['0'] == 'kajaani') & (ufo['country'] == '0'), 'country'] = 'Finland'
ufo.loc[(ufo['0'] == 'wednesbury') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'yateley') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'aruba') & (ufo['country'] == '0'), 'country'] = 'Netherlands'
ufo.loc[(ufo['0'] == 'iquique') & (ufo['country'] == '0'), 'country'] = 'Chile'
ufo.loc[(ufo['0'] == 'barbados') & (ufo['country'] == '0'), 'country'] = 'Barbados'
ufo.loc[(ufo['0'] == 'trinidad/tobago') & (ufo['country'] == '0'), 'country'] = 'Trinidad'
ufo.loc[(ufo['0'] == 'debrecen') & (ufo['country'] == '0'), 'country'] = 'Hungary'
ufo.loc[(ufo['0'] == 'uk/scotland') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'sotira') & (ufo['country'] == '0'), 'country'] = 'Cyprus'
ufo.loc[(ufo['0'] == 'mayag&uuml;ez') & (ufo['country'] == '0'), 'country'] = 'Puerto Rico'
ufo.loc[(ufo['0'] == 'paraparaumu') & (ufo['country'] == '0'), 'country'] = 'New Zealand'
ufo.loc[(ufo['0'] == 'mumbai') & (ufo['country'] == '0'), 'country'] = 'India'
ufo.loc[(ufo['0'] == 'potzberg') & (ufo['country'] == '0'), 'country'] = 'Germany'
ufo.loc[(ufo['0'] == 'in-flight/europe') & (ufo['country'] == '0'), 'country'] = 'Europe'
ufo.loc[(ufo['0'] == 'tirau') & (ufo['country'] == '0'), 'country'] = 'New Zealand'
ufo.loc[(ufo['0'] == 'caracas') & (ufo['country'] == '0'), 'country'] = 'Venezuela'
ufo.loc[(ufo['0'] == 'netherlands') & (ufo['country'] == '0'), 'country'] = 'Netherlands'
ufo.loc[(ufo['0'] == 'shepshed') & (ufo['country'] == '0'), 'country'] = 'England'
ufo.loc[(ufo['0'] == 'guyana') & (ufo['country'] == '0'), 'country'] = 'Guyana'
ufo.loc[(ufo['0'] == 'baghdad') & (ufo['country'] == '0'), 'country'] = 'Baghdad'
ufo.loc[(ufo['0'] == 'ath') & (ufo['country'] == '0'), 'country'] = 'Belgium'
ufo.loc[(ufo['0'] == 'guatamala') & (ufo['country'] == '0'), 'country'] = 'Guatemala'
ufo.loc[(ufo['0'] == 'adelaide') & (ufo['country'] == '0'), 'country'] = 'Australia'
ufo.loc[(ufo['0'] == 'turks/caicos') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'india') & (ufo['country'] == '0'), 'country'] = 'India'
ufo.loc[(ufo['0'] == 'malaysia') & (ufo['country'] == '0'), 'country'] = 'Malaysia'
ufo.loc[(ufo['0'] == 'germany') & (ufo['country'] == '0'), 'country'] = 'Germany'
ufo.loc[(ufo['0'] == 'quito') & (ufo['country'] == '0'), 'country'] = 'Ecuador'
ufo.loc[(ufo['0'] == 'kiev') & (ufo['country'] == '0'), 'country'] = 'Ukraine'
ufo.loc[(ufo['0'] == 'ensenada') & (ufo['country'] == '0'), 'country'] = 'Mexico'
ufo.loc[(ufo['0'] == 'bahamas') & (ufo['country'] == '0'), 'country'] = 'Bahamas'
ufo.loc[(ufo['0'] == 'limassol') & (ufo['country'] == '0'), 'country'] = 'Cyprus'
ufo.loc[(ufo['0'] == 'split') & (ufo['country'] == '0'), 'country'] = 'Croatia'
ufo.loc[(ufo['0'] == 'spain') & (ufo['country'] == '0'), 'country'] = 'Spain'
ufo.loc[(ufo['0'] == 'uk/wales') & (ufo['country'] == '0'), 'country'] = 'Wales'
ufo.loc[(ufo['0'] == 'europe') & (ufo['country'] == '0'), 'country'] = 'Europe'
ufo.loc[(ufo['0'] == 'bulgaria') & (ufo['country'] == '0'), 'country'] = 'Bulgaria'
ufo.loc[(ufo['0'] == 'portugal') & (ufo['country'] == '0'), 'country'] = 'Portugal'
ufo.loc[(ufo['0'] == 'wakeman') & (ufo['country'] == '0'), 'country'] = 'USA'
ufo.loc[(ufo['0'] == 'doha') & (ufo['country'] == '0'), 'country'] = 'Qatar'
ufo.loc[(ufo['0'] == 'romania') & (ufo['country'] == '0'), 'country'] = 'Romania'
ufo.loc[(ufo['0'] == 'mellieha') & (ufo['country'] == '0'), 'country'] = 'Malta'
ufo.loc[(ufo['0'] == 'bermuda') & (ufo['country'] == '0'), 'country'] = 'Bermuda'
ufo.loc[(ufo['0'] == 'roodepoort') & (ufo['country'] == '0'), 'country'] = 'Africa'
ufo.loc[(ufo['0'] == 'avebury') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'hoylake') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'france') & (ufo['country'] == '0'), 'country'] = 'France'
ufo.loc[(ufo['0'] == 'cyprus') & (ufo['country'] == '0'), 'country'] = 'Cyprus'
ufo.loc[(ufo['0'] == 'lelystad') & (ufo['country'] == '0'), 'country'] = 'Netherlands'
ufo.loc[(ufo['0'] == 'belgium') & (ufo['country'] == '0'), 'country'] = 'Belgium'
ufo.loc[(ufo['0'] == 'doncaster') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'oslo') & (ufo['country'] == '0'), 'country'] = 'Norway'
ufo.loc[(ufo['0'] == 'guayaquil') & (ufo['country'] == '0'), 'country'] = 'Ecuador'
ufo.loc[(ufo['0'] == 'kullu') & (ufo['country'] == '0'), 'country'] = 'India'
ufo.loc[(ufo['0'] == 'noshahr') & (ufo['country'] == '0'), 'country'] = 'Iran'
ufo.loc[(ufo['0'] == 'wellingborough') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'greece') & (ufo['country'] == '0'), 'country'] = 'Greece'
ufo.loc[(ufo['0'] == 'mazarron') & (ufo['country'] == '0'), 'country'] = 'Spain'
ufo.loc[(ufo['0'] == 'taipei') & (ufo['country'] == '0'), 'country'] = 'Taiwan'
ufo.loc[(ufo['0'] == 'cardiff') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'hungary') & (ufo['country'] == '0'), 'country'] = 'Hungary'
ufo.loc[(ufo['0'] == 'gibraltar') & (ufo['country'] == '0'), 'country'] = 'UK'
ufo.loc[(ufo['0'] == 'guam') & (ufo['country'] == '0'), 'country'] = 'Guam'
ufo.loc[(ufo['0'] == 'unknown') & (ufo['country'] == '0'), 'country'] = 'USA'
ufo.loc[(ufo['0'] == 'indonesia') & (ufo['country'] == '0'), 'country'] = 'Indonesia'
ufo.loc[(ufo['0'] == 'canada') & (ufo['country'] == '0'), 'country'] = 'Canada'
ufo.loc[(ufo['0'] == 'occoquan') & (ufo['country'] == '0'), 'country'] = 'USA'
ufo.loc[(ufo['0'] == 'kenya') & (ufo['country'] == '0'), 'country'] = 'Africa'

In [22]:
# Look at all country rows with 0 and 0 is not 0:
ufo[(ufo['0'] != '0') & (ufo['country'] == '0') & (ufo['state'] == '0')]

Unnamed: 0,Id,year,month,dow,hour,durations_in_secs,city,0,state,country,latitude,longitude,color,movement,elevation,sound,hoax,shape_class


In [23]:
# Drop column 0, no more useful information:
ufo.drop(columns='0', inplace=True)

# Check my work:
ufo['country'].value_counts()

USA                   63391
Canada                 3281
UK                     2159
Australia               572
Hawaii                  314
Alaska                  300
Mexico                  212
India                   192
Netherlands             116
Africa                  108
Germany                 103
New Zealand              86
Spain                    69
Ireland                  65
Open Water               64
Brazil                   59
Malaysia                 52
France                   51
Philippines              43
Japan                    40
Belgium                  40
Portugal                 38
China                    37
Greece                   36
Norway                   35
Sweden                   32
Puerto Rico              32
Israel                   31
Pakistan                 27
Italy                    27
Finland                  26
Romania                  26
Turkey                   24
Iraq                     23
Croatia                  23
Venezuela           

In [28]:
# Create a continent feature:
ufo['continent'] = ufo['country']
ufo.head(10)

Unnamed: 0,Id,year,month,dow,hour,durations_in_secs,city,state,country,latitude,longitude,color,movement,elevation,sound,hoax,shape_class,continent
0,58,1994,10,Mon,15,3600.0,Mercedies,TX,USA,26.149798,-97.913611,0,0,0,0,0,Non-Geometric,USA
1,59,1994,10,Mon,18,120.0,Burnt Hills,NY,USA,42.909722,-73.895556,0,0,1,0,0,Geometric,USA
2,60,1994,10,Mon,22,5.0,Pinebergen,AR,USA,34.102778,-91.992222,0,1,1,1,0,Type of Light,USA
3,61,1994,10,Mon,23,3600.0,Toronto (Greater Toronto Area) (Canada),ON,Canada,43.666667,-79.416667,0,0,0,0,0,Circular,Canada
4,62,1995,10,Tue,19,120.0,Milwaukee,WI,USA,43.038889,-87.906389,1,0,0,0,0,Other,USA
5,63,1995,10,Tue,22,60.0,Oakland,CA,USA,37.804444,-122.269722,0,1,1,0,0,Other,USA
6,64,1996,10,Thr,3,3.0,Higginsville,MO,USA,39.0725,-93.716944,0,1,1,0,0,Geometric,USA
7,65,1996,10,Thr,20,300.0,Lake Macquarie (Nsw&#44 Australia),0,Australia,-33.093373,151.588982,1,0,0,0,0,Type of Light,Australia
8,66,1996,10,Thr,22,300.0,Charleston,SC,USA,32.776389,-79.931111,0,0,0,0,0,Type of Light,USA
9,67,1996,10,Thr,22,60.0,Monroe County,OH,USA,39.440278,-84.362222,0,0,0,0,0,Non-Geometric,USA


In [32]:
# Create list of countries by continent:
# Africa = 
# Antartica = 
# Asia = 
# Europe = 
# NAmerica = 
# CAmerica = 
# SAmerica = 
# Australia = 

# Change country names to continent names in continent column:
ufo.loc[['Africa', 'Egypt', 'Nigeria', 'Zimbabwe', 'Cameroon', 'Ghana', 'Mauritius', 'Lesotho'], 'continent'] = 'Africa'
ufo.loc['Antarctica', 'continent'] = 'Antartica'
ufo.loc[['Afghanistan', 'Bahrain', 'Brunei', 'Asia', 'China', 'East Timor', 'India', 'Indonesia', 'Israel', 'Iraq', 'Japan', 'Korea',
         'Kuwait', 'Lebanon', 'Malaysia', 'Maldives', 'Mongolia', 'Myanmar', 'Oman', 'Pakistan', 'Philippines', 'Saudi Arabia', 
         'Sri Lanka', 'Taiwan', 'Thailand', 'Turkey', 'UAE', 'Viet Nam', 'Uzbekistan', 'Georgia', 'Kazakhstan'], 
        'continent'] = 'Asia'
ufo.loc[['Europe', 'Belgium', 'British VI', 'Croatia', 'Cyprus', 'Czech Republic', 'Denmark', 'Finland', 'France', 'Germany', 
         'Greece', 'Hungary', 'Ireland', 'Italy', 'Korea', 'Kosovo', 'Luxembourg', 'Malta', 'Netherlands', 'Norway', 'Poland', 
         'Portugal', 'Romania', 'Russia', 'Slovakia', 'Slovenia', 'Spain', 'Sweden', 'Switzerland', 'Ukraine', 'UK', 'Yugoslavia'], 
        'continent'] = 'Europe'
ufo.loc[['Alaska', 'Bahamas', 'Canada', 'Caribbean', 'Cuba', 'Dominican Republic', 'Grenadine Island', 'Guatamala', 
         'Hawaii', 'Jamaica', 'Mexico', 'Puerto Rico', 'Trinidad', 'USA'], 'continent'] = 'North America'
ufo.loc[['Belize', 'Costa Rica', 'El Salvador', 'Honduras', 'Panama'], 'continent'] = 'Central America'
ufo.loc[['Argentina', 'Bolivia', 'Brazil', 'Chile', 'Colombia', 'Ecuador', 'Guyana', 'Peru', 'Uruguay', 'Venezuela', 
         'Suriname'], 'continent'] = 'South America'
ufo.loc[['Australia', 'New Zealand', 'Papua - New Guinea'], 'continent'] = 'Australia'

# Look at the value counts of continent:
ufo['continent'].value_counts()

KeyError: "None of [Index(['Africa', 'Egypt', 'Nigeria', 'Zimbabwe', 'Cameroon', 'Ghana',\n       'Mauritius', 'Lesotho'],\n      dtype='object')] are in the [index]"

In [33]:
# Rename some country values:
# ufo.loc[ufo['country'] == 'Tunisia', 'country'] = 'Africa'
# ufo.loc[ufo['country'] == 'Belarus', 'country'] = 'Europe'
# ufo.loc[]

In [None]:
# # Still a lot more clealing to do, will do if I have extra time. 
# # For now going to save up to this point to a new csv file for later:
# ufo.to_csv('ufos_cleaned_all_countries.csv', index=False)