# **Global Terrorism Analytics: Data Processing**

---

**<u>_Objective:_</u>** We process data from the Global Terrorism Database (GTD) and build an interactive dashboard to report on international terrorist events from 1970 to 2017.


## Business Understanding



In [3]:
# import dependencies and libraries
import pandas as pd
import numpy as np
import glob
import re
import math
import seaborn as sns
import warnings
import matplotlib.pyplot as plt

# Plot styling: `set_theme` applies the whitegrid style, the rc overrides and
# the font scale in one call, so a separate `sns.set_style('whitegrid')` call
# beforehand is redundant and has been dropped.
sns.set_theme(style = 'whitegrid',
              rc    = {'figure.dpi'    : 400,
                       'figure.figsize': (20, 12)},
              font_scale = 0.60)

# Let matplotlib fit axes, labels and titles inside the figure automatically.
from matplotlib import rcParams
rcParams.update({'figure.autolayout': True})

# Show every column of a DataFrame and up to 200 rows when it is displayed.
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', 200)

# Silence UserWarning messages raised from the openpyxl module.
warnings.filterwarnings('ignore', category = UserWarning, module = 'openpyxl')

## Setting up Environment

In [4]:
import os

# Resolve the project folders relative to the notebook's working directory.
# In the recorded run the notebook lives in `2_Notebooks`, so the project root
# is the parent folder and the data sits in the sibling `1_Data` folder.
cur_dir = os.getcwd()

# Use the parent directory instead of slicing a fixed number of characters off
# the path, so the result does not depend on the folder name's length.
# Joining with "" keeps a trailing path separator, so `root_dir + "name"` and
# `data_dir + "file.csv"` style concatenation still produces valid paths.
root_dir = os.path.join(os.path.dirname(cur_dir), "")
data_dir = os.path.join(root_dir, "1_Data", "")

print(f"Current directory: {cur_dir}\nRoot directory : {root_dir}\nData directory : {data_dir}")

Current directory: H:\My Drive\Data Science and Analytics Portfolio\2 Projects\4 Global Terrorism Analytics\2 Main\2_Notebooks
Root directory : H:\My Drive\Data Science and Analytics Portfolio\2 Projects\4 Global Terrorism Analytics\2 Main\
Data directory : H:\My Drive\Data Science and Analytics Portfolio\2 Projects\4 Global Terrorism Analytics\2 Main\1_Data\


## Read Dataset

In [9]:
%%time
df_terror = pd.read_csv(f"{data_dir}/globalterrorismdb_0718dist.csv", encoding = 'latin-1', dtype = str).fillna('')

CPU times: total: 6.84 s
Wall time: 17.6 s


In [10]:
# Preview the first five rows of the loaded dataset.
df_terror.head(n = 5)

Unnamed: 0,eventid,iyear,imonth,iday,approxdate,extended,resolution,country,country_txt,region,region_txt,provstate,city,latitude,longitude,specificity,vicinity,location,summary,crit1,crit2,crit3,doubtterr,alternative,alternative_txt,multiple,success,suicide,attacktype1,attacktype1_txt,attacktype2,attacktype2_txt,attacktype3,attacktype3_txt,targtype1,targtype1_txt,targsubtype1,targsubtype1_txt,corp1,target1,natlty1,natlty1_txt,targtype2,targtype2_txt,targsubtype2,targsubtype2_txt,corp2,target2,natlty2,natlty2_txt,targtype3,targtype3_txt,targsubtype3,targsubtype3_txt,corp3,target3,natlty3,natlty3_txt,gname,gsubname,gname2,gsubname2,gname3,gsubname3,motive,guncertain1,guncertain2,guncertain3,individual,nperps,nperpcap,claimed,claimmode,claimmode_txt,claim2,claimmode2,claimmode2_txt,claim3,claimmode3,claimmode3_txt,compclaim,weaptype1,weaptype1_txt,weapsubtype1,weapsubtype1_txt,weaptype2,weaptype2_txt,weapsubtype2,weapsubtype2_txt,weaptype3,weaptype3_txt,weapsubtype3,weapsubtype3_txt,weaptype4,weaptype4_txt,weapsubtype4,weapsubtype4_txt,weapdetail,nkill,nkillus,nkillter,nwound,nwoundus,nwoundte,property,propextent,propextent_txt,propvalue,propcomment,ishostkid,nhostkid,nhostkidus,nhours,ndays,divert,kidhijcountry,ransom,ransomamt,ransomamtus,ransompaid,ransompaidus,ransomnote,hostkidoutcome,hostkidoutcome_txt,nreleased,addnotes,scite1,scite2,scite3,dbsource,INT_LOG,INT_IDEO,INT_MISC,INT_ANY,related
0,197000000001,1970,7,2,,0,,58,Dominican Republic,2,Central America & Caribbean,,Santo Domingo,18.456792,-69.951164,1,0,,,1,1,1,0,,,0,1,0,1,Assassination,,,,,14,Private Citizens & Property,68,Named Civilian,,Julio Guzman,58,Dominican Republic,,,,,,,,,,,,,,,,,MANO-D,,,,,,,0,,,0,,,,,,,,,,,,,13,Unknown,,,,,,,,,,,,,,,,1.0,,,0.0,,,0,,,,,0,,,,,,,0,,,,,,,,,,,,,PGIS,0,0,0,0,
1,197000000002,1970,0,0,,0,,130,Mexico,1,North America,Federal,Mexico city,19.371887,-99.086624,1,0,,,1,1,1,0,,,0,1,0,6,Hostage Taking (Kidnapping),,,,,7,Government (Diplomatic),45,"Diplomatic Personnel (outside of embassy, cons...",Belgian Ambassador Daughter,"Nadine Chaval, daughter",21,Belgium,,,,,,,,,,,,,,,,,23rd of September Communist League,,,,,,,0,,,0,7.0,,,,,,,,,,,,13,Unknown,,,,,,,,,,,,,,,,0.0,,,0.0,,,0,,,,,1,1.0,0.0,,,,Mexico,1,800000.0,,,,,,,,,,,,PGIS,0,1,1,1,
2,197001000001,1970,1,0,,0,,160,Philippines,5,Southeast Asia,Tarlac,Unknown,15.478598,120.599741,4,0,,,1,1,1,0,,,0,1,0,1,Assassination,,,,,10,Journalists & Media,54,Radio Journalist/Staff/Facility,Voice of America,Employee,217,United States,,,,,,,,,,,,,,,,,Unknown,,,,,,,0,,,0,,,,,,,,,,,,,13,Unknown,,,,,,,,,,,,,,,,1.0,,,0.0,,,0,,,,,0,,,,,,,0,,,,,,,,,,,,,PGIS,-9,-9,1,1,
3,197001000002,1970,1,0,,0,,78,Greece,8,Western Europe,Attica,Athens,37.99749,23.762728,1,0,,,1,1,1,0,,,0,1,0,3,Bombing/Explosion,,,,,7,Government (Diplomatic),46,Embassy/Consulate,,U.S. Embassy,217,United States,,,,,,,,,,,,,,,,,Unknown,,,,,,,0,,,0,,,,,,,,,,,,,6,Explosives,16.0,Unknown Explosive Type,,,,,,,,,,,,,Explosive,,,,,,,1,,,,,0,,,,,,,0,,,,,,,,,,,,,PGIS,-9,-9,1,1,
4,197001000003,1970,1,0,,0,,101,Japan,4,East Asia,Fukouka,Fukouka,33.580412,130.396361,1,0,,,1,1,1,-9,,,0,1,0,7,Facility/Infrastructure Attack,,,,,7,Government (Diplomatic),46,Embassy/Consulate,,U.S. Consulate,217,United States,,,,,,,,,,,,,,,,,Unknown,,,,,,,0,,,0,,,,,,,,,,,,,8,Incendiary,,,,,,,,,,,,,,,Incendiary,,,,,,,1,,,,,0,,,,,,,0,,,,,,,,,,,,,PGIS,-9,-9,1,1,


## Exploratory Data Analysis