# The Spark Foundation :  GRIP  Jan-2021

# Task-4 : Exploratory Data Analysis - Terrorism

### Description: As a security/defense analyst, try to find the hot zones of terrorism. What security issues and insights can you derive through EDA?

# Importing libraries

In [None]:
#Importing all Necessary libraries

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Loading Data

In [None]:
# Load the Global Terrorism Database export.
# - encoding='latin-1': the original code reads the file with this encoding.
# - low_memory=False: parse the file in a single pass so each column gets one
#   consistent dtype; the default chunked inference can yield mixed-type
#   columns (and a DtypeWarning) on wide CSV files with sparse text columns.
terror_data = pd.read_csv(
    'globalterrorismdb_0718dist.csv',
    encoding='latin-1',
    low_memory=False,
)

In [None]:
# Preview the first five rows of the raw dataset

terror_data.head(n=5)

In [None]:
# Dimensions of the raw dataset as a (rows, columns) tuple

raw_rows, raw_cols = terror_data.shape
(raw_rows, raw_cols)

In [None]:
# Inspect the data type pandas inferred for each column of the dataset

terror_data.dtypes

# Renaming the columns that are important/required for the analysis

In [None]:
# Map the dataset's original column codes to readable names.
column_aliases = {
    # date of the incident
    'iyear': 'Year',
    'imonth': 'Month',
    'iday': 'Day',
    # location of the incident
    'country_txt': 'Country',
    'region_txt': 'Region',
    'provstate': 'State',
    'city': 'City',
    # nature of the incident
    'attacktype1_txt': 'Attack_Type',
    'targtype1_txt': 'Target_Type',
    'motive': 'Motive',
    'weaptype1_txt': 'Weapon_Type',
    'weapdetail': 'Weapon_Details',
    # casualties and free-text description
    'nkill': 'Kill',
    'nwound': 'Injured',
    'summary': 'Summary',
}

# Rename in place so the existing `terror_data` object carries the new labels.
terror_data.rename(columns=column_aliases, inplace=True)

In [None]:
# Preview the first five rows to confirm the new column names
terror_data.iloc[:5]

# Selecting the important/required columns for analysis

In [None]:
# Columns kept for the analysis, in the order they should appear.
required_columns = [
    'Year', 'Month', 'Day',
    'Country', 'Region', 'State', 'City',
    'Attack_Type', 'Target_Type', 'Motive',
    'Weapon_Type', 'Weapon_Details',
    'Kill', 'Injured', 'Summary',
]

# Replace the full dataset with just those columns.
terror_data = terror_data[required_columns]

In [None]:
# Preview the first five rows of the reduced dataset
terror_data[:5]

In [None]:
# Dimensions of the data after renaming and reducing the columns,
# as a (rows, columns) tuple

(len(terror_data.index), len(terror_data.columns))

## We do not drop the rows that contain null values, because dropping them would lose information that is required for our analysis

In [None]:
# Count the missing values in each column

missing_mask = terror_data.isna()
missing_mask.sum()

# Checking the Hot Zone

In [None]:
# Five countries with the highest number of recorded attacks
print("Hot Zone for terrorism ")
attacks_per_country = terror_data['Country'].value_counts()
attacks_per_country.iloc[:5]

### We can see that Iraq has been attacked by terrorists 24,636 times, more than any other country

In [None]:
# Count plot: number of recorded terrorist attacks for every country.
# `x` is passed by keyword because seaborn 0.12+ accepts only `data`
# positionally; the old positional form raises a TypeError there.

plt.figure(figsize=(30, 12))
sns.countplot(x='Country', data=terror_data)
plt.title('Hot Zone for Terrorism', fontsize=25)
plt.xticks(rotation=90)  # vertical labels so the country names stay legible
plt.show()

# Bar plot of the top 10 countries that are hot zones of terrorism

In [None]:
# Bar plot of the ten countries with the most recorded attacks.
# The counts are computed once and reused for both axes, and `x`/`y` are
# passed by keyword because seaborn 0.12+ rejects them as positional arguments.
top_countries = terror_data['Country'].value_counts().head(10)

plt.figure(figsize=(15, 6))
sns.barplot(x=top_countries.index, y=top_countries.values)
plt.xlabel('Top 10 Country under Terrorism')
plt.ylabel('Terrorism attack Count')
plt.title('Top 10 Country under Terrorism attack ', fontsize=20)
plt.xticks(rotation=90)
plt.show()

## From the above bar plot we can see that Iraq is the hot zone of terrorist attacks

## After Iraq, Pakistan and Afghanistan, India is the next hot zone of terrorist attacks

In [None]:
# Five countries with the lowest number of recorded attacks
print("Country with less terrorism ")
attacks_per_country = terror_data['Country'].value_counts()
attacks_per_country.iloc[-5:]

## From the above values we can see that North Korea and New Hebrides have been attacked the least

In [None]:
# Total number of people killed and injured in each country.
# The value columns are selected with a list (double brackets): indexing a
# GroupBy with a bare tuple of names was removed in pandas 2.0. The grouping
# key 'Country' is not selected, since it is the index of the result rather
# than a quantity to sum.

country1 = terror_data.groupby('Country')[['Kill', 'Injured']].sum()
country1.head()

### From the above values we can see that more people were killed and injured in Afghanistan

In [None]:
# Yearly totals of people killed and injured; show the first eight years.
# The columns are selected with a list because indexing a GroupBy with a bare
# tuple of names was removed in pandas 2.0.
print('Amount of pepople Killed and Injured per year')
year1 = terror_data.groupby('Year')[['Kill', 'Injured']].sum()
year1.head(8)

In [None]:
# Yearly totals of people killed and injured; show the last ten years.
# The columns are selected with a list because indexing a GroupBy with a bare
# tuple of names was removed in pandas 2.0.
print('Amount of pepople Killed and Injured per year')
year2 = terror_data.groupby('Year')[['Kill', 'Injured']].sum()
year2.tail(10)

## From the above we can see the number of people killed and injured per year, and also that the number of killings and injuries increases as the years go on.

In [None]:
# Number of recorded attacks per year, most active years first

year3 = terror_data.loc[:, 'Year'].value_counts()
year3.iloc[:5]

# Count of Terrorism attack per Year

In [None]:
# Count plot: number of recorded attacks in each year.
# `x` is passed by keyword because seaborn 0.12+ accepts only `data`
# positionally; the old positional form raises a TypeError there.
plt.figure(figsize=(15, 6))
sns.countplot(x='Year', data=terror_data)
plt.xlabel('Year of Terrorism attack')
plt.ylabel('Terrorism attack Count')
plt.title('Count of Terrorism attack per Year ', fontsize=20)
plt.xticks(rotation=90)
plt.show()

## Attack_Type and Weapon_Type used against Country

In [None]:
def _most_common(values):
    """Return the most frequent non-null entry of *values* (NaN if there is none).

    When several entries are tied, the first one in sorted order is returned,
    because ``Series.mode`` returns its results sorted.
    """
    modes = values.mode()
    return modes.iat[0] if not modes.empty else np.nan


# Most frequently used attack type and weapon type in each country.
# The previous `.max()` on these text columns returned the alphabetically
# last label, which says nothing about what was actually used most. The
# columns are selected with a list because indexing a GroupBy with a bare
# tuple of names was removed in pandas 2.0.
attack_type = (
    terror_data
    .groupby('Country')[['Attack_Type', 'Weapon_Type']]
    .agg(_most_common)
)
attack_type.head(10)

In [None]:
# How often each attack type appears in the dataset

attack_type_counts = terror_data['Attack_Type'].value_counts()
attack_type_counts

# Number of Attacking Types used for Attack Purpose

In [None]:
# Bar plot of the (up to) ten most frequent attack types.
# The counts are computed once and reused for both axes, and `x`/`y` are
# passed by keyword because seaborn 0.12+ rejects them as positional arguments.
top_attack_types = terror_data['Attack_Type'].value_counts().head(10)

plt.figure(figsize=(15, 6))
sns.barplot(x=top_attack_types.index, y=top_attack_types.values)
plt.xlabel('Attack type used by Terrorist')
plt.ylabel('Attack_Type Count')
plt.title('Top Attacking Type used by Terrorist ', fontsize=20)
plt.xticks(rotation=90)
plt.show()

## From the above bar plot we can see that Bombing/Explosion and Armed Assault are used much more than the other attack types

In [None]:
# How often each weapon type appears in the dataset

weapon_type_counts = terror_data['Weapon_Type'].value_counts()
weapon_type_counts

# Weapon Type used for Attacking Purpose

In [None]:
# Bar plot of the (up to) fifteen most frequent weapon types.
# The counts are computed once and reused for both axes, and `x`/`y` are
# passed by keyword because seaborn 0.12+ rejects them as positional arguments.
top_weapon_types = terror_data['Weapon_Type'].value_counts().head(15)

plt.figure(figsize=(15, 6))
sns.barplot(x=top_weapon_types.index, y=top_weapon_types.values)
plt.xlabel('Weapon type used by Terrorist')
plt.ylabel('Weapon_Type Count')
plt.title('Top Weapon Type used by Terrorist ', fontsize=20)
plt.xticks(rotation=90)
plt.show()

## From the above bar plot we can see that explosives and firearms are used much more than the other weapon types

In [None]:
# Number of recorded attacks per region, most affected regions first

region = terror_data.loc[:, 'Region'].value_counts()
region.iloc[:5]

# Regions in which the most attacks have happened

In [None]:
# Count plot: number of recorded attacks in each region.
# `x` is passed by keyword because seaborn 0.12+ accepts only `data`
# positionally; the old positional form raises a TypeError there.
plt.figure(figsize=(15, 6))
sns.countplot(x='Region', data=terror_data)
plt.xlabel('Region of Terrorism attack')
plt.ylabel('Region attack Count')
plt.title('Region has Maximun Terrorist Attack ', fontsize=20)
plt.xticks(rotation=90)
plt.show()

## From the above count plot we can see that the Middle East & North Africa and South Asia regions are attacked the most

In [None]:
# Number of recorded attacks per city, most affected cities first

city = terror_data.loc[:, 'City'].value_counts()
city.head(n=5)

# Cities with the maximum number of attacks

In [None]:
# Bar plot of the fifteen city labels with the most recorded attacks.
# The counts are computed once and reused for both axes, and `x`/`y` are
# passed by keyword because seaborn 0.12+ rejects them as positional arguments.
top_cities = terror_data['City'].value_counts().head(15)

plt.figure(figsize=(15, 6))
sns.barplot(x=top_cities.index, y=top_cities.values)
plt.xlabel('City with most attack')
plt.ylabel('Count')
plt.title('City which is Hot Zone ', fontsize=20)
plt.xticks(rotation=90)
plt.show()

### From the above bar plot we can see that Baghdad, Karachi and Lima are the cities attacked most often

# Thanking You