## Requirements and Dataset Overview

In [None]:

import pandas as pd
import matplotlib.pyplot as plt

# Raw CSV location of the fivethirtyeight airline-safety dataset on GitHub.
# The literal is split across two lines purely for readability; Python joins
# adjacent string literals into a single string.
dataset_url = (
    'https://raw.githubusercontent.com/fivethirtyeight/data/master/'
    'airline-safety/airline-safety.csv'
)


Airline safety data from the [fivethirtyeight airline-safety dataset](https://github.com/fivethirtyeight/data/tree/master/airline-safety).

## Ingest

In [None]:

# Load the airline-safety CSV from the remote URL into a DataFrame.
# pd.read_csv raises on failure instead of returning None, so a separate
# "is not None" check would never fire and is omitted.
df = pd.read_csv(dataset_url)

# Validate the shape with an explicit exception rather than `assert`:
# assertions are stripped when Python runs with -O, which would let a changed
# upstream file slip through unnoticed.
expected_shape = (56, 8)  # (rows, columns) this notebook was written against
if df.shape != expected_shape:
    raise ValueError(
        f'Unexpected dataset shape {df.shape}; expected {expected_shape}'
    )

# Preview the first rows (rendered as the cell output in a notebook).
df.head()


## Data Analysis

In [None]:

# Descriptive statistics: summarize df with DataFrame.describe() and keep the
# result in general_stats. The bare expression on the last line is what makes
# the notebook render the summary table as the cell output.
general_stats = df.describe()
general_stats


## Data Visualizations

### Histograms for 1985-1999

In [None]:

# Distribution of the incidents_85_99 column, drawn on an explicit Axes
fig, ax = plt.subplots(figsize=(10, 6))
ax.hist(df['incidents_85_99'])
ax.set(
    xlabel='Incidents (1985-1999)',
    ylabel='Frequency',
    title='Frequency of Incidents (1985-1999)',
)
plt.show()


In [None]:

# Distribution of the fatal_accidents_85_99 column, drawn on an explicit Axes
fig, ax = plt.subplots(figsize=(10, 6))
ax.hist(df['fatal_accidents_85_99'])
ax.set(
    xlabel='Fatal Accidents (1985-1999)',
    ylabel='Frequency',
    title='Frequency of Fatal Accidents (1985-1999)',
)
plt.show()


In [None]:

# Distribution of the fatalities_85_99 column, drawn on an explicit Axes
fig, ax = plt.subplots(figsize=(10, 6))
ax.hist(df['fatalities_85_99'])
ax.set(
    xlabel='Fatalities (1985-1999)',
    ylabel='Frequency',
    title='Frequency of Fatalities (1985-1999)',
)
plt.show()


### Histograms for 2000-2014

In [None]:

# Distribution of the incidents_00_14 column, drawn on an explicit Axes
fig, ax = plt.subplots(figsize=(10, 6))
ax.hist(df['incidents_00_14'])
ax.set(
    xlabel='Incidents (2000-2014)',
    ylabel='Frequency',
    title='Frequency of Incidents (2000-2014)',
)
plt.show()


In [None]:

# Distribution of the fatal_accidents_00_14 column, drawn on an explicit Axes
fig, ax = plt.subplots(figsize=(10, 6))
ax.hist(df['fatal_accidents_00_14'])
ax.set(
    xlabel='Fatal Accidents (2000-2014)',
    ylabel='Frequency',
    title='Frequency of Fatal Accidents (2000-2014)',
)
plt.show()


In [None]:

# Distribution of the fatalities_00_14 column, drawn on an explicit Axes
fig, ax = plt.subplots(figsize=(10, 6))
ax.hist(df['fatalities_00_14'])
ax.set(
    xlabel='Fatalities (2000-2014)',
    ylabel='Frequency',
    title='Frequency of Fatalities (2000-2014)',
)
plt.show()


### Bar Charts for 1985-1999

In [None]:

# One bar per airline showing its incidents_85_99 value
fig, ax = plt.subplots(figsize=(15, 10))
ax.bar(df['airline'], df['incidents_85_99'])
ax.set(
    xlabel='Airline',
    ylabel='Incidents (1985-1999)',
    title='Incidents (1985-1999) Across Airlines',
)
# Turn the airline names vertical and shrink them so the labels do not collide
plt.setp(ax.get_xticklabels(), rotation=90, fontsize=8)
plt.show()


In [None]:

# One bar per airline showing its fatal_accidents_85_99 value
fig, ax = plt.subplots(figsize=(15, 10))
ax.bar(df['airline'], df['fatal_accidents_85_99'])
ax.set(
    xlabel='Airline',
    ylabel='Fatal Accidents (1985-1999)',
    title='Fatal Accidents (1985-1999) Across Airlines',
)
# Turn the airline names vertical and shrink them so the labels do not collide
plt.setp(ax.get_xticklabels(), rotation=90, fontsize=8)
plt.show()


In [None]:

# One bar per airline showing its fatalities_85_99 value
fig, ax = plt.subplots(figsize=(15, 10))
ax.bar(df['airline'], df['fatalities_85_99'])
ax.set(
    xlabel='Airline',
    ylabel='Fatalities (1985-1999)',
    title='Fatalities (1985-1999) Across Airlines',
)
# Turn the airline names vertical and shrink them so the labels do not collide
plt.setp(ax.get_xticklabels(), rotation=90, fontsize=8)
plt.show()


### Bar Charts for 2000-2014

In [None]:

# One bar per airline showing its incidents_00_14 value
fig, ax = plt.subplots(figsize=(15, 10))
ax.bar(df['airline'], df['incidents_00_14'])
ax.set(
    xlabel='Airline',
    ylabel='Incidents (2000-2014)',
    title='Incidents (2000-2014) Across Airlines',
)
# Turn the airline names vertical and shrink them so the labels do not collide
plt.setp(ax.get_xticklabels(), rotation=90, fontsize=8)
plt.show()


In [None]:

# One bar per airline showing its fatal_accidents_00_14 value
fig, ax = plt.subplots(figsize=(15, 10))
ax.bar(df['airline'], df['fatal_accidents_00_14'])
ax.set(
    xlabel='Airline',
    ylabel='Fatal Accidents (2000-2014)',
    title='Fatal Accidents (2000-2014) Across Airlines',
)
# Turn the airline names vertical and shrink them so the labels do not collide
plt.setp(ax.get_xticklabels(), rotation=90, fontsize=8)
plt.show()


In [None]:

# One bar per airline showing its fatalities_00_14 value
fig, ax = plt.subplots(figsize=(15, 10))
ax.bar(df['airline'], df['fatalities_00_14'])
ax.set(
    xlabel='Airline',
    ylabel='Fatalities (2000-2014)',
    title='Fatalities (2000-2014) Across Airlines',
)
# Turn the airline names vertical and shrink them so the labels do not collide
plt.setp(ax.get_xticklabels(), rotation=90, fontsize=8)
plt.show()


### Scatter Plot for Incidents vs Fatalities (1985-1999)

In [None]:

# Incidents (x) against fatalities (y) for 1985-1999, one point per row of df
fig, ax = plt.subplots(figsize=(10, 6))
ax.scatter(df['incidents_85_99'], df['fatalities_85_99'], alpha=0.7)
ax.set(
    xlabel='Incidents (1985-1999)',
    ylabel='Fatalities (1985-1999)',
    title='Scatter Plot of Incidents vs Fatalities (1985-1999)',
)
ax.grid(True)
plt.show()


### Scatter Plot for Incidents vs Fatalities (2000-2014)

In [None]:

# Incidents (x) against fatalities (y) for 2000-2014, one point per row of df
fig, ax = plt.subplots(figsize=(10, 6))
ax.scatter(
    df['incidents_00_14'],
    df['fatalities_00_14'],
    alpha=0.7,
    color='orange',
)
ax.set(
    xlabel='Incidents (2000-2014)',
    ylabel='Fatalities (2000-2014)',
    title='Scatter Plot of Incidents vs Fatalities (2000-2014)',
)
ax.grid(True)
plt.show()


### Combined Scatter Plot for Incidents vs Fatalities (1985-1999 vs 2000-2014)

In [None]:

# Overlay both periods on one Axes so they can be compared directly:
# 1985-1999 in blue, 2000-2014 in orange, distinguished by the legend.
fig, ax = plt.subplots(figsize=(10, 6))
ax.scatter(
    df['incidents_85_99'],
    df['fatalities_85_99'],
    alpha=0.7,
    label='1985-1999',
    color='blue',
)
ax.scatter(
    df['incidents_00_14'],
    df['fatalities_00_14'],
    alpha=0.7,
    label='2000-2014',
    color='orange',
)
ax.set(
    xlabel='Incidents',
    ylabel='Fatalities',
    title='Combined Scatter Plot of Incidents vs Fatalities (1985-1999 vs 2000-2014)',
)
ax.legend()
ax.grid(True)
plt.show()
