# SpaceX Launch Data - Exploratory Data Analysis

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
%matplotlib inline

In [None]:
# Hard-coded sample of ten launches, written one record per flight so each
# launch can be read across a single row.
_COLUMNS = ('FlightNumber', 'LaunchSite', 'PayloadMass', 'Orbit', 'LaunchSuccess', 'Year')
_LAUNCHES = [
    (1, 'CCAFS LC-40', 3000, 'LEO', 1, 2016),
    (2, 'VAFB SLC-4E', 4000, 'LEO', 0, 2016),
    (3, 'KSC LC-39A', 6000, 'GTO', 1, 2017),
    (4, 'CCAFS SLC-40', 2500, 'LEO', 1, 2017),
    (5, 'CCAFS LC-40', 3000, 'SSO', 0, 2017),
    (6, 'VAFB SLC-4E', 4100, 'SSO', 1, 2018),
    (7, 'KSC LC-39A', 5800, 'GTO', 1, 2018),
    (8, 'CCAFS SLC-40', 2700, 'LEO', 0, 2018),
    (9, 'CCAFS LC-40', 3200, 'GTO', 1, 2019),
    (10, 'KSC LC-39A', 6100, 'LEO', 1, 2019),
]

# Transpose the records into a column-name -> list-of-values mapping, which is
# the shape the DataFrame constructor receives below.
data = {column: list(values) for column, values in zip(_COLUMNS, zip(*_LAUNCHES))}
df = pd.DataFrame(data)
df.head()  # last expression of the cell: the notebook displays the first rows

## Flight Number vs. Launch Site

In [None]:
# Draw one scatter series per launch site so every site gets its own colour
# and legend entry. The y values are the site name repeated once per flight,
# which makes the y axis categorical.
ax = plt.gca()
# sort=False keeps the sites in order of first appearance in the frame.
for site, site_data in df.groupby('LaunchSite', sort=False):
    ax.scatter(site_data['FlightNumber'], [site] * len(site_data), label=site)
ax.set_xlabel('Flight Number')
ax.set_ylabel('Launch Site')
ax.set_title('Flight Number vs Launch Site')
ax.legend()
plt.show()

## Payload Mass vs. Launch Site

In [None]:
# Draw one scatter series per launch site: payload mass on the x axis, the
# site name (repeated once per launch) on a categorical y axis.
ax = plt.gca()
# sort=False keeps the sites in order of first appearance in the frame.
for site, site_data in df.groupby('LaunchSite', sort=False):
    ax.scatter(site_data['PayloadMass'], [site] * len(site_data), label=site)
ax.set_xlabel('Payload Mass (kg)')
ax.set_ylabel('Launch Site')
ax.set_title('Payload vs Launch Site')
ax.legend()
plt.show()

## Success Rate by Orbit Type

In [None]:
# Average the LaunchSuccess column within each orbit type and show the
# per-orbit means as a bar chart.
success_by_orbit = df['LaunchSuccess'].groupby(df['Orbit']).mean()
ax = success_by_orbit.plot.bar(title='Success Rate by Orbit Type')
ax.set_ylabel('Success Rate')
plt.show()

## Launch Success Yearly Trend

In [None]:
# Average the LaunchSuccess column within each year and plot the yearly means
# as a line with a marker at every data point.
success_by_year = df.groupby('Year')['LaunchSuccess'].mean()
success_by_year.plot(kind='line', marker='o', title='Launch Success Yearly Trend')
# Years are whole numbers, but the default tick locator treats the axis as
# continuous and can label it with fractional values (e.g. 2016.5). Pin the
# ticks to the years that actually occur in the data.
plt.xticks(success_by_year.index)
plt.ylabel('Average Success Rate')
plt.xlabel('Year')
plt.show()