# Exploratory Data Analysis and Basic Visualizations

- Summary statistics and counts
- Plots for missions launched per year, satellite mass distribution, and number of satellites per country


In [None]:
import pandas as pd
import matplotlib.pyplot as plt


In [None]:
# Load both raw CSV datasets (paths are relative) and parse their date columns
# in the same step. errors='coerce' turns unparseable entries into NaT
# instead of raising.
missions = pd.read_csv('../data/ISRO missions - till AUGUST 2022.csv').assign(
    Date=lambda frame: pd.to_datetime(frame['Date'], errors='coerce')
)
satellites = pd.read_csv('../data/satellites.csv').assign(
    launch_date=lambda frame: pd.to_datetime(frame['launch_date'], errors='coerce')
)


In [None]:
# Print the describe() summary of each dataset, heading first, table on the
# following line.
print("Basic statistics (missions):", missions.describe(), sep="\n")
print("Basic statistics (satellites):", satellites.describe(), sep="\n")

# Print the per-column count of missing entries for each dataset.
print("Missing values (missions):", missions.isna().sum(), sep="\n")
print("Missing values (satellites):", satellites.isna().sum(), sep="\n")


In [None]:
# Histogram (30 bins) of the `mass` column; rows with a missing mass are
# dropped first. The Axes returned by Series.hist is used for labelling.
plt.figure(figsize=(10, 5))
mass_axes = satellites['mass'].dropna().hist(bins=30)
mass_axes.set_title('Satellite Mass Distribution')
mass_axes.set_xlabel('Mass (kg)')
mass_axes.set_ylabel('Frequency')
plt.show()


In [None]:
# Bar chart of how many rows carry each distinct `country` value.
# value_counts() orders the bars from most to least frequent.
country_counts = satellites['country'].value_counts()
plt.figure(figsize=(12, 6))
country_axes = country_counts.plot.bar()
country_axes.set_title('Number of Satellites per Country')
country_axes.set_xlabel('Country')
country_axes.set_ylabel('Number of Satellites')
# Tilt the tick labels of the current axes.
plt.xticks(rotation=45)
plt.show()


In [None]:
# Count missions per calendar year and show them as a bar chart in
# chronological order.
#
# NOTE(review): no visible cell creates a 'year' column on `missions`; only
# 'Date' is parsed. Use 'year' when the CSV provides it, otherwise derive the
# year from 'Date' so the cell does not fail with a KeyError. Confirm against
# the CSV schema.
if 'year' in missions.columns:
    mission_years = missions['year']
else:
    # to_datetime is a no-op on an already-parsed column. Unparseable dates
    # become NaT and are dropped; the int cast keeps tick labels as 2019
    # rather than 2019.0.
    mission_years = (
        pd.to_datetime(missions['Date'], errors='coerce')
        .dt.year
        .dropna()
        .astype(int)
    )

# sort_index() orders the bars by year instead of by frequency.
missions_per_year = mission_years.value_counts().sort_index()
plt.figure(figsize=(10, 5))
missions_per_year.plot(kind='bar')
plt.title('Missions Launched Per Year')
plt.xlabel('Year')
plt.ylabel('Missions')
plt.show()
