In [None]:
# Climate Visibility Analysis Project in Python

# Step 1: Import Libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Step 2: Load Dataset
# Opens the Colab upload dialog; the first uploaded file is parsed as the CSV dataset.
import io

from google.colab import files

uploaded = files.upload()

# `uploaded` is indexed by .values() and wrapped in BytesIO below, i.e. it maps
# each uploaded file to its raw bytes. It is empty when nothing was uploaded,
# so fail with a clear message instead of an opaque IndexError.
if not uploaded:
    raise ValueError("No file was uploaded; please upload a climate CSV file.")

# Only the first uploaded file is used; any additional files are ignored.
df = pd.read_csv(io.BytesIO(next(iter(uploaded.values()))))

# Step 3: Data Cleaning
print("Initial Data Info:")
# DataFrame.info() writes its report to stdout and returns None, so it is
# called directly; wrapping it in print() would emit a stray "None" line.
df.info()
print("\nMissing Values:\n", df.isnull().sum())

# Fill missing values with the column mean for simplicity. Only numeric columns
# have a mean, so gaps in non-numeric columns are left untouched.
df.fillna(df.mean(numeric_only=True), inplace=True)

# Step 4: Exploratory Data Analysis (EDA)
print("\nStatistical Summary:")
print(df.describe())

# Step 5: Visualization

# Plot Temperature over Time (skipped when either column is absent)
if 'Temperature' in df.columns and 'Date' in df.columns:
    # Parse the dates so matplotlib lays them out on a real time axis.
    df['Date'] = pd.to_datetime(df['Date'])
    plt.figure(figsize=(12, 5))
    plt.plot(df['Date'], df['Temperature'], color='orange')
    plt.title("Temperature Over Time")
    plt.xlabel("Date")
    # The degree sign is written as an escape so the label cannot be corrupted
    # by a file-encoding mismatch (it previously rendered as "Â°C").
    plt.ylabel("Temperature (\u00b0C)")
    plt.show()

# Histogram of the Visibility column with a KDE overlay (skipped when the
# column is absent).
if 'Visibility' in df:
    plt.figure(figsize=(10, 5))
    sns.histplot(
        df['Visibility'],
        bins=30,
        kde=True,
        color='blue',
    )
    plt.title("Visibility Distribution")
    plt.xlabel("Visibility (km)")
    plt.show()

# Correlation Heatmap
# Correlation is only defined for numeric data. Restricting to numeric columns
# keeps text columns (and the parsed 'Date' column) from raising an error in
# df.corr() on pandas >= 2.0, where non-numeric columns are no longer dropped
# silently.
plt.figure(figsize=(10, 6))
sns.heatmap(df.corr(numeric_only=True), annot=True, cmap='coolwarm')
plt.title("Correlation Between Climate Variables")
plt.show()

# Step 6: Insights (Example)
# "Low visibility" here means strictly below the dataset's mean visibility.
if {'Visibility', 'Humidity'}.issubset(df.columns):
    below_mean_mask = df['Visibility'] < df['Visibility'].mean()
    low_visibility_days = df[below_mean_mask]
    print(f"Number of low visibility days: {len(low_visibility_days)}")
    print(
        "Average Humidity on low visibility days:",
        low_visibility_days['Humidity'].mean(),
    )




# Project Title: Climate Visibility Analysis

Objective:

Analyze and visualize climate data to study trends and patterns, focusing on variables like temperature, humidity, and visibility. The project will use Python libraries for data analysis and visualization.

Steps:

Import Libraries: Use pandas for data manipulation and matplotlib/seaborn for visualization.

Load Data: Import a climate dataset (CSV file containing temperature, humidity, visibility, etc.).

Data Cleaning: Handle missing values and incorrect data.

Exploratory Data Analysis (EDA): Analyze trends in temperature, humidity, and visibility.

Visualization: Plot line graphs, histograms, and heatmaps to observe correlations and patterns.

Insights: Summarize findings, such as days with low visibility, correlations between humidity and visibility, etc.

Dataset Suggestion:
Use the NOAA Global Climate Dataset or a Kaggle climate/weather dataset (CSV format).