In [None]:
Project Title: "Impact of Increased Temperature and Drought on Climate Risk & Disaster Management"

Problem Statement: 
Rising global temperatures and more frequent droughts threaten human health, agriculture, water resources, and infrastructure. Traditional disaster 
management is often reactive, causing delays and inefficient resource allocation. There is a pressing need for proactive, data-driven systems that 
can predict risks, assess impacts, and optimize responses during heatwaves and droughts. By leveraging AI/ML with climate and satellite data,
such systems can provide early warnings, accurate damage assessment, and efficient disaster response planning.

Description:
This project develops an AI/ML-powered climate risk management system to predict heatwaves and droughts using NASA, NOAA, and xView2 data. 
It combines time-series forecasting, remote sensing, and ML models to monitor agricultural stress and drought severity. 
Reinforcement learning optimizes resource distribution, while risk maps highlight vulnerable regions. The system empowers governments and NGOs to act 
proactively, reduce economic losses, and strengthen resilience against climate-driven crises.

In [7]:
# Data wrangling
import numpy as np
import pandas as pd
import os


# Data visualization tools
import matplotlib.pyplot as plt
import seaborn as sns

# Utils
from sklearn.model_selection import train_test_split, cross_val_score, GridSearchCV
from sklearn.feature_selection import SelectKBest, chi2, RFE, SelectFromModel
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import GridSearchCV
import pickle
import time

# ML Models
from sklearn.ensemble import RandomForestClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.neighbors import KNeighborsClassifier
from sklearn import tree
from sklearn.cluster import KMeans
from sklearn.cluster import MiniBatchKMeans

# Sampling
from imblearn.over_sampling import SMOTE


# Evaluation Metrics
from sklearn.metrics import accuracy_score, classification_report, confusion_matrix, f1_score, precision_score, recall_score
from sklearn.metrics import roc_auc_score, roc_curve, auc
from sklearn.metrics import silhouette_score

import warnings
warnings.filterwarnings("ignore")





In [13]:
# Directory that holds the input CSV files. Set the DATA_DIR environment
# variable to run the notebook on another machine; when it is unset, the
# original location is used so existing runs keep working unchanged.
DATA_DIR = os.environ.get("DATA_DIR", "C:/Users/athir/Downloads")

# df  -> contents of soil_data.csv
# df1 -> contents of temp_cleaned.csv
df = pd.read_csv(os.path.join(DATA_DIR, "soil_data.csv"))
df1 = pd.read_csv(os.path.join(DATA_DIR, "temp_cleaned.csv"))

In [12]:
print("---- Basic Info ----")
# DataFrame.info() writes its report directly to stdout and returns None, so
# it is called on its own: wrapping it in print() would append a stray "None"
# line after each report.
df.info()
df1.info()

# describe(include='all') summarises every column, not only the numeric ones.
print("\n---- Summary Statistics ----")
print(df.describe(include='all'))
print(df1.describe(include='all'))

---- Basic Info ----
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 3109 entries, 0 to 3108
Data columns (total 32 columns):
 #   Column         Non-Null Count  Dtype  
---  ------         --------------  -----  
 0   fips           3109 non-null   int64  
 1   lat            3109 non-null   float64
 2   lon            3109 non-null   float64
 3   elevation      3109 non-null   int64  
 4   slope1         3109 non-null   float64
 5   slope2         3109 non-null   float64
 6   slope3         3109 non-null   float64
 7   slope4         3109 non-null   float64
 8   slope5         3109 non-null   float64
 9   slope6         3109 non-null   float64
 10  slope7         3109 non-null   float64
 11  slope8         3109 non-null   float64
 12  aspectN        3109 non-null   float64
 13  aspectE        3109 non-null   float64
 14  aspectS        3109 non-null   float64
 15  aspectW        3109 non-null   float64
 16  aspectUnknown  3109 non-null   float64
 17  WAT_LAND       3109 non-null   

In [10]:
# Report the number of null entries found in each column of df.
print("\n---- Missing Values ----")
null_counts = df.isna().sum()
print(null_counts)

# Remove, in place, every row that contains at least one null value.
# The recorded output for this cell lists 0 nulls in every column, so on that
# run this step removed nothing.
df.dropna(axis=0, how="any", inplace=True)


---- Missing Values ----
fips             0
lat              0
lon              0
elevation        0
slope1           0
slope2           0
slope3           0
slope4           0
slope5           0
slope6           0
slope7           0
slope8           0
aspectN          0
aspectE          0
aspectS          0
aspectW          0
aspectUnknown    0
WAT_LAND         0
NVG_LAND         0
URB_LAND         0
GRS_LAND         0
FOR_LAND         0
CULTRF_LAND      0
CULTIR_LAND      0
CULT_LAND        0
SQ1              0
SQ2              0
SQ3              0
SQ4              0
SQ5              0
SQ6              0
SQ7              0
dtype: int64
