# 📊 Descriptive and Correlation Analysis of Study Area

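This notebook computes descriptive statistics and a correlation analysis for an Excel workbook containing climate and province data. It is written for Google Colab: the workbook is uploaded in the first code cell, and the analysis reads the sheet named "Location of the study area", which is expected to contain a "Climate Type" column.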


In [None]:
# Upload the workbook through Colab's `files` helper (the `google.colab`
# package is only importable inside a Colab runtime).
from google.colab import files
# `uploaded` is kept for the loading cell, which uses its first key as the
# name of the Excel file to open.
uploaded = files.upload()

In [None]:
import pandas as pd

# `uploaded` comes from the upload cell. It can be empty (for example when no
# file was chosen), so fail with a readable message instead of an IndexError.
if not uploaded:
    raise ValueError(
        "No file was uploaded. Re-run the upload cell and choose an Excel file."
    )

# Only the first uploaded file is analysed.
file_name = next(iter(uploaded))
sheet_name = "Location of the study area"

# The context manager closes the workbook handle once the sheet is parsed.
with pd.ExcelFile(file_name) as xls:
    # Check the sheet up front so the error lists what the workbook contains.
    if sheet_name not in xls.sheet_names:
        raise ValueError(
            f"Sheet {sheet_name!r} not found in {file_name!r}; "
            f"available sheets: {xls.sheet_names}"
        )
    df = xls.parse(sheet_name)

# Preview the first rows as the cell output.
df.head()

In [None]:
# Summary statistics for every column; include='all' covers non-numeric
# columns as well as numeric ones.
print("=== Descriptive Statistics ===")
summary_stats = df.describe(include='all')
print(summary_stats)

In [None]:
import matplotlib.pyplot as plt

# Number of rows per climate type (value_counts skips missing values).
climate_counts = df['Climate Type'].value_counts()

# Style the Axes object returned by pandas instead of going through the
# implicit "current axes" of pyplot.
climate_axes = climate_counts.plot.bar(color='skyblue', edgecolor='black', rot=45)
climate_axes.set_title("Frequency of Climate Types")
climate_axes.set_xlabel("Climate Type")
climate_axes.set_ylabel("Count")
# Horizontal guide lines only, so bar heights are easy to read off.
climate_axes.grid(axis='y', linestyle='--', alpha=0.7)
climate_axes.figure.tight_layout()
plt.show()

In [None]:
from sklearn.preprocessing import LabelEncoder
import seaborn as sns

# Work on a copy so the raw frame shown in earlier cells stays untouched.
df_encoded = df.copy()
for column in df_encoded.columns:
    values = df_encoded[column]
    # Encode every non-numeric column, not only dtype 'object': 'category'
    # and pandas string dtypes would otherwise reach corr() unencoded.
    if pd.api.types.is_numeric_dtype(values):
        continue

    # Keep missing cells as NaN. Passing them to LabelEncoder either raises or
    # turns "missing" into its own category, depending on the scikit-learn
    # version, which would distort the correlations.
    present = values.notna()
    codes = pd.Series(float("nan"), index=values.index, dtype="float64")
    if present.any():
        # astype(str) lets columns that mix text with other types be encoded.
        codes.loc[present] = LabelEncoder().fit_transform(values[present].astype(str))
    df_encoded[column] = codes

# NOTE: LabelEncoder assigns integer codes in sorted label order, so for
# nominal categories the ordering is arbitrary; read correlations that involve
# encoded columns with care.
corr_matrix = df_encoded.corr()
print("=== Correlation Matrix ===")
print(corr_matrix)

plt.figure(figsize=(8, 6))
sns.heatmap(corr_matrix, annot=True, cmap='coolwarm', linewidths=0.5)
plt.title("Correlation Heatmap (Encoded)")
plt.tight_layout()
plt.show()

In [None]:
# Write the correlation matrix computed in the previous cell to a CSV file in
# the current working directory.
corr_matrix.to_csv("correlation_matrix.csv")
# Re-imported here so this cell does not depend on the upload cell having been
# run in the current session; the CSV above is written before this import runs.
from google.colab import files
# Hand the written file to Colab's download helper.
files.download("correlation_matrix.csv")