In [None]:
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt

# Read the dataset; the relative path is resolved against the current
# working directory of the running kernel/process.
df = pd.read_csv(r"diabetes.csv")

# Display dataframe
# A bare `df` expression is only rendered when it is the LAST statement of a
# notebook cell; in the middle of a cell it is evaluated and discarded, so the
# frame has to be passed to display() explicitly to actually be shown.
display(df)

# Display first and last few rows (head()/tail() default to 5 rows each)
display(df.head())
display(df.tail())

# Structural overview, printed in this order: shape as (rows, columns),
# size as the total number of elements, the index, the column labels and
# the data type of each column.
for attribute in ("shape", "size", "index", "columns", "dtypes"):
    print(getattr(df, attribute))

# info() writes its own report (dtype and non-null count per column)
# directly to stdout, whereas describe() returns the summary statistics as
# a table that is rendered with display().
df.info()
summary_stats = df.describe()
display(summary_stats)

# Memory footprint in bytes of the index and of each column.
per_column_bytes = df.memory_usage()
display(per_column_bytes)

# Missing-value inspection. isna()/notna() are the pandas aliases of
# isnull()/notnull() and produce the same boolean masks.
missing_mask = df.isna()
display(missing_mask)        # True where a value is missing
print(missing_mask.sum())    # number of missing values per column
display(df.notna())          # True where a value is present

# Version of the data without any row that contains a missing value;
# the original `df` is left untouched.
df_clean = df.dropna()
print(df_clean.shape)        # (rows, columns) remaining after the drop

# Correlation analysis
# Correlate numeric/boolean columns only. Since pandas 2.0, DataFrame.corr()
# no longer drops non-numeric columns silently and raises if one is present;
# selecting the columns up front behaves the same on every pandas version.
numeric_df = df.select_dtypes(include=["number", "bool"])
correlation = numeric_df.corr()  # pairwise Pearson correlation (pandas default)
display(correlation)

# Heatmap visualization
# Correlation coefficients lie in [-1, 1]. Pinning the colour limits to that
# range keeps the diverging 'coolwarm' map neutral at 0, so positive and
# negative correlations are distinguished by hue; with inferred limits the
# neutral colour would sit at the midpoint of the observed values instead.
plt.figure(figsize=(10, 8))  # leave room for the per-cell annotations
sns.heatmap(
    correlation,
    annot=True,
    fmt=".2f",  # uniform two-decimal labels in every cell
    cmap='coolwarm',
    vmin=-1,
    vmax=1,
)
plt.title("Correlation Heatmap - Diabetes Dataset")
plt.tight_layout()  # avoid clipped tick labels
plt.show()

