In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Sample Indian demographics data, one entry per state.
# These are placeholder figures: replace with real data from the Census of India.
data = {
    'state': ['Maharashtra', 'Uttar Pradesh', 'Bihar', 'West Bengal', 'Tamil Nadu', 'Madhya Pradesh', 'Rajasthan', 'Karnataka', 'Gujarat', 'Andhra Pradesh'],
    'population': [123144223, 237882725, 124799926, 99609303, 77841267, 85034723, 81032689, 67562686, 64357546, 53903393],
    'literacy_rate': [82.9, 73.0, 63.8, 77.1, 80.3, 78.6, 67.1, 75.6, 79.3, 67.4],
    'rural_population_percent': [54.8, 77.7, 88.7, 68.1, 51.7, 72.4, 75.1, 61.3, 57.4, 66.6],
}

demographics_df = pd.DataFrame(data)

# Sanity checks: when the sample figures are swapped for real data, fail here
# rather than letting a duplicated state or an out-of-range percentage skew
# the statistics and plots computed from this frame.
assert demographics_df['state'].is_unique, "each state must appear exactly once"
assert demographics_df['literacy_rate'].between(0, 100).all(), "literacy_rate must be within 0-100"
assert demographics_df['rural_population_percent'].between(0, 100).all(), "rural_population_percent must be within 0-100"

# 1. Basic Data Exploration
print(demographics_df.head())
# DataFrame.info() writes its summary to stdout itself and returns None, so it
# must not be wrapped in print() -- that would emit a stray "None" line.
demographics_df.info()

In [None]:
# 2. Population Analysis
# Combined population of every state in the frame.
total_population = demographics_df['population'].sum()
print("\nTotal Population of the Listed States:", total_population)

# 3. Literacy Rate Analysis
# Note: this is the plain (unweighted) mean of the per-state rates, so every
# state counts equally regardless of how many people live in it.
average_literacy_rate = demographics_df['literacy_rate'].mean()
print("\nAverage Literacy Rate:", average_literacy_rate)

# 4. Correlation between Literacy Rate and Rural Population
# Series.corr uses the Pearson coefficient unless another method is requested.
correlation = demographics_df['literacy_rate'].corr(demographics_df['rural_population_percent'])
print("\nCorrelation between Literacy Rate and Rural Population Percentage:", correlation)

# 5. Bar Chart of Population by State
# Draw on an explicit Axes instead of relying on pyplot's implicit
# "current figure" state, so the chart does not depend on earlier plotting calls.
fig, ax = plt.subplots(figsize=(12, 6))
sns.barplot(x='state', y='population', data=demographics_df, ax=ax)
ax.set_title('Population by State')
ax.set_xlabel('State')
ax.set_ylabel('Population')

# Rotate the state names and anchor them at their right edge; centre-anchored
# rotated labels drift sideways and no longer line up with their bars.
plt.setp(ax.get_xticklabels(), rotation=45, ha='right', rotation_mode='anchor')
plt.show()

In [None]:
# Scatter plot of literacy rate (x axis) against rural population share
# (y axis), one point per row of demographics_df.
fig, ax = plt.subplots(figsize=(8, 6))
sns.scatterplot(
    data=demographics_df,
    x='literacy_rate',
    y='rural_population_percent',
    ax=ax,
)

# Title and axis labels are applied in a single call on the Axes.
ax.set(
    title='Literacy Rate vs. Rural Population Percentage',
    xlabel='Literacy Rate (%)',
    ylabel='Rural Population (%)',
)

plt.show()