Load the credit data from a CSV file using pandas.

In [None]:
import pandas as pd

# Read the credit records from the CSV file into a DataFrame.
credit_data = pd.read_csv(filepath_or_buffer='credit_data.csv')

Inspect the shape of the data to understand its dimensions.

In [None]:
# DataFrame.shape is a (row count, column count) tuple.
dimensions = credit_data.shape
print(dimensions)

Generate summary statistics for the dataset.

In [None]:
# Build the descriptive-statistics table first, then display it.
summary_statistics = credit_data.describe()
print(summary_statistics)

Perform data cleansing by removing rows with missing values.

In [None]:
# Discard every row (axis=0) that has at least one missing value (how='any').
credit_data = credit_data.dropna(axis=0, how='any')

Verify that no missing values remain in the dataset after dropping incomplete rows.

In [None]:
# Count the missing entries in each column and display the tally; a bare
# assignment produces no cell output, so the check would otherwise be invisible.
missing_values = credit_data.isna().sum()
print(missing_values)

Drop any unused columns from the data.

In [None]:
# 'unused_column' looks like a placeholder name. errors='ignore' keeps this
# cell from raising KeyError when the column is absent, e.g. when the cell is
# re-run after the column has already been dropped.
credit_data = credit_data.drop(columns=['unused_column'], errors='ignore')

Fill missing values with the mean of each column.

In [None]:
# Only numeric columns have a mean. numeric_only=True stops DataFrame.mean()
# from raising on text columns (pandas >= 2.0 no longer skips them silently).
# Columns without a computed mean are left untouched by fillna.
credit_data.fillna(credit_data.mean(numeric_only=True), inplace=True)

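Check for outliers in a specified column (replace `column_name` with a real column and define `threshold` as the cutoff value before running this cell).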

In [None]:
# Keep only the rows whose value in the chosen column exceeds the cutoff.
# NOTE(review): 'column_name' appears to be a placeholder and `threshold` is
# not defined in this cell - both must be supplied before this can run.
outliers = credit_data.loc[credit_data['column_name'] > threshold]

Visualize insights using pair plots to see relationships.

In [None]:
import seaborn as sns
import matplotlib.pyplot as plt
# Draw the pairwise-relationship grid for the dataset, then render the figure.
sns.pairplot(data=credit_data)
plt.show()

Analyze demographics by grouping data by age and gender.

In [None]:
# Count the rows for every (age, gender) combination and return the result as
# a flat table with a 'counts' column.
age_gender_analysis = (
    credit_data[['age', 'gender']]
    .groupby(['age', 'gender'])
    .size()
    .reset_index(name='counts')
)

Plot the distribution of the 'duration' variable.

In [None]:
# Histogram of the 'duration' column; the title is set on the Axes that
# seaborn returns, which is the current Axes.
duration_ax = sns.histplot(data=credit_data, x='duration')
duration_ax.set_title('Distribution of Duration')
plt.show()

Visualize credit amounts based on saving account types.

In [None]:
# One box of 'credit_amount' values per 'saving_account' category.
amount_ax = sns.boxplot(data=credit_data, x='saving_account', y='credit_amount')
amount_ax.set_title('Credit Amount by Saving Account')
plt.show()

Visualize the purpose of credit based on saving accounts.

In [None]:
# NOTE(review): 'purpose_of_credit' looks like a categorical label rather than
# a numeric measurement - confirm against the data. A box plot needs a numeric
# axis, so the purposes are counted per saving-account type instead and shown
# as grouped bars (one bar colour per purpose).
sns.countplot(x='saving_account', hue='purpose_of_credit', data=credit_data)
plt.title('Purpose of Credit by Saving Account')
plt.show()

Create a heatmap to visualize the correlation between features.

In [None]:
# Correlation is only defined for numeric features. Selecting them first keeps
# DataFrame.corr() from raising on text columns (pandas >= 2.0 no longer drops
# them silently) and works on older pandas versions as well.
numeric_features = credit_data.select_dtypes(include='number')
correlation_matrix = numeric_features.corr()

# annot=True writes each coefficient inside its cell.
sns.heatmap(correlation_matrix, annot=True)
plt.title('Heatmap of Correlation')
plt.show()