<a href="https://colab.research.google.com/github/Javediamon/Credit-Card-Approval-Prediction/blob/main/Sustainable_Fashion_Eco_Friendly_Trends_Analysis.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
# IMPORTANT: RUN THIS CELL IN ORDER TO IMPORT YOUR KAGGLE DATA SOURCES,
# THEN FEEL FREE TO DELETE THIS CELL.
# NOTE: THIS NOTEBOOK ENVIRONMENT DIFFERS FROM KAGGLE'S PYTHON
# ENVIRONMENT SO THERE MAY BE MISSING LIBRARIES USED BY YOUR
# NOTEBOOK.
import kagglehub
# Download the Kaggle dataset through kagglehub and keep the returned value
# in a notebook-level variable for later cells.
_dataset_handle = 'waqi786/sustainable-fashion-eco-friendly-trends'
waqi786_sustainable_fashion_eco_friendly_trends_path = kagglehub.dataset_download(
    _dataset_handle
)

print('Data source import complete.')


# **Load Data**

In [None]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import warnings
from sklearn.manifold import TSNE
warnings.filterwarnings("ignore")

# Resolve the CSV location. The hard-coded /kaggle/input path only exists on
# Kaggle; elsewhere (e.g. Colab) fall back to the location returned by the
# kagglehub download cell at the top of the notebook.
# NOTE(review): assumes the CSV sits at the root of the downloaded dataset
# directory, mirroring the /kaggle/input layout - confirm.
import os

_CSV_NAME = "sustainable_fashion_trends_2024.csv"
_kaggle_csv = "/kaggle/input/sustainable-fashion-eco-friendly-trends/" + _CSV_NAME
if os.path.exists(_kaggle_csv):
    _csv_path = _kaggle_csv
else:
    _csv_path = os.path.join(
        waqi786_sustainable_fashion_eco_friendly_trends_path, _CSV_NAME
    )

df = pd.read_csv(_csv_path)

# DataFrame.info() writes its report itself and returns None, so wrapping it
# in print() would only add a stray "None" line to the output.
df.info()
print(df.isnull().sum())
print(df.head(10))

In [None]:
# Replace missing 'Certifications' entries with the literal string 'None'.
# The result is assigned back to the column rather than calling
# fillna(inplace=True) on df['Certifications']: that chained in-place form
# operates on an intermediate object, emits a FutureWarning in pandas 2.x and
# does not update df once Copy-on-Write is enabled.
df['Certifications'] = df['Certifications'].fillna('None')

# Re-check the per-column missing-value counts after the fill.
print(df.isnull().sum())

In [None]:

# Summary statistics as reported by DataFrame.describe().
summary_stats = df.describe()
print(summary_stats)

# Correlation matrix of the float64/int64 columns, drawn as an annotated heatmap.
numeric_df = df.select_dtypes(include=['float64', 'int64'])
correlation_matrix = numeric_df.corr()

plt.figure(figsize=(15, 10))
sns.heatmap(correlation_matrix, annot=True, fmt=".2f")
plt.show()


In [None]:
# Number of rows per sustainability rating.
rating_ax = sns.countplot(x="Sustainability_Rating", data=df)
rating_ax.set_title('Distribution of Sustainability Ratings')
plt.show()

In [None]:
# Histogram (30 bins) of the average price with a KDE curve overlaid.
price_values = df['Average_Price_USD']
price_ax = sns.histplot(price_values, bins=30, kde=True)
price_ax.set_title('Distribution of Average Price (USD)')
plt.show()

In [None]:
# Carbon footprint against water usage, coloured by sustainability rating.
scatter_ax = sns.scatterplot(
    data=df,
    x='Carbon_Footprint_MT',
    y='Water_Usage_Liters',
    hue='Sustainability_Rating',
)
scatter_ax.set_title('Carbon Footprint vs. Water Usage')
plt.show()


In [None]:
# One 30-bin histogram per impact/price column.
hist_columns = [
    'Carbon_Footprint_MT',
    'Water_Usage_Liters',
    'Waste_Production_KG',
    'Average_Price_USD',
]
df[hist_columns].hist(figsize=(15, 10), bins=30)
plt.show()


In [None]:
# Pairwise relationships between the impact/price columns and the rating column.
pairplot_columns = [
    'Carbon_Footprint_MT',
    'Water_Usage_Liters',
    'Waste_Production_KG',
    'Average_Price_USD',
    'Sustainability_Rating',
]
pairplot_frame = df[pairplot_columns]
sns.pairplot(pairplot_frame)
plt.show()


# **Categorical Features Analysis**

In [None]:
# Row count for each sustainability rating category.
sns.countplot(x='Sustainability_Rating', data=df)
plt.show()


In [None]:
# Share of each sustainability rating, labelled with one-decimal percentages.
rating_counts = df['Sustainability_Rating'].value_counts()
rating_counts.plot.pie(autopct='%1.1f%%')
plt.show()


In [None]:
# Country x rating contingency table, drawn as stacked bars (one bar per country).
country_rating_table = pd.crosstab(df['Country'], df['Sustainability_Rating'])
country_rating_table.plot.bar(stacked=True, figsize=(10, 7))
plt.show()


# **Temporal Analysis**

In [None]:
# Mean average price per year, drawn as a line.
yearly_mean_price = df.groupby('Year')['Average_Price_USD'].mean()
trend_ax = yearly_mean_price.plot.line()
trend_ax.set_title('Average Price Over Years')
plt.show()


In [None]:
# Number of rows recorded for each year; x tick labels are turned vertical.
sns.countplot(x='Year', data=df)
plt.xticks(rotation=90)
plt.show()


# **Geographical Analysis**

In [None]:
# Row count per country, with bars ordered by the value_counts() ranking.
country_order = df['Country'].value_counts().index
sns.countplot(data=df, x='Country', order=country_order)
plt.xticks(rotation=90)
plt.show()


In [None]:
# Share of rows per country, labelled with one-decimal percentages.
country_counts = df['Country'].value_counts()
country_counts.plot.pie(autopct='%1.1f%%')
plt.show()


In [None]:
# Average price distribution within each sustainability rating.
sns.violinplot(x='Sustainability_Rating', y='Average_Price_USD', data=df)
plt.show()


In [None]:
# Water usage values grouped by sustainability rating, drawn as a swarm plot.
sns.swarmplot(x='Sustainability_Rating', y='Water_Usage_Liters', data=df)
plt.show()


In [None]:
# One panel per sustainability rating: carbon footprint vs. water usage.
# FacetGrid.map returns the grid, so construction and mapping are chained.
g = sns.FacetGrid(
    df,
    col='Sustainability_Rating',
    height=4,
    aspect=1.2,
).map(sns.scatterplot, 'Carbon_Footprint_MT', 'Water_Usage_Liters')
plt.show()


# **Distribution Analysis**

In [None]:
# Kernel density estimate of the average price, with the area under the curve
# filled. `fill=True` replaces the original `shade=True`, which seaborn has
# deprecated in favour of `fill`.
sns.kdeplot(df['Average_Price_USD'], fill=True)
plt.show()


In [None]:
# Figure-level distribution plot of the carbon footprint with a KDE overlay.
carbon_values = df['Carbon_Footprint_MT']
sns.displot(carbon_values, kde=True)
plt.show()


In [None]:
# Empirical cumulative distribution of waste production.
waste_values = df['Waste_Production_KG']
sns.ecdfplot(waste_values)
plt.show()


# **Comparison Plots**

In [None]:
# One panel per sustainability rating: 30-bin histogram of the average price.
# FacetGrid.map returns the grid, so construction and mapping are chained.
g = sns.FacetGrid(
    df,
    col='Sustainability_Rating',
    height=4,
    aspect=1.2,
).map(sns.histplot, 'Average_Price_USD', bins=30)
plt.show()


In [None]:
# Water usage distribution per country; x tick labels are turned vertical.
sns.boxplot(x='Country', y='Water_Usage_Liters', data=df)
plt.xticks(rotation=90)
plt.show()


In [None]:
# Carbon footprint distribution within each sustainability rating.
carbon_box_ax = sns.boxplot(x='Sustainability_Rating', y='Carbon_Footprint_MT', data=df)
carbon_box_ax.set_title('Carbon Footprint by Sustainability Rating')
plt.show()


In [None]:
# Water usage distribution within each sustainability rating.
water_violin_ax = sns.violinplot(x='Sustainability_Rating', y='Water_Usage_Liters', data=df)
water_violin_ax.set_title('Water Usage by Sustainability Rating')
plt.show()


In [None]:
# Pairwise relationships between the impact/price columns, coloured by rating.
hue_pairplot_columns = [
    'Carbon_Footprint_MT',
    'Water_Usage_Liters',
    'Waste_Production_KG',
    'Average_Price_USD',
    'Sustainability_Rating',
]
sns.pairplot(df[hue_pairplot_columns], hue='Sustainability_Rating')
plt.show()


In [None]:
# Project the four impact/price columns to 2-D with t-SNE and colour the
# points by sustainability rating.
from sklearn.preprocessing import StandardScaler

tsne_feature_columns = [
    'Carbon_Footprint_MT',
    'Water_Usage_Liters',
    'Waste_Production_KG',
    'Average_Price_USD',
]

# t-SNE is driven by distances between rows, and these columns are in
# different units (MT, liters, KG, USD per their names). Standardize them
# first so the column with the largest numeric range does not dominate the
# embedding.
scaled_features = StandardScaler().fit_transform(df[tsne_feature_columns])

tsne = TSNE(n_components=2, random_state=0)
tsne_results = tsne.fit_transform(scaled_features)

# Reuse df's index so the rating column lines up row-for-row with the
# embedding even if df does not carry a default 0..n-1 index.
df_tsne = pd.DataFrame(tsne_results, columns=['Dim1', 'Dim2'], index=df.index)
df_tsne['Sustainability_Rating'] = df['Sustainability_Rating']

tsne_ax = sns.scatterplot(data=df_tsne, x='Dim1', y='Dim2', hue='Sustainability_Rating')
tsne_ax.set_title('t-SNE Visualization of Sustainability Features')
plt.show()
