<a href="https://colab.research.google.com/github/MoonlightO2/Nature/blob/main/Greenhouse_Gas_Data.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# **Greenhouse Gas Data**
***Dataset***: https://www.kaggle.com/datasets/unitednations/international-greenhouse-gas-emissions

In [63]:
import pandas as pd
import numpy as np
import matplotlib as plt
import seaborn as sns

In [64]:
file1 = '/content/drive/MyDrive/Projects/Portfolio/Nature & Weather/Greenhouse Gas/Greenhouse Gas Data.csv'
file2 = '/content/drive/MyDrive/Projects/Portfolio/Nature & Weather/Greenhouse Gas/Greenhouse Gas.csv'

In [65]:
data = pd.read_csv(file1)

In [66]:
data.rename(columns={
    'country_or_area': 'Country',
    'year': 'Year',
    'value': 'Value',
    'category': 'Category'
}, inplace=True)

In [67]:
data = data.applymap(lambda x: x.title().replace('_', ' ').strip() if isinstance(x, str) else x)

In [68]:
print('Shape: ', data.shape, '\n')
print('Columns: ', data.columns.tolist(), '\n')
data.head()

Shape:  (8406, 4) 

Columns:  ['Country', 'Year', 'Value', 'Category'] 



Unnamed: 0,Country,Year,Value,Category
0,Australia,2014,393126.946994,Carbon Dioxide Co2 Emissions Without Land Use ...
1,Australia,2013,396913.93653,Carbon Dioxide Co2 Emissions Without Land Use ...
2,Australia,2012,406462.847704,Carbon Dioxide Co2 Emissions Without Land Use ...
3,Australia,2011,403705.528314,Carbon Dioxide Co2 Emissions Without Land Use ...
4,Australia,2010,406200.993184,Carbon Dioxide Co2 Emissions Without Land Use ...


In [69]:
# Mapping dictionary for renaming
rename_dict = {
    'Carbon Dioxide Co2 Emissions Without Land Use Land Use Change And Forestry Lulucf In Kilotonne Co2 Equivalent': 'CO2 Emissions (No LULUCF)',
    'Greenhouse Gas Ghgs Emissions Including Indirect Co2 Without Lulucf In Kilotonne Co2 Equivalent': 'GHGs Emissions (No LULUCF)',
    'Greenhouse Gas Ghgs Emissions Without Land Use Land Use Change And Forestry Lulucf In Kilotonne Co2 Equivalent': 'GHGs Emissions (No Land Use)',
    'Hydrofluorocarbons Hfcs Emissions In Kilotonne Co2 Equivalent': 'HFCs Emissions',
    'Methane Ch4 Emissions Without Land Use Land Use Change And Forestry Lulucf In Kilotonne Co2 Equivalent': 'CH4 Emissions (No LULUCF)',
    'Nitrogen Trifluoride Nf3 Emissions In Kilotonne Co2 Equivalent': 'NF3 Emissions',
    'Nitrous Oxide N2O Emissions Without Land Use Land Use Change And Forestry Lulucf In Kilotonne Co2 Equivalent': 'N2O Emissions (No LULUCF)',
    'Perfluorocarbons Pfcs Emissions In Kilotonne Co2 Equivalent': 'PFCs Emissions',
    'Sulphur Hexafluoride Sf6 Emissions In Kilotonne Co2 Equivalent': 'SF6 Emissions',
    'Unspecified Mix Of Hydrofluorocarbons Hfcs And Perfluorocarbons Pfcs Emissions In Kilotonne Co2 Equivalent': 'Unspecified HFCs/PFCs Mix'
}

# Replace column values using the mapping dictionary
data['Category'] = data['Category'].replace(rename_dict)

# Displaying the DataFrame with renamed column values
print(data)

                       Country  Year          Value                   Category
0                    Australia  2014  393126.946994  CO2 Emissions (No LULUCF)
1                    Australia  2013  396913.936530  CO2 Emissions (No LULUCF)
2                    Australia  2012  406462.847704  CO2 Emissions (No LULUCF)
3                    Australia  2011  403705.528314  CO2 Emissions (No LULUCF)
4                    Australia  2010  406200.993184  CO2 Emissions (No LULUCF)
...                        ...   ...            ...                        ...
8401  United States Of America  1994     593.222570  Unspecified HFCs/PFCs Mix
8402  United States Of America  1993     586.939752  Unspecified HFCs/PFCs Mix
8403  United States Of America  1992     574.414624  Unspecified HFCs/PFCs Mix
8404  United States Of America  1991     566.900968  Unspecified HFCs/PFCs Mix
8405  United States Of America  1990     293.205663  Unspecified HFCs/PFCs Mix

[8406 rows x 4 columns]


In [70]:
for column_name, values in data.items():
    unique_values = set(values)
    num_unique_values = len(unique_values)

    print(f"Column: {column_name}")
    print(f"Unique Values: {unique_values}")
    print(f"Number of Unique Values: {num_unique_values}\n")

Column: Country
Unique Values: {'Croatia', 'Austria', 'Poland', 'Turkey', 'France', 'Malta', 'Belarus', 'Denmark', 'Switzerland', 'Iceland', 'Belgium', 'Spain', 'Norway', 'Czech Republic', 'Australia', 'Portugal', 'Romania', 'Bulgaria', 'Canada', 'Liechtenstein', 'Lithuania', 'Estonia', 'Monaco', 'United Kingdom', 'Slovakia', 'Slovenia', 'Hungary', 'Latvia', 'Russian Federation', 'Sweden', 'Netherlands', 'United States Of America', 'Ireland', 'Japan', 'Cyprus', 'Ukraine', 'Italy', 'New Zealand', 'Luxembourg', 'Greece', 'European Union', 'Germany', 'Finland'}
Number of Unique Values: 43

Column: Year
Unique Values: {1990, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013, 2014}
Number of Unique Values: 25

Column: Value
Unique Values: {32768.5267614461, 1.4652648, 2.34132832272752, 3.71971962315223, 4.72378228524326, 5.344578130212, 4.719000000064, 6.17801344242055, 7.583766724, 9.35877837132, 10.7701

In [71]:
data = data[['Country', 'Year', 'Category', 'Value']]
data.to_csv(file2, index=False)
print('Cleaned file creation successful...!!', file2)

Cleaned file creation successful...!! /content/drive/MyDrive/Projects/Portfolio/Nature & Weather/Greenhouse Gas/Greenhouse Gas.csv
