# Table of Contents

1. Importing Data
2. Data Overview
3. Data Wrangling
4. Exporting Data

---
## 1. Importing Data

In [7]:
# load libraries

import pandas as pd
import os

In [None]:
# define path to data
# Set the US_GAS_DATA_DIR environment variable to point the notebook at a
# different data folder without editing this cell; when it is not set, the
# original local folder below is used.

path = os.environ.get(
    "US_GAS_DATA_DIR",
    "/Users/berkergoz/Desktop/US_Gas_Analysis/02_Data",
)

In [None]:
# define a function to load the data; if the file cannot be read (e.g., file not found),
# the error is printed and None is returned -- adjust `path` accordingly and re-run

def load_data(path, subdir="original_data", filename="gas_data.csv"):
    """
    Load a CSV file from the project data folder into a pandas DataFrame.

    Parameters:
    path (str): The base data directory (the folder, not the CSV file itself).
    subdir (str): Sub-folder of `path` that contains the file.
        Defaults to "original_data".
    filename (str): Name of the CSV file inside `subdir`.
        Defaults to "gas_data.csv".

    Returns:
    pd.DataFrame or None: The loaded data as a DataFrame, or None when the
    file could not be read or parsed (the error is printed).
    """
    csv_path = os.path.join(path, subdir, filename)
    try:
        return pd.read_csv(csv_path)
    # OSError covers missing/unreadable files; ValueError covers pandas'
    # EmptyDataError/ParserError and decoding problems. Anything else is a
    # programming error and is allowed to surface instead of being hidden.
    except (OSError, ValueError) as e:
        print(f"Error loading data: {e}")
        return None

In [9]:
# read the dataset from the configured data folder
df = load_data(path)

# report the outcome (load_data signals a failure by returning None)
print("Failed to load data." if df is None else "Data loaded successfully.")
    

Data loaded successfully.


In [17]:
# configure how pandas renders DataFrames in cell output

for option_name, option_value in [
    ('display.max_columns', None),  # no limit on displayed columns
    ('display.max_rows', None),     # no limit on displayed rows
    ('display.width', 200),         # wider text layout before wrapping
]:
    pd.set_option(option_name, option_value)

## 2. Data Overview

In [18]:
# preview the first five rows to confirm the columns were parsed as expected

print(df.head(n=5))

   year  month duoarea area-name product product-name process            process-name    series                                 series-description   value units
0  2014      1     SFL   FLORIDA    EPG0  Natural Gas     VCS  Commercial Consumption  N3020FL2  Natural Gas Deliveries to Commercial Consumers...  6605.0  MMCF
1  2014      1     SNH    USA-NH    EPG0  Natural Gas     VCS  Commercial Consumption  N3020NH2  Natural Gas Deliveries to Commercial Consumers...  1691.0  MMCF
2  2014      1     SOR    USA-OR    EPG0  Natural Gas     VCS  Commercial Consumption  N3020OR2  Natural Gas Deliveries to Commercial Consumers...  4711.0  MMCF
3  2014      1     SDE    USA-DE    EPG0  Natural Gas     VCS  Commercial Consumption  N3020DE2  Natural Gas Deliveries to Commercial Consumers...  2128.0  MMCF
4  2014      1     SAZ    USA-AZ    EPG0  Natural Gas     VCS  Commercial Consumption  N3020AZ2  Natural Gas Deliveries to Commercial Consumers...  3915.0  MMCF


In [19]:
# preview the last five rows to confirm the file was read through to the end
print(df.tail(n=5))

       year  month duoarea      area-name product product-name process             process-name    series                                 series-description    value units
37989  2024      1     SMN      MINNESOTA    EPG0  Natural Gas     VRS  Residential Consumption  N3010MN2  Minnesota Natural Gas Residential Consumption ...  24866.0  MMCF
37990  2024      1     SNE         USA-NE    EPG0  Natural Gas     VRS  Residential Consumption  N3010NE2  Nebraska Natural Gas Residential Consumption (...   7800.0  MMCF
37991  2024      1     SVA         USA-VA    EPG0  Natural Gas     VRS  Residential Consumption  N3010VA2  Virginia Natural Gas Residential Consumption (...  15938.0  MMCF
37992  2024      1     SCT         USA-CT    EPG0  Natural Gas     VRS  Residential Consumption  N3010CT2  Connecticut Natural Gas Residential Consumptio...   9299.0  MMCF
37993  2024      1     SMA  MASSACHUSETTS    EPG0  Natural Gas     VRS  Residential Consumption  N3010MA2  Massachusetts Natural Gas Residen

## 3. Data Wrangling