## Template to concatenate multiple CSV files into one file.
Use the code below, replacing the paths and column names where needed so they correspond to each set of CSV files.

In [1]:
# Importing dependencies.

from glob import glob
import pandas as pd

In [2]:
# Collect the paths of every CSV file matching the pattern, in sorted order.

csv_pattern = 'raw_dataset/filtered_balance_sheet/*filtered_balance_sheet.csv'
balance_sheet_files = glob(csv_pattern)
balance_sheet_files.sort()
balance_sheet_files

In [3]:
# Read each CSV, tag its rows with the path it came from, then stack all of
# them into one dataframe with a fresh, continuous index.

df = pd.concat(
    [pd.read_csv(path).assign(filename = path) for path in balance_sheet_files],
    ignore_index = True,
)
df

In [4]:
# Remove the columns that are not needed in the final dataset: the
# 'Unnamed: 0' column seen in the concatenated dataframe and the 'filename'
# tag added during concatenation.

unwanted_columns = ['Unnamed: 0', 'filename']
cleaned_df = df.drop(columns = unwanted_columns)
cleaned_df

In [5]:
# Total number of missing values across the whole dataframe
# (per-column counts summed together). If the result is non-zero, drop them.

cleaned_df.isna().sum().sum()

In [6]:
# Swap every cell holding the text 'None' for the number 0.
# NOTE(review): depending on the pandas version / na_values settings,
# read_csv may already have parsed the text "None" as NaN, in which case
# this replacement matches nothing - confirm against the loaded data.

balance_sheet_df = cleaned_df.replace(to_replace = 'None', value = 0)
balance_sheet_df

In [7]:
# Rename column headers. Check the headers of each set of CSV files and add
# one 'old name': 'new name' pair per column to the mapping below.

column_renames = {
    'SYMBOL': 'symbol',
}
balance_sheet_df = balance_sheet_df.rename(columns = column_renames)
balance_sheet_df

In [8]:
# Write the final balance_sheet dataframe to a CSV file, leaving out the
# dataframe index so no extra unnamed column is written.

output_path = 'raw_dataset/balance_sheet.csv'
balance_sheet_df.to_csv(output_path, index = False)