## Google Capstone Process Step

For the following script to work, the user needs a `data` folder in their working directory with two subfolders (`raw` holds the input CSV files; `time_filtered` receives the processed copies):
1. raw
2. time_filtered

![file_tree](https://github.com/MikSm1th/GoogleCapstone/blob/main/file_tree.png?raw=true)

In [1]:
import glob as gl
import pandas as pd
import datetime as dt

In [2]:
def compile_list_of_dataframes(glob_pattern):
    """Collect the files matching a glob pattern, plus their bare file names.

    Despite the name, no DataFrames are loaded here; only paths are gathered.

    Args:
        glob_pattern: Pattern passed to ``glob.glob``, e.g. ``'./data/raw/*.csv'``.

    Returns:
        A tuple ``(paths, filenames)`` of two parallel lists: the matched
        paths exactly as returned by ``glob.glob`` and, for each one, its
        final path component (the file name without any directory part).
        Both lists are empty when nothing matches.
    """
    # Local import so this cell does not rely on the notebook's import cell.
    import os

    raw_df_list = gl.glob(glob_pattern)
    # basename() works for any directory depth; a fixed-width slice only
    # works when the prefix happens to be exactly './data/raw/'.
    raw_df_list_filenames = [os.path.basename(path) for path in raw_df_list]
    return raw_df_list, raw_df_list_filenames

# Pattern selecting every CSV file inside the raw data folder.
glob_pattern = './data/raw/*.csv'
# df_list holds the matched file paths (not loaded DataFrames);
# filenames holds the corresponding file names without the folder prefix.
df_list, filenames = compile_list_of_dataframes(glob_pattern)
# Bare expression: shown as the cell's output when run in a notebook.
df_list

['./data/raw/202201-divvy-tripdata.csv',
 './data/raw/202112-divvy-tripdata.csv',
 './data/raw/202204-divvy-tripdata.csv',
 './data/raw/202202-divvy-tripdata.csv',
 './data/raw/202207-divvy-tripdata.csv',
 './data/raw/202206-divvy-tripdata.csv',
 './data/raw/202108-divvy-tripdata.csv',
 './data/raw/202203-divvy-tripdata.csv',
 './data/raw/202205-divvy-tripdata.csv',
 './data/raw/202110-divvy-tripdata.csv',
 './data/raw/202109-divvy-tripdata.csv',
 './data/raw/202111-divvy-tripdata.csv']

In [3]:
def time_filtered(df):
    """Load a trip CSV and add ride-duration and weekday columns.

    Args:
        df: Path (or any source accepted by ``pandas.read_csv``) of a CSV
            file containing ``started_at`` and ``ended_at`` columns. Note
            that, despite the parameter name, this is not a DataFrame.

    Returns:
        The loaded DataFrame with two extra columns:
        ``ride_length`` (``ended_at`` minus ``started_at``, as timedeltas) and
        ``day_of_week`` (the day name of ``started_at``, e.g. ``'Monday'``).
        The original ``started_at`` / ``ended_at`` columns are left as read.
    """
    temp_df = pd.read_csv(df)

    # Parse the start timestamps once and reuse them for both derived columns.
    started = pd.to_datetime(temp_df.started_at)
    ended = pd.to_datetime(temp_df.ended_at)

    temp_df['ride_length'] = ended - started
    temp_df['day_of_week'] = started.dt.day_name()
    return temp_df

In [4]:
def create_time_filtered_copy(df, file_name, dest_path = './data/time_filtered/'):
    """Write a DataFrame to ``dest_path`` as a CSV file named ``file_name``.

    Args:
        df: DataFrame to save; its index is not written.
        file_name: Name of the CSV file to create inside ``dest_path``.
        dest_path: Destination folder, with or without a trailing path
            separator. It is created if it does not exist yet.
    """
    # Local import so this cell does not rely on the notebook's import cell.
    import os

    # An empty dest_path means "current directory"; makedirs('') would raise.
    if dest_path:
        os.makedirs(dest_path, exist_ok=True)
    # join() inserts the separator only when dest_path lacks one, so both
    # './out' and './out/' resolve to the same target file.
    df.to_csv(os.path.join(dest_path, file_name), index = False)

In [5]:
# Process each raw CSV in turn: add the derived time columns, save the result
# under the same file name in the time-filtered folder, and report progress.
for raw_path, csv_name in zip(df_list, filenames):
    enriched = time_filtered(raw_path)
    create_time_filtered_copy(enriched, csv_name)
    print(csv_name, raw_path)

202201-divvy-tripdata.csv ./data/raw/202201-divvy-tripdata.csv
202112-divvy-tripdata.csv ./data/raw/202112-divvy-tripdata.csv
202204-divvy-tripdata.csv ./data/raw/202204-divvy-tripdata.csv
202202-divvy-tripdata.csv ./data/raw/202202-divvy-tripdata.csv
202207-divvy-tripdata.csv ./data/raw/202207-divvy-tripdata.csv
202206-divvy-tripdata.csv ./data/raw/202206-divvy-tripdata.csv
202108-divvy-tripdata.csv ./data/raw/202108-divvy-tripdata.csv
202203-divvy-tripdata.csv ./data/raw/202203-divvy-tripdata.csv
202205-divvy-tripdata.csv ./data/raw/202205-divvy-tripdata.csv
202110-divvy-tripdata.csv ./data/raw/202110-divvy-tripdata.csv
202109-divvy-tripdata.csv ./data/raw/202109-divvy-tripdata.csv
202111-divvy-tripdata.csv ./data/raw/202111-divvy-tripdata.csv
