In [28]:
def get_data_local_csv():
    """
    Request user input. Read in then clean/transform data from a local CSV file.

    This function asks the user to input a valid stock symbol from the list provided.
    Valid symbols can be entered in lower, upper or mixed case; surrounding
    whitespace is ignored.
    It takes that input and reads in data from the corresponding local .csv file
    ('assets/HistoricalData_<SYMBOL>.csv').
    It then cleans/transforms the data into a pandas dataframe:
    the '$' prefix is removed from the price columns and they are converted to float,
    "Close/Last" is renamed to "Close", "Date" is converted to datetime and
    Symbol, Year, Month, Day, Week Num, Day Num and Day Name columns are added.
    The user only gets three attempts to enter a valid stock symbol from the list provided and
    then the function terminates and prints a message.
    If no corresponding file is found the function terminates and prints a message.

    Note: this function also sets the pandas display options
    'display.max_columns' and 'display.width' as a side effect.

    Parameters
    ----------
    None

    Returns
    -------
    pandas dataframe, or None when no valid symbol was entered or the
    file could not be found.

    Examples
    --------
    Valid inputs: MSFT, aapl
    """

    import pandas as pd

    pd.set_option('display.max_columns', 20)
    pd.set_option('display.width', 1000)

    symbols = ['AAPL', 'AMD', 'AMZN', 'CSCO', 'META', 'MSFT', 'NFLX', 'QCOM', 'SBUX', 'TSLA'] # List of valid stock symbols for input.
    max_attempts = 3 # Limits the number of prompts to avoid an infinite run condition.

    symbol = None
    for attempt in range(max_attempts):
        entry = input("Please enter one of the following symbols!" + str(symbols)).strip().upper() # User input statement.
        if entry in symbols: # Checks for valid input.
            symbol = entry
            break
        if attempt < max_attempts - 1:
            print("You have entered an invalid symbol! Please try again!")
        else: # Informs user that the function is terminating after 3 invalid entries.
            print("Function terminates after three invalid entries!")

    if symbol is None: # No valid symbol after all attempts.
        print("No dataframe returned!")
        return None

    try: # Only the file read can raise FileNotFoundError, so keep the try body minimal.
        df = pd.read_csv('assets/HistoricalData_' + symbol + '.csv') # Read in data from local CSV file.
    except FileNotFoundError:
        print("File Not Found!")
        print("No dataframe returned!")
        return None

    df['Symbol'] = symbol # Adds the "Symbol" column to the dataframe.

    # Remove the '$' and set type to float. regex=False is required: as a
    # regular expression "$" is the end-of-string anchor and would leave the
    # dollar sign in place, making the float conversion fail.
    for column in ('Open', 'High', 'Low', 'Close/Last'):
        df[column] = df[column].str.replace("$", '', regex=False).astype(float)

    df.rename(columns={'Close/Last': 'Close'}, inplace=True) # Renames "Close/Last" column to "Close"
    df['Date'] = pd.to_datetime(df['Date']) # Sets "Date" column to type datetime.
    df['Year'] = df['Date'].dt.year
    df['Month'] = df['Date'].dt.month
    df['Day'] = df['Date'].dt.day
    df['Week Num'] = df['Date'].dt.isocalendar().week.astype(int) # ISO week number, kept as a plain integer column.
    df['Day Num'] = df['Date'].dt.day_of_week
    df['Day Name'] = df['Date'].dt.day_name()

    return df # Returns pandas dataframe on successful execution.
    

In [48]:
# Prompt for a stock symbol, load and clean the matching CSV, and show the result.
# df is None (and a message has been printed) when no dataframe was produced.
df = get_data_local_csv()
print(df)

           Date     Close    Volume      Open      High       Low Symbol  Year  Month  Day  Week Num  Day Num   Day Name
0    2022-09-27  224.3600   7762223  228.6300  230.6400  220.7200   NFLX  2022      9   27        39        1    Tuesday
1    2022-09-26  224.0700   8234285  225.6000  232.7000  223.0100   NFLX  2022      9   26        39        0     Monday
2    2022-09-23  226.4100  11207230  235.1400  236.4499  221.4300   NFLX  2022      9   23        38        4     Friday
3    2022-09-22  237.0500  10017970  235.3500  240.5000  231.6600   NFLX  2022      9   22        38        3   Thursday
4    2022-09-21  236.8700   9166772  242.6700  248.2999  236.6800   NFLX  2022      9   21        38        2  Wednesday
...         ...       ...       ...       ...       ...       ...    ...   ...    ...  ...       ...      ...        ...
2510 2012-10-04    9.5243  91437177    8.9500    9.6100    8.9443   NFLX  2012     10    4        40        3   Thursday
2511 2012-10-03    8.9400  75872

In [49]:
def filter_by_year():
    """
    Request user input. Filter the stock dataframe down to a single year.

    This function calls the get_data_local_csv() function and then asks the user to input a valid year from the list provided.
    It takes that input and filters the dataframe to the rows whose "Year" column equals that year.
    The user only gets three attempts to enter a valid year from the list provided and
    then the function terminates and prints a message.
    If get_data_local_csv() does not return a dataframe, no year is requested and None is returned.

    Parameters
    ----------
    None

    Returns
    -------
    pandas dataframe, or None when no dataframe was loaded or no valid
    year was entered.

    Examples
    --------
    Valid inputs: 2015, 2022
    """

    df = get_data_local_csv()
    if df is None: # The loader has already printed why; avoid prompting and then failing on df["Year"].
        return None

    years = ['2012', '2013', '2014', '2015', '2016', '2017', '2018', '2019', '2020', '2021', '2022'] # List of valid years for input.
    max_attempts = 3 # Limits the number of prompts to avoid an infinite run condition.

    for attempt in range(max_attempts):
        year = input("Please enter one of the following years!" + str(years)).strip() # User input statement.
        if year in years: # Checks for valid input.
            return df[df["Year"] == int(year)] # Returns dataframe filtered to only the requested year.
        if attempt < max_attempts - 1:
            print("You have entered an invalid year! Please try again!")
        else: # Informs user that the function is terminating after 3 invalid entries.
            print("Function terminates after three invalid entries!")

    print("No dataframe returned!")
    return None
    

In [50]:
# Prompt for a stock symbol and then a year, and show only that year's rows.
# This rebinds the notebook-level df to the value filter_by_year() returns.
df = filter_by_year()
print(df)


           Date  Close    Volume  Open   High   Low Symbol  Year  Month  Day  Week Num  Day Num   Day Name
1696 2015-12-31   2.87  11068230  2.97  3.010  2.87    AMD  2015     12   31        53        3   Thursday
1697 2015-12-30   2.98  10046410  2.99  3.040  2.93    AMD  2015     12   30        53        2  Wednesday
1698 2015-12-29   3.00  15292210  3.04  3.060  2.97    AMD  2015     12   29        53        1    Tuesday
1699 2015-12-28   3.00  16048590  2.91  3.020  2.86    AMD  2015     12   28        53        0     Monday
1700 2015-12-24   2.92  11900890  2.88  3.000  2.86    AMD  2015     12   24        52        3   Thursday
...         ...    ...       ...   ...    ...   ...    ...   ...    ...  ...       ...      ...        ...
1943 2015-01-08   2.61  11128830  2.59  2.645  2.56    AMD  2015      1    8         2        3   Thursday
1944 2015-01-07   2.58  12373330  2.63  2.650  2.54    AMD  2015      1    7         2        2  Wednesday
1945 2015-01-06   2.63  13916650  2.6