# Collect Data

### Objective: 
- use the `yfinance` library to retrieve and download stock data. 

#### Functions in this notebook:
1. download_ticker_data(): downloads the stock data of the past 5 years and saves it. If the data already exists, it will not redownload the data. 
2. do_FAANG_download(): focuses on getting the FAANG stock information, creating the Stock objects, and saving those into the data folder. Filters the downloaded data for cleaner analysis.
3. do_AWS_client_download(): focuses on getting the AWS client stock information, creating the Stock objects, and saving those into the data folder. Filters the downloaded data for cleaner analysis.

In [1]:
import os
# Switch the working directory to the project root so that the relative paths
# used later in this notebook ("data_analysis/...", "data/...") resolve.
# NOTE(review): this is a hard-coded absolute path; the notebook will raise
# here on any machine where this directory does not exist.
os.chdir("/Commjhub/jupyterhub/comm318_fall2019/daniellegin/comm318_F20/comm318_F20_Final_Project")
# Echo the resulting directory as a visible sanity check in the cell output.
print(os.getcwd())

/Commjhub/jupyterhub/comm318_fall2019/daniellegin/comm318_F20/comm318_F20_Final_Project


In [2]:
%run data_analysis/Stock.ipynb

In [3]:
import yfinance as yf
import pandas as pd
import pickle
import pprint

In [4]:
# Never truncate the column list when a DataFrame is displayed.
pd.set_option("display.max_columns", None)

# Notebook-wide pretty-printer for nested structures (4 spaces per nesting level).
pretty = pprint.PrettyPrinter(indent=4)


def download_ticker_data(ticker_list, save_dir, period="5y"):
    """Download and pickle a ``Stock`` object for every ticker not cached yet.

    For each symbol the target file ``<save_dir>/<TICKER> stock.p`` is checked
    first. Only when that file is missing are the ticker's info and price
    history fetched through ``yfinance``, wrapped in a ``Stock`` and pickled
    to that path. Existing files are never overwritten or re-downloaded.

    Args:
        ticker_list: Iterable of ticker symbols; each is upper-cased before use.
        save_dir: Directory that receives the pickle files. It is created
            (including parents) if it does not exist when a file is written.
        period: History window forwarded to ``Ticker.history``. Defaults to
            ``"5y"``.

    Returns:
        None. One progress line per ticker is printed to stdout.

    Note:
        ``Stock`` is not defined in this cell; it is presumably provided by
        the ``data_analysis/Stock.ipynb`` notebook run earlier -- confirm.
    """
    for ticker_name in ticker_list:
        ticker_name = ticker_name.upper()
        stock_file_path = "{}/{} stock.p".format(save_dir, ticker_name)
        print("Attempting to save {}... ".format(ticker_name), end="")

        # Consult the on-disk cache BEFORE touching the network, so tickers
        # that were already saved cost no yfinance requests at all.
        if os.path.exists(stock_file_path):
            print("exists!")
            continue

        ticker = yf.Ticker(ticker_name)
        temp_stock = Stock(
            ticker_name,
            ticker.info,
            ticker.history(period=period)
        )

        # Make sure the destination exists so a finished download is not lost
        # to a FileNotFoundError (an empty save_dir cannot be created; skip it).
        if save_dir:
            os.makedirs(save_dir, exist_ok=True)

        # The context manager guarantees the handle is flushed and closed.
        with open(stock_file_path, "wb") as stock_file:
            pickle.dump(temp_stock, stock_file)
        print("saved!")





In [5]:
def do_FAANG_download():
    """Fetch and store the five FAANG tickers under ``data/FAANG_stocks``.

    Delegates all work to ``download_ticker_data``; returns nothing.
    """
    # NOTE(review): Meta's symbol changed from "FB" to "META" in 2022 -- confirm
    # that "FB" still resolves before relying on a fresh download.
    faang_symbols = ["FB", "AMZN", "AAPL", "NFLX", "GOOG"]
    target_dir = "data/FAANG_stocks"
    download_ticker_data(faang_symbols, target_dir)

In [6]:
def do_AWS_client_download():
    """Fetch and store the five AWS-client tickers under ``data/AWS_client_stocks``.

    Delegates all work to ``download_ticker_data``; returns nothing.
    """
    # NOTE(review): "SUMO" appears to have been delisted in 2023 -- confirm
    # that it still resolves before relying on a fresh download.
    aws_client_symbols = ["DBX", "ADSK", "INTU", "SUMO", "GDDY"]
    target_dir = "data/AWS_client_stocks"
    download_ticker_data(aws_client_symbols, target_dir)