# Historical Stock/Revenue Data Analysis and Dashboard Development

## Author : Enrico Findley

# Installing and importing dependencies

In [3]:
# Installing dependencies
%pip install yfinance
%pip install pandas
%pip install beautifulsoup4
%pip install html5lib
%pip install lxml
%pip install plotly
%pip install nbformat

# Importing dependencies
import yfinance as yf
import pandas as pd
import pandas as pd
import requests
from bs4 import BeautifulSoup
import plotly.graph_objects as go
from plotly.subplots import make_subplots
import re

Collecting yfinance
  Downloading yfinance-0.2.26-py2.py3-none-any.whl (62 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m63.0/63.0 kB[0m [31m3.6 MB/s[0m eta [36m0:00:00[0m
Collecting multitasking>=0.0.7 (from yfinance)
  Downloading multitasking-0.0.11-py3-none-any.whl (8.5 kB)
Installing collected packages: multitasking, yfinance
Successfully installed multitasking-0.0.11 yfinance-0.2.26
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.


# Use yfinance to Extract Stock Data "TSLA"
**Create a `Ticker` object by passing the stock's ticker symbol to the `Ticker` function. The stock is Tesla, and its ticker symbol is `TSLA`.**

In [4]:
# Ticker handle for Tesla; the price history below is requested through this object.
tesla = yf.Ticker("TSLA")

**Call the ticker object's `history` function to extract the stock information and store it in a dataframe named `tesla_data`. Set the `period` parameter to `max` to get data for the longest available time span.**

In [5]:
# period="max" asks for the longest available span of price history.
tesla_data = tesla.history(period="max")

**Reset the index, save, and display the first five rows of the `tesla_data` dataframe using the `head` function.**

In [6]:
# Move the date index into a regular column so it can be plotted like any
# other field. The guard keeps this cell idempotent: an unconditional
# reset_index would insert a stray "index" column every time the cell is re-run.
if not isinstance(tesla_data.index, pd.RangeIndex):
    tesla_data = tesla_data.reset_index()
tesla_data.head()

Unnamed: 0,Date,Open,High,Low,Close,Volume,Dividends,Stock Splits
0,2010-06-29 00:00:00-04:00,1.266667,1.666667,1.169333,1.592667,281494500,0.0,0.0
1,2010-06-30 00:00:00-04:00,1.719333,2.028,1.553333,1.588667,257806500,0.0,0.0
2,2010-07-01 00:00:00-04:00,1.666667,1.728,1.351333,1.464,123282000,0.0,0.0
3,2010-07-02 00:00:00-04:00,1.533333,1.54,1.247333,1.28,77097000,0.0,0.0
4,2010-07-06 00:00:00-04:00,1.333333,1.333333,1.055333,1.074,103003500,0.0,0.0


**Use Webscraping to Extract Tesla Revenue Data**

In [7]:
url = "https://companiesmarketcap.com/tesla/revenue/"
# A timeout stops the cell from hanging on a stalled connection, and
# raise_for_status() reports HTTP errors here rather than as a confusing
# parsing failure further down.
response = requests.get(url, timeout=30)
response.raise_for_status()
data = response.text
soup = BeautifulSoup(data, 'html5lib')
# Empty frame with the target columns; the parsing cell below fills it in.
tesla_revenue = pd.DataFrame(columns=["Date", "Revenue"])

**Parsing incoming data using BeautifulSoup**

In [8]:
# First we isolate the body of the table which contains all the information.
# Rows are collected into a list and the DataFrame is built once at the end:
# growing a frame with pd.concat inside the loop is quadratic and made the
# cell append a duplicate copy of every row whenever it was re-run.
table_body = soup.find("tbody")
if table_body is None:
    raise ValueError("No <tbody> found in the page; the revenue table is missing or the layout changed.")

# Factors that convert a unit suffix on the page into billions of dollars.
unit_to_billions = {"T": 1000.0, "B": 1.0, "M": 0.001}

records = []
# Then we loop through each row and find all the column values for each row
for row in table_body.find_all('tr'):
    col = row.find_all("td")
    if len(col) < 2:
        # Not a data row (no date/revenue cell pair); nothing to extract.
        continue
    date = col[0].text
    match = re.search(r'\d{4}', date)
    if match:
        # Keep only the four-digit year; otherwise the raw cell text is kept.
        date = match.group()
    revenue_text = col[1].text.replace("$", "").replace(",", "").strip()
    scale = unit_to_billions.get(revenue_text[-1:].upper())
    if scale is None:
        # No recognised suffix: treat the number as already being in billions.
        scale = 1.0
    else:
        revenue_text = revenue_text[:-1]
    revenue = float(revenue_text) * scale
    records.append({'Date': date, 'Revenue': revenue})

# Finally we build the table from all collected rows in one step
tesla_revenue = pd.DataFrame(records, columns=["Date", "Revenue"])

**Display the last five rows of the `tesla_revenue` dataframe using the `tail` function.**

In [9]:
# Quick look at the end of the scraped table to confirm the rows parsed as expected.
tesla_revenue.tail()

Unnamed: 0,Date,Revenue
10,2013,2.01
11,2012,0.41
12,2011,0.2
13,2010,0.11
14,2009,0.11


# Use yfinance to Extract Stock Data "GME"
**Create a `Ticker` object by passing the stock's ticker symbol to the `Ticker` function. The stock is GameStop, and its ticker symbol is `GME`.**

In [10]:
# Ticker handle for GameStop; the price history below is requested through this object.
gamestop = yf.Ticker("GME")

**Call the ticker object's `history` function to extract the stock information and store it in a dataframe named `gamestop_data`. Set the `period` parameter to `max` to get data for the longest available time span.**

In [11]:
# period="max" asks for the longest available span of price history.
gamestop_data = gamestop.history(period="max")

**Reset the index, save, and display the first five rows of the `gamestop_data` dataframe using the `head` function.**

In [12]:
# Move the date index into a regular column so it can be plotted like any
# other field. The guard keeps this cell idempotent: an unconditional
# reset_index would insert a stray "index" column every time the cell is re-run.
if not isinstance(gamestop_data.index, pd.RangeIndex):
    gamestop_data = gamestop_data.reset_index()
gamestop_data.head()

Unnamed: 0,Date,Open,High,Low,Close,Volume,Dividends,Stock Splits
0,2002-02-13 00:00:00-05:00,1.620129,1.69335,1.603296,1.691667,76216000,0.0,0.0
1,2002-02-14 00:00:00-05:00,1.712707,1.716074,1.670626,1.68325,11021600,0.0,0.0
2,2002-02-15 00:00:00-05:00,1.683251,1.687459,1.658002,1.674834,8389600,0.0,0.0
3,2002-02-19 00:00:00-05:00,1.666418,1.666418,1.578047,1.607504,7410400,0.0,0.0
4,2002-02-20 00:00:00-05:00,1.61592,1.66221,1.603296,1.66221,6892800,0.0,0.0


**Use Webscraping to Extract GME Revenue Data**

In [13]:
url = "https://companiesmarketcap.com/gamestop/revenue/"
# A timeout stops the cell from hanging on a stalled connection, and
# raise_for_status() reports HTTP errors here rather than as a confusing
# parsing failure further down.
response = requests.get(url, timeout=30)
response.raise_for_status()
data = response.text
soup = BeautifulSoup(data, 'html5lib')
# Empty frame with the target columns; the parsing cell below fills it in.
gamestop_revenue = pd.DataFrame(columns=["Date", "Revenue"])

**Parsing incoming data using BeautifulSoup**

In [14]:
# First we isolate the body of the table which contains all the information.
# Rows are collected into a list and the DataFrame is built once at the end:
# growing a frame with pd.concat inside the loop is quadratic and made the
# cell append a duplicate copy of every row whenever it was re-run.
table_body = soup.find("tbody")
if table_body is None:
    raise ValueError("No <tbody> found in the page; the revenue table is missing or the layout changed.")

# Factors that convert a unit suffix on the page into billions of dollars.
unit_to_billions = {"T": 1000.0, "B": 1.0, "M": 0.001}

records = []
# Then we loop through each row and find all the column values for each row
for row in table_body.find_all('tr'):
    col = row.find_all("td")
    if len(col) < 2:
        # Not a data row (no date/revenue cell pair); nothing to extract.
        continue
    date = col[0].text
    match = re.search(r'\d{4}', date)
    if match:
        # Keep only the four-digit year; otherwise the raw cell text is kept.
        date = match.group()
    revenue_text = col[1].text.replace("$", "").replace(",", "").strip()
    scale = unit_to_billions.get(revenue_text[-1:].upper())
    if scale is None:
        # No recognised suffix: treat the number as already being in billions.
        scale = 1.0
    else:
        revenue_text = revenue_text[:-1]
    revenue = float(revenue_text) * scale
    records.append({'Date': date, 'Revenue': revenue})

# Finally we build the table from all collected rows in one step
gamestop_revenue = pd.DataFrame(records, columns=["Date", "Revenue"])

**Display the last five rows of the `gamestop_revenue` dataframe using the `tail` function.**

In [15]:
# Quick look at the end of the scraped table to confirm the rows parsed as expected.
gamestop_revenue.tail()

Unnamed: 0,Date,Revenue
17,2006,4.68
18,2005,2.13
19,2004,1.75
20,2003,1.47
21,2002,1.34


# **Plot Tesla Stock Graph**

In [16]:
def make_graph(stock_data, revenue_data, stock):
    """Display share price and revenue for one company as two stacked line charts.

    Parameters
    ----------
    stock_data : pandas.DataFrame
        Must expose ``Date`` and ``Close`` columns; ``Close`` is cast to float.
    revenue_data : pandas.DataFrame
        Must expose ``Date`` and ``Revenue`` columns; ``Revenue`` is cast to float.
    stock : str
        Text used as the figure title.

    Returns
    -------
    None
        The figure is rendered with ``fig.show()`` and not returned.
    """
    fig = make_subplots(
        rows=2,
        cols=1,
        shared_xaxes=True,
        subplot_titles=("Historical Share Price", "Historical Revenue"),
        vertical_spacing=.3,
    )

    # pd.to_datetime is called without infer_datetime_format: that argument is
    # deprecated in pandas 2.x and only triggers a warning on every call.
    price_dates = pd.to_datetime(stock_data.Date)
    revenue_dates = pd.to_datetime(revenue_data.Date)

    fig.add_trace(
        go.Scatter(x=price_dates, y=stock_data.Close.astype("float"), name="Share Price"),
        row=1, col=1,
    )
    fig.add_trace(
        go.Scatter(x=revenue_dates, y=revenue_data.Revenue.astype("float"), name="Revenue"),
        row=2, col=1,
    )

    fig.update_xaxes(title_text="Date", row=1, col=1)
    fig.update_xaxes(title_text="Date", row=2, col=1)
    fig.update_yaxes(title_text="Price ($US)", row=1, col=1)
    fig.update_yaxes(title_text="Revenue ($US Billions)", row=2, col=1)
    fig.update_layout(
        showlegend=False,
        height=900,
        title=stock,
        xaxis_rangeslider_visible=True,
    )
    fig.show()

**Use the make_graph function to graph the Tesla Stock Data, also provide a title for the graph.**

In [17]:
# Price history on top, scraped revenue below; 'Tesla' becomes the figure title.
make_graph(tesla_data,tesla_revenue,'Tesla')

# **Plot GameStop Stock Graph**

In [18]:
# Price history on top, scraped revenue below; 'GameStop' becomes the figure title.
make_graph(gamestop_data,gamestop_revenue,'GameStop')