# Question 1: Use yfinance to Extract Stock Data

In [56]:
import yfinance as yf
import pandas as pd
import requests
from bs4 import BeautifulSoup 
import plotly.graph_objects as go
from plotly.subplots import make_subplots


In [63]:
def make_graph(stock_data, revenue_data, stock):
    """Display a stacked share-price / revenue chart for one company.

    Parameters
    ----------
    stock_data
        Table exposing ``Date`` and ``Close``; ``Close`` is cast to float.
    revenue_data
        Table exposing ``Date`` and ``Revenue``; ``Revenue`` is cast to float,
        so it must not contain characters such as "$" or ",".
    stock
        Text used as the figure title.

    Returns
    -------
    None
        The figure is rendered with ``fig.show()``.
    """
    fig = make_subplots(
        rows=2,
        cols=1,
        shared_xaxes=True,
        subplot_titles=("Historical Share Price", "Historical Revenue"),
        vertical_spacing=.3,
    )

    # `infer_datetime_format` is intentionally not passed: the flag is
    # deprecated in pandas >= 2.0 (it only triggers a warning there) and
    # omitting it parses the same values on older versions.
    price_dates = pd.to_datetime(stock_data.Date)
    revenue_dates = pd.to_datetime(revenue_data.Date)

    fig.add_trace(
        go.Scatter(x=price_dates, y=stock_data.Close.astype("float"), name="Share Price"),
        row=1, col=1,
    )
    fig.add_trace(
        go.Scatter(x=revenue_dates, y=revenue_data.Revenue.astype("float"), name="Revenue"),
        row=2, col=1,
    )

    fig.update_xaxes(title_text="Date", row=1, col=1)
    fig.update_xaxes(title_text="Date", row=2, col=1)
    fig.update_yaxes(title_text="Price ($US)", row=1, col=1)
    fig.update_yaxes(title_text="Revenue ($US Millions)", row=2, col=1)
    fig.update_layout(
        showlegend=False,
        height=900,
        title=stock,
        xaxis_rangeslider_visible=True,
    )
    fig.show()

In [2]:
# Create a yfinance Ticker handle for the symbol "TSLA".
tesla = yf.Ticker("TSLA")

In [3]:
# Read the ticker's `info` attribute into a variable.
# NOTE(review): `tesla_info` is not referenced again in the visible cells — confirm it is needed.
tesla_info = tesla.info

In [4]:
# Request the price history for the longest available period (period="max").
tesla_data = tesla.history(period = "max")

In [6]:
# Move the index into an ordinary column so that make_graph can read
# `stock_data.Date`; rebinding the name avoids mutating the frame in place.
tesla_data = tesla_data.reset_index()

In [7]:
# Preview the first rows of the Tesla price history.
tesla_data.head()

Unnamed: 0,Date,Open,High,Low,Close,Volume,Dividends,Stock Splits
0,2010-06-29,3.8,5.0,3.508,4.778,93831500,0,0.0
1,2010-06-30,5.158,6.084,4.66,4.766,85935500,0,0.0
2,2010-07-01,5.0,5.184,4.054,4.392,41094000,0,0.0
3,2010-07-02,4.6,4.62,3.742,3.84,25699000,0,0.0
4,2010-07-06,4.0,4.0,3.166,3.222,34334500,0,0.0


# Question 2 - Extracting Tesla Revenue Data Using Webscraping

In [15]:
# Revenue page to scrape for Tesla.
url = "https://www.macrotrends.net/stocks/charts/TSLA/tesla/revenue?utm_medium=Exinfluencer&utm_source=Exinfluencer&utm_content=000026UJ&utm_term=10006555&utm_id=NA-SkillsNetwork-Channel-SkillsNetworkCoursesIBMDeveloperSkillsNetworkPY0220ENSkillsNetwork23455606-2021-01-01"

# Fail fast on a hung connection or an HTTP error status instead of handing
# an error page to the parser, which would only surface later as a missing
# <tbody>. The 30-second timeout is an arbitrary upper bound.
response = requests.get(url, timeout=30)
response.raise_for_status()
data = response.text

In [18]:
# Parse the downloaded page text with the "html.parser" backend.
soup = BeautifulSoup(data,"html.parser")

In [30]:
# pandas' own parse of the page tables, kept from the original cell.
# NOTE(review): `tesla_dataFrame` is not used by the extraction below —
# confirm whether this second download of the page is still wanted.
read_html_pandas_data = pd.read_html(url)
tesla_dataFrame = read_html_pandas_data[1]

# Collect one record per row of the first <tbody>, then build the frame once.
# `DataFrame.append` is deprecated (removed in pandas 2.0) and re-copies the
# whole frame on every call, so the records are gathered in a plain list.
tesla_rows = []
for row in soup.find("tbody").find_all("tr"):
    col = row.find_all("td")
    if len(col) < 2:
        # Not a (date, revenue) row; skip rather than raise IndexError.
        continue
    tesla_rows.append({"Date": col[0].text, "Revenue": col[1].text})

tesla_revenue = pd.DataFrame(tesla_rows, columns=["Date", "Revenue"])

Execute the following line to remove the comma and dollar sign from the `Revenue` column.


In [31]:
# Strip thousands separators and dollar signs. `regex=True` is explicit
# because the pattern is a regular expression (alternation plus an escaped
# "$"); with the pandas >= 2.0 default of regex=False it would be matched
# literally and nothing would be removed. The raw string avoids the invalid
# "\$" escape warning.
tesla_revenue["Revenue"] = tesla_revenue["Revenue"].str.replace(r",|\$", "", regex=True)


  tesla_revenue["Revenue"] = tesla_revenue['Revenue'].str.replace(',|\$',"")


Execute the following lines to remove any null values or empty strings in the `Revenue` column.


In [None]:
# Discard rows containing nulls, then keep only rows whose Revenue text is
# non-empty. Done as one chained expression that rebinds the name.
tesla_revenue = tesla_revenue.dropna().loc[lambda frame: frame["Revenue"] != ""]

In [67]:
# Show the last rows of the cleaned Tesla revenue table.
tesla_revenue.tail()

Unnamed: 0,Date,Revenue
12,2009,8806
13,2008,7094
14,2007,5319
15,2006,3092
16,2005,1843


# Question 3: Use yfinance to Extract Stock Data


In [72]:
# Create a yfinance Ticker handle for the symbol "GME".
GameStop = yf.Ticker("GME")

In [73]:
# Read the ticker's `info` attribute into a variable.
# NOTE(review): `gme_info` is not referenced again in the visible cells — confirm it is needed.
gme_info = GameStop.info

In [74]:
# Request the price history for the longest available period (period="max").
gme_data = GameStop.history(period = "max")

In [75]:
# Move the index into an ordinary column so that make_graph can read
# `stock_data.Date`; rebinding the name avoids mutating the frame in place.
gme_data = gme_data.reset_index()

In [77]:
# Preview the most recent rows of the GameStop price history.
gme_data.tail()

Unnamed: 0,Date,Open,High,Low,Close,Volume,Dividends,Stock Splits
5021,2022-01-24,99.019997,102.860001,86.290001,100.150002,6267700,0.0,0.0
5022,2022-01-25,96.919998,104.970001,95.010002,99.790001,3574300,0.0,0.0
5023,2022-01-26,101.099998,119.0,100.309998,103.260002,8325100,0.0,0.0
5024,2022-01-27,104.139999,107.0,92.889999,93.519997,3661100,0.0,0.0
5025,2022-01-28,95.400002,97.989998,87.660004,97.910004,4056889,0.0,0.0


# Question 4: Use Webscraping to Extract GME Revenue Data


In [40]:
# Revenue page to scrape for GameStop.
url = "https://www.macrotrends.net/stocks/charts/GME/gamestop/revenue?utm_medium=Exinfluencer&utm_source=Exinfluencer&utm_content=000026UJ&utm_term=10006555&utm_id=NA-SkillsNetwork-Channel-SkillsNetworkCoursesIBMDeveloperSkillsNetworkPY0220ENSkillsNetwork23455606-2021-01-01"

# Fail fast on a hung connection or an HTTP error status instead of handing
# an error page to the parser, which would only surface later as a missing
# <tbody>. The 30-second timeout is an arbitrary upper bound.
response = requests.get(url, timeout=30)
response.raise_for_status()
data = response.text

In [42]:
# Parse the downloaded page text with the "html.parser" backend.
soup = BeautifulSoup(data,"html.parser")

In [44]:
 gme_revenue = pd.DataFrame(columns = ['Date','Revenue'])
for row in soup.find("tbody").find_all("tr"):
    col = row.find_all("td")
    date = col[0].text
    revenue = col[1].text
    gme_revenue = tesla_revenue.append({'Date':date,'Revenue':revenue}, ignore_index = True)

In [88]:
# Strip thousands separators and dollar signs. `regex=True` is explicit
# because the pattern is a regular expression (alternation plus an escaped
# "$"); with the pandas >= 2.0 default of regex=False it would be matched
# literally and nothing would be removed. The raw string avoids the invalid
# "\$" escape warning.
gme_revenue["Revenue"] = gme_revenue["Revenue"].str.replace(r",|\$", "", regex=True)


The default value of regex will change from True to False in a future version.



In [89]:
# Discard rows containing nulls, then keep only rows whose Revenue text is
# non-empty. Done as one chained expression that rebinds the name.
gme_revenue = gme_revenue.dropna().loc[lambda frame: frame["Revenue"] != ""]

In [90]:
# Show the last rows of the cleaned GameStop revenue table.
gme_revenue.tail()

Unnamed: 0,Date,Revenue
13,2008,7094
14,2007,5319
15,2006,3092
16,2005,1843
17,2005,1843


# Question 5: Plot Tesla Stock Graph


In [81]:
# Plot Tesla's share price and revenue with the make_graph helper; 'Tesla' becomes the figure title.
make_graph(tesla_data, tesla_revenue, 'Tesla')

# Question 6: Plot GameStop Stock Graph


In [91]:
# Plot GameStop's share price and revenue with the make_graph helper; 'GameStop' becomes the figure title.
make_graph(gme_data, gme_revenue, 'GameStop')
