Extracting and Visualizing Stock Data

In [None]:
!pip install yfinance
#!pip install pandas
#!pip install requests
!pip install bs4
#!pip install plotly

In [None]:
from io import StringIO

import pandas as pd
import plotly.graph_objects as go
import requests
import yfinance as yf
from bs4 import BeautifulSoup
from plotly.subplots import make_subplots

Define Graphing Function

In [None]:
def make_graph(stock_data, revenue_data, stock):
    """Show share price and revenue as two stacked panels sharing the x axis.

    Parameters
    ----------
    stock_data : pandas.DataFrame
        Read through its ``Date`` and ``Close`` columns.
    revenue_data : pandas.DataFrame
        Read through its ``Date`` and ``Revenue`` columns.
    stock : str
        Used as the figure title.

    Returns
    -------
    None
        The figure is displayed with ``fig.show()``; nothing is returned.
    """
    fig = make_subplots(
        rows=2,
        cols=1,
        shared_xaxes=True,
        subplot_titles=("Historical Share Price", "Historical Revenue"),
        vertical_spacing=.3,
    )

    # `infer_datetime_format` is deprecated since pandas 2.0 (format inference
    # is now the default), so it is no longer passed to `pd.to_datetime`.
    fig.add_trace(
        go.Scatter(
            x=pd.to_datetime(stock_data.Date),
            y=stock_data.Close.astype("float"),
            name="Share Price",
        ),
        row=1,
        col=1,
    )
    fig.add_trace(
        go.Scatter(
            x=pd.to_datetime(revenue_data.Date),
            y=revenue_data.Revenue.astype("float"),
            name="Revenue",
        ),
        row=2,
        col=1,
    )

    fig.update_xaxes(title_text="Date", row=1, col=1)
    fig.update_xaxes(title_text="Date", row=2, col=1)
    fig.update_yaxes(title_text="Price ($US)", row=1, col=1)
    fig.update_yaxes(title_text="Revenue ($US Millions)", row=2, col=1)
    fig.update_layout(
        showlegend=False,
        height=900,
        title=stock,
        xaxis_rangeslider_visible=True,
    )
    fig.show()

Use yfinance to Extract Stock Data

In [None]:
# Ticker handle for Tesla; the history download happens in the next cell.
tesla = yf.Ticker("TSLA")

In [None]:
# Request the longest price history the ticker offers.
tesla_data = tesla.history(period="max")

In [None]:
# Move the index into a regular column so make_graph can read it by name.
tesla_data = tesla_data.reset_index()

In [None]:
# Preview the first five rows.
tesla_data.head(5)


Use Webscraping to Extract Tesla Revenue Data

In [None]:
import numpy as np

In [None]:


# Download the raw HTML of the Tesla revenue page.
url = 'https://www.macrotrends.net/stocks/charts/TSLA/tesla/revenue'
tesla_response = requests.get(url)
html_data = tesla_response.text



In [None]:
# Parse the downloaded page with the html5lib parser.
beautiful_soup = BeautifulSoup(markup=html_data, features='html5lib')

In [None]:
# Report how many <table> elements the page has and which position(s)
# mention the quarterly revenue heading.
page_tables = beautiful_soup.find_all('table')
print('The number of tables in the url are :', len(page_tables))

for position, table in enumerate(page_tables):
    if 'Tesla Quarterly Revenue' in str(table):
        print('the table we are looking for is in location:', position)

# Empty frame that the row-parsing cell fills in.
tesla_revenue = pd.DataFrame(columns=['Date', 'Revenue'])

In [None]:
# Turn every body row of the table at index 1 into a {"Date", "Revenue"} record.
revenue_rows = []
for row in beautiful_soup.find_all('table')[1].find('tbody').find_all('tr'):
    # Clean the row text once, then split on '$': the part before it is kept
    # as the date, the part after it as the revenue.
    parts = row.text.strip().replace("\t", "").replace('\n', "").split('$')
    date = parts[0]
    # Rows without a '$' have no revenue value; mark them NaN so a later
    # dropna() can discard them.
    revenue = parts[1] if len(parts) > 1 else np.nan
    revenue_rows.append({"Date": date, "Revenue": revenue})

# DataFrame.append was removed in pandas 2.0, and growing a frame row by row
# is quadratic. Build the frame once from the collected records instead,
# which also makes this cell safe to re-run without duplicating rows.
tesla_revenue = pd.DataFrame(revenue_rows, columns=['Date', 'Revenue'])

In [None]:
# Discard rows that contain any missing value.
tesla_revenue = tesla_revenue.dropna()

In [None]:
# Remove thousands separators from the revenue strings.
tesla_revenue['Revenue'] = tesla_revenue['Revenue'].map(
    lambda revenue_text: revenue_text.replace(',', '')
)

In [None]:
# Preview the last five rows.
tesla_revenue.tail()

Use yfinance to Extract GameStop Stock Data

In [None]:


# Ticker handle for GameStop; the history download happens in the next cell.
gme = yf.Ticker("GME")



In [None]:
# Request the longest price history the ticker offers.
gme_data = gme.history(period="max")

In [None]:
# Move the index into a regular column so make_graph can read it by name.
gme_data = gme_data.reset_index()

In [None]:
# Preview the first five rows.
gme_data.head(5)

Use Webscraping to Extract GME Revenue Data

In [None]:
# Download the raw HTML of the GameStop revenue page.
# The URL literal previously began with a stray space; it is removed so the
# value is a well-formed URL wherever it is used.
url2 = 'https://www.macrotrends.net/stocks/charts/GME/gamestop/revenue'
html_data2 = requests.get(url2).text

In [None]:
# Parse the downloaded page with the html5lib parser.
beautiful_soup2 = BeautifulSoup(markup=html_data2, features='html5lib')

In [None]:


# Report how many <table> elements the page has and which position(s)
# mention the quarterly revenue heading.
print('The number of tables in the url are :', len(beautiful_soup2.find_all('table')))

for i,j in enumerate(beautiful_soup2.find_all('table')):
    if ( 'GameStop Quarterly Revenue' in str(j)):
        print('the table we are looking for is in location:', i)

# Parse the table at index 1 into a DataFrame. The markup is wrapped in
# StringIO because passing literal HTML text to read_html is deprecated
# since pandas 2.1; a file-like object works on every pandas version.
gme_revenue = pd.read_html(StringIO(str(beautiful_soup2.find_all('table')[1])), flavor='bs4')[0]
gme_revenue.columns



In [None]:


# NOTE(review): this cell repeats the table lookup and parse of the cell
# before it; it is kept so the notebook's cell layout is unchanged.
print('The number of tables in the url are :', len(beautiful_soup2.find_all('table')))

for i,j in enumerate(beautiful_soup2.find_all('table')):
    if ( 'GameStop Quarterly Revenue' in str(j)):
        print('the table we are looking for is in location:', i)

# The markup is wrapped in StringIO because passing literal HTML text to
# read_html is deprecated since pandas 2.1.
gme_revenue = pd.read_html(StringIO(str(beautiful_soup2.find_all('table')[1])), flavor='bs4')[0]
gme_revenue.columns



In [None]:
# Preview the last five rows.
gme_revenue.tail(5)

In [None]:
# Plot Tesla Stock Graph

In [None]:
# Convert the revenue strings to floats. The `np.float` alias was removed in
# NumPy 1.24 and raises AttributeError there, so the builtin float dtype is
# used instead.
tesla_revenue['Revenue'] = tesla_revenue['Revenue'].astype(float)

In [None]:
# Draw the Tesla price and revenue panels.
make_graph(stock_data=tesla_data, revenue_data=tesla_revenue, stock='Tesla')

In [None]:


# make_graph reads `Date` and `Revenue` columns, but nothing earlier in the
# notebook gives the parsed table those names. Name the first two columns
# positionally; this is a no-op if they are already called that.
gme_revenue = gme_revenue.iloc[:, :2].copy()
gme_revenue.columns = ['Date', 'Revenue']

# Strip currency formatting ('$' and ',') before converting. Values that
# still cannot be parsed (e.g. blank cells) become NaN and are dropped, so
# the conversion does not fail on them.
gme_revenue['Revenue'] = pd.to_numeric(
    gme_revenue['Revenue'].astype(str).str.replace(r'[$,]', '', regex=True),
    errors='coerce',
)
gme_revenue = gme_revenue.dropna(subset=['Revenue'])

make_graph(gme_data, gme_revenue, 'GameStop')

