# Data Science Basics Intro
> A collection of basics from the IBM Data Science course

- toc: true
- badges: true
- comments: true
- sticky_rank: 1
- author: Felix
- categories: [ibm, data_science, pandas, numpy]

In [14]:
import yfinance as yf
import pandas as pd
import requests
from bs4 import BeautifulSoup
import plotly.graph_objects as go
from plotly.subplots import make_subplots

def make_graph(stock_data, revenue_data, stock):
    """Display a two-row Plotly figure: share price on top, revenue below.

    Parameters
    ----------
    stock_data : object exposing ``Date`` and ``Close`` columns
        ``Close`` must be castable to float.
    revenue_data : object exposing ``Date`` and ``Revenue`` columns
        ``Revenue`` must be castable to float.
    stock : str
        Text used as the figure title.

    Returns
    -------
    None
        The figure is rendered through ``fig.show()``.
    """
    fig = make_subplots(
        rows=2,
        cols=1,
        shared_xaxes=True,
        subplot_titles=("Historical Share Price", "Historical Revenue"),
        vertical_spacing=.3,
    )

    # pandas >= 2.0 infers one consistent datetime format by default; the old
    # ``infer_datetime_format`` flag is deprecated and only triggers a warning,
    # so it is no longer passed.
    price_dates = pd.to_datetime(stock_data.Date)
    revenue_dates = pd.to_datetime(revenue_data.Date)

    fig.add_trace(
        go.Scatter(x=price_dates, y=stock_data.Close.astype("float"), name="Share Price"),
        row=1, col=1,
    )
    fig.add_trace(
        go.Scatter(x=revenue_dates, y=revenue_data.Revenue.astype("float"), name="Revenue"),
        row=2, col=1,
    )

    fig.update_xaxes(title_text="Date", row=1, col=1)
    fig.update_xaxes(title_text="Date", row=2, col=1)
    fig.update_yaxes(title_text="Price ($US)", row=1, col=1)
    fig.update_yaxes(title_text="Revenue ($US Millions)", row=2, col=1)
    fig.update_layout(
        showlegend=False,
        height=900,
        title=stock,
        xaxis_rangeslider_visible=True,
    )
    fig.show()

In [15]:
# Fetch the full available TSLA price history via yfinance and move the
# index into a regular column so the frame has a plain integer index.
tsla = yf.Ticker('TSLA')
tesla_data = tsla.history(period='max').reset_index()
tesla_data.head()


Unnamed: 0,Date,Open,High,Low,Close,Volume,Dividends,Stock Splits
0,2010-06-29,3.8,5.0,3.51,4.78,93831500,0,0.0
1,2010-06-30,5.16,6.08,4.66,4.77,85935500,0,0.0
2,2010-07-01,5.0,5.18,4.05,4.39,41094000,0,0.0
3,2010-07-02,4.6,4.62,3.74,3.84,25699000,0,0.0
4,2010-07-06,4.0,4.0,3.17,3.22,34334500,0,0.0


In [16]:
# Scrape Tesla revenue figures from the macrotrends revenue page.
url = 'https://www.macrotrends.net/stocks/charts/TSLA/tesla/revenue'
response = requests.get(url, timeout=30)
# Fail here with a clear HTTP error rather than later with an IndexError
# when the expected table is missing from an error page.
response.raise_for_status()
html_data = response.text
soup = BeautifulSoup(html_data, "html5lib")

# The second <table> on the page is taken to be the quarterly revenue table.
quarterly = soup.find_all("table")[1].find("tbody")

# Collect every row first and build the frame once: DataFrame.append was
# removed in pandas 2.0, and appending row by row is quadratic anyway.
records = []
for row in quarterly.find_all("tr"):
    col = row.find_all("td")
    if len(col) < 2:
        # Not a (date, revenue) row; nothing to extract.
        continue
    records.append({
        "Date": col[0].text,
        "Revenue": col[1].text.replace("$", "").replace(",", ""),
    })

tesla_revenue = pd.DataFrame(records, columns=['Date', 'Revenue'])

# Drop missing values and rows whose revenue cell was empty. The original
# row positions are kept as the index, so gaps in the index are expected.
tesla_revenue = tesla_revenue.dropna()
tesla_revenue = tesla_revenue[tesla_revenue['Revenue'] != ""]
tesla_revenue.tail()

Unnamed: 0,Date,Revenue
41,2010-09-30,31
42,2010-06-30,28
43,2010-03-31,21
45,2009-09-30,46
46,2009-06-30,27


In [13]:
# Plotting call left disabled; uncomment to render the share-price and revenue chart.
# make_graph(tesla_data, tesla_revenue, 'Tesla Stock Data')