In [2]:
# Necessary Libraries

!pip install yfinance
!pip install requests
!pip install bs4
!pip install plotly

import yfinance as yf
import pandas as pd
import requests
from bs4 import BeautifulSoup
import plotly.graph_objects as go
from plotly.subplots import make_subplots

Collecting bs4
  Downloading bs4-0.0.2-py2.py3-none-any.whl.metadata (411 bytes)
Downloading bs4-0.0.2-py2.py3-none-any.whl (1.2 kB)
Installing collected packages: bs4
Successfully installed bs4-0.0.2


In [71]:
# Question 1 - Extracting Tesla Stock Data Using yfinance - 2 Points

# Function to extract stock data using yfinance
def get_stock_data(ticker):
    stock = yf.Ticker(ticker)
    stock_data = stock.history(period="max")
    stock_data.reset_index(inplace=True)
    return stock_data[['Date', 'Open']]


# Extracting Tesla Stock Data
tesla_stock_data = get_stock_data('TSLA')
tesla_stock_data.head()

Unnamed: 0,Date,Open
0,2010-06-29 00:00:00-04:00,1.266667
1,2010-06-30 00:00:00-04:00,1.719333
2,2010-07-01 00:00:00-04:00,1.666667
3,2010-07-02 00:00:00-04:00,1.533333
4,2010-07-06 00:00:00-04:00,1.333333


In [72]:
# Question 2 - Extracting Tesla Revenue Data Using Webscraping - 1 Point

# URL containing Tesla revenue data
url = 'https://cf-courses-data.s3.us.cloud-object-storage.appdomain.cloud/IBMDeveloperSkillsNetwork-PY0220EN-SkillsNetwork/labs/project/revenue.htm'

response = requests.get(url)
soup = BeautifulSoup(response.content, 'html.parser')

# Find all tables in the page
tables = soup.find_all('table')

# Create a list to hold data temporarily
data = []

# Extract data from the second table (index 1)
for row in tables[1].find_all('tr')[1:]:  # Skip the header row
    cols = row.find_all('td')
    date = cols[0].text.strip()
    revenue = cols[1].text.strip().replace("$", "").replace(",", "")
    data.append({"Date": date, "Revenue": revenue})

# Convert list of dictionaries to a DataFrame
tesla_revenue_data = pd.DataFrame(data)

# Convert 'Date' to datetime format and 'Revenue' to numeric
tesla_revenue_data['Date'] = pd.to_datetime(tesla_revenue_data['Date'])
tesla_revenue_data['Revenue'] = pd.to_numeric(tesla_revenue_data['Revenue'], errors='coerce')

# Display the DataFrame
tesla_revenue_data.tail()


Unnamed: 0,Date,Revenue
49,2010-06-30,28.0
50,2010-03-31,21.0
51,2009-12-31,
52,2009-09-30,46.0
53,2009-06-30,27.0


In [73]:
# Question 3 - Extracting GameStop Stock Data Using yfinance - 2 Points

# Function to extract stock data using yfinance
def get_stock_data(ticker):
    stock = yf.Ticker(ticker)
    stock_data = stock.history(period="max")
    stock_data.reset_index(inplace=True)
    return stock_data[['Date', 'Open']]

# Question 3 - Extracting GameStop Stock Data
gamestop_stock_data = get_stock_data('GME')
gamestop_stock_data.head()

Unnamed: 0,Date,Open
0,2002-02-13 00:00:00-05:00,1.620128
1,2002-02-14 00:00:00-05:00,1.712707
2,2002-02-15 00:00:00-05:00,1.68325
3,2002-02-19 00:00:00-05:00,1.666418
4,2002-02-20 00:00:00-05:00,1.615921


In [74]:
# Question 4 - Extracting GameStop Revenue Data Using Webscraping - 1 Point

url = 'https://cf-courses-data.s3.us.cloud-object-storage.appdomain.cloud/IBMDeveloperSkillsNetwork-PY0220EN-SkillsNetwork/labs/project/stock.html'

response = requests.get(url)
soup = BeautifulSoup(response.content, 'html.parser')

# Find all tables in the page
tables = soup.find_all('table')

# Create a list to hold data temporarily
data = []

# Extract data from the second table (quarterly data)
for row in tables[1].find_all('tr')[1:]:  # Skip the header row
    cols = row.find_all('td')
    date = cols[0].text.strip()
    revenue = cols[1].text.strip().replace("$", "").replace(",", "")
    data.append({"Date": date, "Revenue": revenue})

# Convert list of dictionaries to a DataFrame
gamestop_revenue_data = pd.DataFrame(data)

# Convert 'Date' to datetime format and 'Revenue' to numeric
gamestop_revenue_data['Date'] = pd.to_datetime(gamestop_revenue_data['Date'])
gamestop_revenue_data['Revenue'] = pd.to_numeric(gamestop_revenue_data['Revenue'], errors='coerce')

# Display the DataFrame
gamestop_revenue_data.tail()


Unnamed: 0,Date,Revenue
57,2006-01-31,1667
58,2005-10-31,534
59,2005-07-31,416
60,2005-04-30,475
61,2005-01-31,709


In [70]:
# Question 5 - Tesla Stock and Revenue Dashboard - 2 Points

def make_graph(stock_data, revenue_data, stock):
    fig = make_subplots(rows=2, cols=1, shared_xaxes=True, subplot_titles=("Historical Share Price", "Historical Revenue"), vertical_spacing = .3)
    stock_data_specific = stock_data[stock_data.Date <= '2021--06-14']
    revenue_data_specific = revenue_data[revenue_data.Date <= '2021-04-30']
    fig.add_trace(go.Scatter(x=pd.to_datetime(stock_data_specific.Date, infer_datetime_format=True), y=stock_data_specific.Open.astype("float"), name="Share Price"), row=1, col=1)
    fig.add_trace(go.Scatter(x=pd.to_datetime(revenue_data_specific.Date, infer_datetime_format=True), y=revenue_data_specific.Revenue.astype("float"), name="Revenue"), row=2, col=1)
    fig.update_xaxes(title_text="Date", row=1, col=1)
    fig.update_xaxes(title_text="Date", row=2, col=1)
    fig.update_yaxes(title_text="Price ($US)", row=1, col=1)
    fig.update_yaxes(title_text="Revenue ($US Millions)", row=2, col=1)
    fig.update_layout(showlegend=False,
    height=900,
    title=stock,
    xaxis_rangeslider_visible=True)
    fig.show()
make_graph(tesla_stock_data, tesla_revenue_data, 'Tesla')


The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.


The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.



In [66]:
#Question 6 - GameStop Stock and Revenue Dashboard- 2 Points

def make_graph(stock_data, revenue_data, stock):
    fig = make_subplots(rows=2, cols=1, shared_xaxes=True, subplot_titles=("Historical Share Price", "Historical Revenue"), vertical_spacing = .3)
    stock_data_specific = stock_data[stock_data.Date <= '2021--06-14']
    revenue_data_specific = revenue_data[revenue_data.Date <= '2021-04-30']
    fig.add_trace(go.Scatter(x=pd.to_datetime(stock_data_specific.Date, infer_datetime_format=True), y=stock_data_specific.Open.astype("float"), name="Share Price"), row=1, col=1)
    fig.add_trace(go.Scatter(x=pd.to_datetime(revenue_data_specific.Date, infer_datetime_format=True), y=revenue_data_specific.Revenue.astype("float"), name="Revenue"), row=2, col=1)
    fig.update_xaxes(title_text="Date", row=1, col=1)
    fig.update_xaxes(title_text="Date", row=2, col=1)
    fig.update_yaxes(title_text="Price ($US)", row=1, col=1)
    fig.update_yaxes(title_text="Revenue ($US Millions)", row=2, col=1)
    fig.update_layout(showlegend=False,
    height=900,
    title=stock,
    xaxis_rangeslider_visible=True)
    fig.show()

make_graph(gamestop_stock_data, gamestop_revenue_data, 'Gamestop')


The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.


The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.

