In [1]:
import yfinance as yf
import pandas as pd
import requests
from bs4 import BeautifulSoup
import plotly.graph_objects as go
from plotly.subplots import make_subplots

In [2]:
import warnings
# Ignore all warnings
warnings.filterwarnings("ignore", category=FutureWarning)

In [3]:
def make_graph(stock_data, revenue_data, stock):
    fig = make_subplots(rows=2, cols=1, shared_xaxes=True, subplot_titles=("Historical Share Price", "Historical Revenue"), vertical_spacing = .3)
    stock_data_specific = stock_data[stock_data.Date <= '2021--06-14']
    revenue_data_specific = revenue_data[revenue_data.Date <= '2021-04-30']
    fig.add_trace(go.Scatter(x=pd.to_datetime(stock_data_specific.Date, infer_datetime_format=True), y=stock_data_specific.Close.astype("float"), name="Share Price"), row=1, col=1)
    fig.add_trace(go.Scatter(x=pd.to_datetime(revenue_data_specific.Date, infer_datetime_format=True), y=revenue_data_specific.Revenue.astype("float"), name="Revenue"), row=2, col=1)
    fig.update_xaxes(title_text="Date", row=1, col=1)
    fig.update_xaxes(title_text="Date", row=2, col=1)
    fig.update_yaxes(title_text="Price ($US)", row=1, col=1)
    fig.update_yaxes(title_text="Revenue ($US Millions)", row=2, col=1)
    fig.update_layout(showlegend=False,
    height=900,
    title=stock,
    xaxis_rangeslider_visible=True)
    fig.show()

In [4]:
Tesla = yf.Ticker("TSLA")

In [5]:
tesla_data = Tesla.history(period="max")
df=tesla_data

In [6]:
df.reset_index(inplace=True)
df.head(5)

Unnamed: 0,Date,Open,High,Low,Close,Volume,Dividends,Stock Splits
0,2010-06-29 00:00:00-04:00,1.266667,1.666667,1.169333,1.592667,281494500,0.0,0.0
1,2010-06-30 00:00:00-04:00,1.719333,2.028,1.553333,1.588667,257806500,0.0,0.0
2,2010-07-01 00:00:00-04:00,1.666667,1.728,1.351333,1.464,123282000,0.0,0.0
3,2010-07-02 00:00:00-04:00,1.533333,1.54,1.247333,1.28,77097000,0.0,0.0
4,2010-07-06 00:00:00-04:00,1.333333,1.333333,1.055333,1.074,103003500,0.0,0.0


In [7]:
url= "https://www.macrotrends.net/stocks/charts/TSLA/tesla/revenue"
html_data = requests.get(url).text

In [8]:
soup = BeautifulSoup(html_data,"html.parser")

In [9]:
import requests
from bs4 import BeautifulSoup
import pandas as pd

url = 'https://www.macrotrends.net/stocks/charts/TSLA/tesla/revenue'
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)'}

try:
    response = requests.get(url, headers=headers)
    response.raise_for_status()  # Lanza una excepción si la solicitud no fue exitosa
except requests.HTTPError as e:
    print(f'Error HTTP: {e.response.status_code}')
except requests.ConnectionError:
    print('Error de conexión')
except requests.Timeout:
    print('La solicitud ha caducado')
except requests.RequestException as e:
    print(f'Error inesperado: {e}')
else:
    soup = BeautifulSoup(response.text, 'html.parser')
    tables = soup.find_all('table')
    if tables:
        table = tables[1]  # Selecciona la segunda tabla
        tesla_revenue = pd.DataFrame(columns=["Date", "Revenue"])
        for row in table.find("tbody").find_all("tr"):
            cols = row.find_all('td')
            date = cols[0].get_text(strip=True)
            revenue = cols[1].get_text(strip=True)
            new_row = pd.DataFrame([[date, revenue]], columns=["Date", "Revenue"])
            tesla_revenue = pd.concat([tesla_revenue, new_row], ignore_index=True)
        tesla_revenue["Revenue"] = tesla_revenue['Revenue'].str.replace('$', '').str.replace(',', '')
        print(tesla_revenue)
    else:
        print('No se encontraron tablas en la página.')


          Date Revenue
0   2024-06-30   25500
1   2024-03-31   21301
2   2023-12-31   25167
3   2023-09-30   23350
4   2023-06-30   24927
..         ...     ...
56  2010-06-30      28
57  2010-03-31      21
58  2009-12-31        
59  2009-09-30      46
60  2009-06-30      27

[61 rows x 2 columns]


In [10]:
tesla_revenue.tail(5)

Unnamed: 0,Date,Revenue
56,2010-06-30,28.0
57,2010-03-31,21.0
58,2009-12-31,
59,2009-09-30,46.0
60,2009-06-30,27.0


In [11]:
GME= yf.Ticker("GME")

In [12]:
GME_share_price_data = GME.history(period="max")
df=GME_share_price_data

In [13]:
df.reset_index(inplace=True)
df.head()

Unnamed: 0,Date,Open,High,Low,Close,Volume,Dividends,Stock Splits
0,2002-02-13 00:00:00-05:00,1.620128,1.69335,1.603296,1.691666,76216000,0.0,0.0
1,2002-02-14 00:00:00-05:00,1.712707,1.716074,1.670626,1.68325,11021600,0.0,0.0
2,2002-02-15 00:00:00-05:00,1.68325,1.687458,1.658002,1.674834,8389600,0.0,0.0
3,2002-02-19 00:00:00-05:00,1.666418,1.666418,1.578047,1.607504,7410400,0.0,0.0
4,2002-02-20 00:00:00-05:00,1.61592,1.66221,1.603296,1.66221,6892800,0.0,0.0


In [14]:
url= "https://www.macrotrends.net/stocks/charts/GME/gamestop/revenue"
html_data = requests.get(url).text

In [15]:
soup = BeautifulSoup(html_data,"html.parser")

In [16]:
import requests
from bs4 import BeautifulSoup
import pandas as pd

# URL de la página web de GameStop
url = 'https://www.macrotrends.net/stocks/charts/GME/gamestop/revenue'

# Encabezados para la solicitud HTTP
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)'}

# Realizar la solicitud HTTP con manejo de errores
try:
    response = requests.get(url, headers=headers)
    response.raise_for_status()  # Lanza una excepción si la solicitud no fue exitosa
except requests.HTTPError as e:
    print(f'Error HTTP: {e.response.status_code}')
except requests.ConnectionError:
    print('Error de conexión')
except requests.Timeout:
    print('La solicitud ha caducado')
except requests.RequestException as e:
    print(f'Error inesperado: {e}')
else:
    # Analizar el contenido HTML de la página
    soup = BeautifulSoup(response.text, 'html.parser')
    
    # Encontrar todas las tablas en la página
    tables = soup.find_all('table')
    
    # Verificar si se encontraron tablas
    if tables:
        # Seleccionar la segunda tabla (índice 1)
        table = tables[1]
        
        # Leer la tabla HTML en un DataFrame de pandas
        gme_revenue = pd.read_html(str(table))[0]
        
        # Renombrar las columnas a 'Date' y 'Revenue'
        gme_revenue.columns = ['Date', 'Revenue']
        
        # Limpiar la columna 'Revenue' eliminando símbolos de dólar y comas
        gme_revenue['Revenue'] = gme_revenue['Revenue'].str.replace('$', '').str.replace(',', '')
        
        # Eliminar filas con valores nulos en 'Revenue'
        gme_revenue.dropna(subset=['Revenue'], inplace=True)
        
        # Convertir todas las columnas a tipo de datos string
        gme_revenue = gme_revenue.astype(str)
        
        # Mostrar el DataFrame resultante
        print(df)
    else:
        print('No se encontraron tablas en la página.')


                          Date       Open       High        Low      Close  \
0    2002-02-13 00:00:00-05:00   1.620128   1.693350   1.603296   1.691666   
1    2002-02-14 00:00:00-05:00   1.712707   1.716074   1.670626   1.683250   
2    2002-02-15 00:00:00-05:00   1.683250   1.687458   1.658002   1.674834   
3    2002-02-19 00:00:00-05:00   1.666418   1.666418   1.578047   1.607504   
4    2002-02-20 00:00:00-05:00   1.615920   1.662210   1.603296   1.662210   
...                        ...        ...        ...        ...        ...   
5706 2024-10-15 00:00:00-04:00  21.450001  21.680000  20.980000  21.270000   
5707 2024-10-16 00:00:00-04:00  21.129999  21.750000  21.030001  21.660000   
5708 2024-10-17 00:00:00-04:00  21.500000  21.660000  21.230000  21.410000   
5709 2024-10-18 00:00:00-04:00  21.410000  21.610001  20.980000  21.219999   
5710 2024-10-21 00:00:00-04:00  21.410000  21.216600  21.100000  21.216600   

        Volume  Dividends  Stock Splits  
0     76216000       

In [17]:
gme_revenue.tail()

Unnamed: 0,Date,Revenue
58,2010-01-31,3524
59,2009-10-31,1835
60,2009-07-31,1739
61,2009-04-30,1981
62,2009-01-31,3492


In [22]:
tesla_revenue.dropna(subset=['Revenue'], inplace=True)


In [25]:
def convertir_a_float(valor):
    try:
        return float(valor)
    except ValueError:
        return None  # O asigna un valor predeterminado

# Aplica la función a la columna 'Revenue'
tesla_revenue['Revenue'] = tesla_revenue['Revenue'].apply(convertir_a_float)


In [27]:
make_graph(tesla_data,tesla_revenue,"Tesla Stock Data")


The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.


The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.



In [19]:
make_graph(GME_share_price_data,gme_revenue,"GameStop Stock Data")


The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.


The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.

