In [1]:
# Phase 2: yfinance API
# Objective: Map out all the data points. `yfinance` provides asset like SPY.
# 1. Fix the `data_pipeline.py` Bug: First, let's implement the fix for the `TypeError` we discovered.
# 2. Explore the Ticker Object: We will then systematically call every method on the `yf.Ticker('SPY')` object to see the full range of available data, including financials, corporate actions, news, and more.

In [3]:
import yfinance as yf
import pandas as pd
import logging

logging.basicConfig(level=logging.INFO, format = '%(asctime)s - %(levelname)s - %(message)s')

class PatchedLiveDataHandler:
    def __init__(self, ticker: str = "SPY"):
        self.ticker = ticker
        self.tk = yf.Ticker(self.ticker)
        self.data = None
        
    def fetch_data(self, period: str = "5y", interval: str = "1d") -> pd.DataFrame:
        logging.info(f"Fetching {period} of {interval} data for {self.ticker}...")
        self.data = self.tk.history(period=period, interval=interval, auto_adjust = False)
        if self.data.empty:
            logging.error(f"No data fetched for ticker {self.ticker}.")
            return pd.DataFrame()
        
        self.data.columns = [str(col).lower().replace(' ', '_') for col in self.data.columns]
        logging.info(f"Equity data fetched. Shape: {self.data.shape}")
        return self.data


In [4]:
# Prove the fix works"
live_pipeline = PatchedLiveDataHandler(ticker="SPY")
live_data_raw = live_pipeline.fetch_data(period="1y")
print("Successfully fetched data using the patched handler:")
print(live_data_raw.head())

2025-10-02 19:53:30,611 - INFO - Fetching 1y of 1d data for SPY...
2025-10-02 19:53:35,221 - INFO - Equity data fetched. Shape: (250, 9)


Successfully fetched data using the patched handler:
                                 open        high         low       close  \
Date                                                                        
2024-10-03 00:00:00-04:00  567.359985  569.799988  565.489990  567.820007   
2024-10-04 00:00:00-04:00  572.349976  573.359985  568.099976  572.979980   
2024-10-07 00:00:00-04:00  571.299988  571.960022  566.630005  567.799988   
2024-10-08 00:00:00-04:00  570.419983  573.780029  569.530029  573.169983   
2024-10-09 00:00:00-04:00  573.159973  577.710022  572.549988  577.140015   

                            adj_close    volume  dividends  stock_splits  \
Date                                                                       
2024-10-03 00:00:00-04:00  560.999634  40846500        0.0           0.0   
2024-10-04 00:00:00-04:00  566.097656  42939100        0.0           0.0   
2024-10-07 00:00:00-04:00  560.979858  49964700        0.0           0.0   
2024-10-08 00:00:00-04:00  

In [None]:
spy = yf.Ticker('SPY') 

# Systematically explore and print all available data points
print("--- Ticker Info ---")
print(spy.info)

print("--- Actions (Dividends, Splits) ---")
print(spy.actions.head())

print("--- Financials ---")
print(spy.financials)

print("--- Major Holders ---")
print(spy.major_holders)

print("--- Institutional Holders ---")
print(spy.institutional_holders.head())

print("--- Balance Sheet ---")
print(spy.balance_sheet)

print("--- Cashflow ---")
print(spy.cashflow)

print("--- Earnings ---")
print(spy.earnings)

print("--- Analyst Recommendations ---")
print(spy.recommendations.tail())

print("--- Calendar (Upcoming Events) ---")
print(spy.calendar)

print("--- News ---")
for news_item in spy.news[:5]: # Print first 5 news items
    print(f"- {news_item['title']}")

--- Ticker Info ---
{'longBusinessSummary': 'The trust seeks to achieve its investment objective by holding a portfolio of the common stocks that are included in the index, with the weight of each stock in the portfolio substantially corresponding to the weight of such stock in the index.', 'companyOfficers': [], 'executiveTeam': [], 'maxAge': 86400, 'priceHint': 2, 'previousClose': 668.45, 'open': 670.45, 'dayLow': 666.79, 'dayHigh': 670.56, 'regularMarketPreviousClose': 668.45, 'regularMarketOpen': 670.45, 'regularMarketDayLow': 666.79, 'regularMarketDayHigh': 670.56, 'trailingPE': 28.26803, 'volume': 56719366, 'regularMarketVolume': 56719366, 'averageVolume': 70571260, 'averageVolume10days': 79851960, 'averageDailyVolume10Day': 79851960, 'bid': 669.46, 'ask': 669.49, 'bidSize': 8, 'askSize': 5, 'yield': 0.0111, 'totalAssets': 654797701120, 'fiftyTwoWeekLow': 481.8, 'fiftyTwoWeekHigh': 670.56, 'allTimeHigh': 669.37, 'allTimeLow': 42.8125, 'fiftyDayAverage': 646.638, 'twoHundredDayAve

2025-10-02 20:01:15,182 - ERROR - HTTP Error 404: {"quoteSummary":{"result":null,"error":{"code":"Not Found","description":"No fundamentals data found for symbol: SPY"}}}


Empty DataFrame
Columns: []
Index: []
--- Institutional Holders ---
Empty DataFrame
Columns: []
Index: []
--- Balance Sheet ---
Empty DataFrame
Columns: []
Index: []
--- Cashflow ---
Empty DataFrame
Columns: []
Index: []
--- Earnings ---
None
--- Analyst Recommendations ---


2025-10-02 20:01:15,442 - ERROR - HTTP Error 404: {"quoteSummary":{"result":null,"error":{"code":"Not Found","description":"No fundamentals data found for symbol: SPY"}}}


Empty DataFrame
Columns: []
Index: []
--- Calendar (Upcoming Events) ---


2025-10-02 20:01:15,730 - ERROR - HTTP Error 404: {"quoteSummary":{"result":null,"error":{"code":"Not Found","description":"No fundamentals data found for symbol: SPY"}}}


{}
--- News ---


KeyError: 'title'

In [8]:
nvda = yf.Ticker('NVDA') # to test, we used ticker `NVDA` as `SPY` would not have certain details like individual stock ticker does.

# Systematically explore and print all available data points
print("--- Ticker Info ---")
print(nvda.info)

print("--- Actions (Dividends, Splits) ---")
print(nvda.actions.head())

print("--- Financials ---")
print(nvda.financials)

print("--- Major Holders ---")
print(nvda.major_holders)

print("--- Institutional Holders ---")
print(nvda.institutional_holders.head())

print("--- Balance Sheet ---")
print(nvda.balance_sheet)

print("--- Cashflow ---")
print(nvda.cashflow)

print("--- Earnings ---")
print(nvda.earnings)

print("--- Analyst Recommendations ---")
print(nvda.recommendations.tail())

print("--- Calendar (Upcoming Events) ---")
print(nvda.calendar)

print("--- News ---")
for news_item in nvda.news[:5]: # Print first 5 news items
    print(f"- {news_item['title']}")

--- Ticker Info ---
{'address1': '2788 San Tomas Expressway', 'city': 'Santa Clara', 'state': 'CA', 'zip': '95051', 'country': 'United States', 'phone': '408 486 2000', 'website': 'https://www.nvidia.com', 'industry': 'Semiconductors', 'industryKey': 'semiconductors', 'industryDisp': 'Semiconductors', 'sector': 'Technology', 'sectorKey': 'technology', 'sectorDisp': 'Technology', 'longBusinessSummary': "NVIDIA Corporation, a computing infrastructure company, provides graphics and compute and networking solutions in the United States, Singapore, Taiwan, China, Hong Kong, and internationally. The Compute & Networking segment includes its Data Centre accelerated computing platforms and artificial intelligence solutions and software; networking; automotive platforms and autonomous and electric vehicle solutions; Jetson for robotics and other embedded platforms; and DGX Cloud computing services. The Graphics segment offers GeForce GPUs for gaming and PCs, the GeForce NOW game streaming servi



  period  strongBuy  buy  hold  sell  strongSell
0     0m         11   48     4     1           0
1    -1m         11   47     6     1           0
2    -2m         11   48     6     1           0
--- Calendar (Upcoming Events) ---
{'Dividend Date': datetime.date(2025, 10, 1), 'Ex-Dividend Date': datetime.date(2025, 9, 10), 'Earnings Date': [datetime.date(2025, 11, 19)], 'Earnings High': 1.34, 'Earnings Low': 1.14, 'Earnings Average': 1.24214, 'Revenue High': 58340000000, 'Revenue Low': 53461000000, 'Revenue Average': 54603117970}
--- News ---


KeyError: 'title'