# S&P 500 by date

Get snapshot of S&P 500 components at a given date

In [11]:
from datetime import datetime
import os
import shutil
import pandas as pd

pd.options.mode.chained_assignment = None  # default='warn'
pd.set_option('display.max_rows', 600)

# -*- encoding: utf-8 -*-
%matplotlib inline

In [12]:
%%javascript
IPython.OutputArea.prototype._should_scroll = function(lines) {
    return false;
}

<IPython.core.display.Javascript object>

In [13]:
# Date to use for snapshot of S&P 500 components.
snap_shot = '2020-10-23'

In [14]:
def get_table(filename):

    if os.path.isfile(filename):
        df = pd.read_csv(filename, index_col='date')
        return df

In [15]:
filename = 'S&P 500 Historical Components & Changes(03-10-2025).csv'
df = get_table(filename)
df.tail()

Unnamed: 0_level_0,tickers
date,Unnamed: 1_level_1
2024-09-23,"A,AAPL,ABBV,ABNB,ABT,ACGL,ACN,ADBE,ADI,ADM,ADP..."
2024-09-30,"A,AAPL,ABBV,ABNB,ABT,ACGL,ACN,ADBE,ADI,ADM,ADP..."
2024-10-01,"A,AAPL,ABBV,ABNB,ABT,ACGL,ACN,ADBE,ADI,ADM,ADP..."
2024-11-26,"A,AAPL,ABBV,ABNB,ABT,ACGL,ACN,ADBE,ADI,ADM,ADP..."
2024-12-23,"A,AAPL,ABBV,ABNB,ABT,ACGL,ACN,ADBE,ADI,ADM,ADP..."


In [16]:
# Convert ticker column from csv to list, then sort.
df['tickers'] = df['tickers'].apply(lambda x: sorted(x.split(',')))
df.tail()

Unnamed: 0_level_0,tickers
date,Unnamed: 1_level_1
2024-09-23,"[A, AAPL, ABBV, ABNB, ABT, ACGL, ACN, ADBE, AD..."
2024-09-30,"[A, AAPL, ABBV, ABNB, ABT, ACGL, ACN, ADBE, AD..."
2024-10-01,"[A, AAPL, ABBV, ABNB, ABT, ACGL, ACN, ADBE, AD..."
2024-11-26,"[A, AAPL, ABBV, ABNB, ABT, ACGL, ACN, ADBE, AD..."
2024-12-23,"[A, AAPL, ABBV, ABNB, ABT, ACGL, ACN, ADBE, AD..."


In [17]:
# Number of symbols in the first row.
l = list(df['tickers'].head(1))[0]
len(l)

487

In [18]:
# Get the synbols on snap_shot date by filtering df by rows before or on the snap_shot date,
# then picking the last row.
df2 = df[df.index <= snap_shot]
last_row = df2.tail(1)
last_row

Unnamed: 0_level_0,tickers
date,Unnamed: 1_level_1
2020-10-12,"[A, AAL, AAP, AAPL, ABBV, ABC, ABMD, ABT, ACN,..."


In [19]:
past = last_row['tickers'].iloc[0]
print('*'*40, f'S&P 500 on {snap_shot}', '*'*40)
print(past)

**************************************** S&P 500 on 2020-10-23 ****************************************
['A', 'AAL', 'AAP', 'AAPL', 'ABBV', 'ABC', 'ABMD', 'ABT', 'ACN', 'ADBE', 'ADI', 'ADM', 'ADP', 'ADSK', 'AEE', 'AEP', 'AES', 'AFL', 'AIG', 'AIV', 'AIZ', 'AJG', 'AKAM', 'ALB', 'ALGN', 'ALK', 'ALL', 'ALLE', 'ALXN', 'AMAT', 'AMCR', 'AMD', 'AME', 'AMGN', 'AMP', 'AMT', 'AMZN', 'ANET', 'ANSS', 'ANTM', 'AON', 'AOS', 'APA', 'APD', 'APH', 'APTV', 'ARE', 'ATO', 'ATVI', 'AVB', 'AVGO', 'AVY', 'AWK', 'AXP', 'AZO', 'BA', 'BAC', 'BAX', 'BBY', 'BDX', 'BEN', 'BF.B', 'BIIB', 'BIO', 'BK', 'BKNG', 'BKR', 'BLK', 'BLL', 'BMY', 'BR', 'BRK.B', 'BSX', 'BWA', 'BXP', 'C', 'CAG', 'CAH', 'CARR', 'CAT', 'CB', 'CBOE', 'CBRE', 'CCI', 'CCL', 'CDNS', 'CDW', 'CE', 'CERN', 'CF', 'CFG', 'CHD', 'CHRW', 'CHTR', 'CI', 'CINF', 'CL', 'CLX', 'CMA', 'CMCSA', 'CME', 'CMG', 'CMI', 'CMS', 'CNC', 'CNP', 'COF', 'COG', 'COO', 'COP', 'COST', 'CPB', 'CPRT', 'CRM', 'CSCO', 'CSX', 'CTAS', 'CTLT', 'CTSH', 'CTVA', 'CTXS', 'CVS', 'CVX', 'CXO

In [20]:
# Get current S&P500 list.
filename = 'sp500.csv'
current = pd.read_csv(filename)
current = sorted(list(current['Symbol']))
#print(current)

In [21]:
# Show what's been added and removed since snap_shot date.

added = list(set(current) - set(past))
print('*'*40, f'ADDED since {snap_shot}', '*'*40)
print(added)
print()

removed = list(set(past) - set(current))
print('*'*40, f'REMOVED since {snap_shot}', '*'*40)
print(removed)

**************************************** ADDED since 2020-10-23 ****************************************
['MOH', 'CSGP', 'SW', 'CZR', 'PCG', 'PODD', 'WDAY', 'DOC', 'EQT', 'EG', 'PANW', 'APO', 'UBER', 'FI', 'DELL', 'WBD', 'VTRS', 'KDP', 'ERIE', 'LII', 'TSLA', 'GDDY', 'CPAY', 'KKR', 'ABNB', 'VLTO', 'ON', 'ELV', 'VICI', 'BRO', 'ACGL', 'CPT', 'WTW', 'TRMB', 'NDSN', 'BX', 'CTRA', 'LULU', 'BALL', 'INVH', 'AXON', 'BLDR', 'TPL', 'FSLR', 'DECK', 'GEN', 'MPWR', 'CRL', 'META', 'STLD', 'SOLV', 'PARA', 'SMCI', 'PTC', 'GNRC', 'EPAM', 'CEG', 'KVUE', 'ENPH', 'CRWD', 'COR', 'BG', 'RVTY', 'GEHC', 'FDS', 'TECH', 'MTCH', 'PLTR', 'MRNA', 'HUBB', 'FICO', 'DAY', 'JBL', 'TRGP', 'NXPI', 'VST', 'GEV']

**************************************** REMOVED since 2020-10-23 ****************************************
['WLTW', 'IPGP', 'WRK', 'TIF', 'FB', 'DRE', 'LUMN', 'UAA', 'FLT', 'WU', 'FLS', 'PVH', 'BIO', 'RE', 'AIV', 'PBCT', 'QRVO', 'KSU', 'XRX', 'INFO', 'CERN', 'FISV', 'XLNX', 'VFC', 'VIAC', 'COG', 'FBHS', 'MXIM', '