In [1]:
# rSLDS actual data 

In [2]:
import sys

# Environment flags read by the setup cells below.
# IN_COLAB is detected rather than hard-coded: the Colab kernel has the
# google.colab package loaded, a local Jupyter kernel does not. A hard-coded
# True makes every "RUN IN COLAB ONLY" cell fail on a local run and selects the
# Colab path table. Override by hand here if the detection is ever wrong.
IN_COLAB = "google.colab" in sys.modules
# Set to True to force an unmount / re-authentication / remount of Google Drive.
REMOUNT = False

In [3]:
# RUN IN COLAB ONLY: mount Google drive
# Mount Google Drive at /content/drive; skipped entirely when IN_COLAB is falsy.
if IN_COLAB:
    # Imported lazily because google.colab only exists inside a Colab runtime.
    from google.colab import drive
    drive.mount('/content/drive')

In [4]:
# RUN IN COLAB ONLY: unmount, remount Google drive - if required
if REMOUNT:
    !fusermount -u /content/drive 2>/dev/null || true
    !rm -rf /content/drive
    from google.colab import auth
    auth.authenticate_user()
    from google.colab import drive
    drive.mount('/content/drive', force_remount=True)

In [5]:
# RUN IN COLAB ONLY: install required modules: ssm, openpyxl
if IN_COLAB:
    !pip -q install git+https://github.com/lindermanlab/ssm.git #egg=ssm
    !pip -q install openpyxl
    !pip -q install filelock pyarrow

In [6]:
# RUN IN COLAB ONLY: force-fetch latest files from GitHub (overwrite local copies)
if IN_COLAB:
    !rm -rf /content/SLDS
    !git clone --depth=1 https://github.com/chrismader1/SLDS.git /content/SLDS
    import sys
    sys.path.append("/content/SLDS")

In [7]:
# RUN IN COLAB ONLY: prevent timeouts
if IN_COLAB:
    from IPython.display import Javascript, display
    # Inject a browser-side script that, once per 60 * 1000 ms, looks for the
    # connect button (first inside the <colab-connect-button> shadow root, then
    # via the plain '#connect' selectors) and clicks it, logging each attempt
    # to the browser console.
    # NOTE(review): the script only calls setInterval and never clearInterval,
    # so every execution of this cell arms an additional timer.
    # NOTE(review): whether the selectors match depends on the current Colab
    # front-end markup — confirm in the browser console ("keepAlive: ..." logs).
    display(Javascript("""
    (function keepAlive(){
      function clickConnect(){
        // Try shadow-root button (newer Colab)
        const el = document.querySelector('colab-connect-button');
        if (el && el.shadowRoot){
          const btn = el.shadowRoot.querySelector('#connect');
          if (btn){ btn.click(); console.log('keepAlive: clicked shadow connect'); return; }
        }
        // Fallbacks
        const btn2 = document.querySelector('#connect, button#connect');
        if (btn2){ btn2.click(); console.log('keepAlive: clicked #connect'); return; }
        console.log('keepAlive: connect button not found');
      }
      setInterval(clickConnect, 60 * 1000);
      console.log('keepAlive: armed');
    })();
    """))

In [8]:
# RUN IN COLAB ONLY: clear cache
if IN_COLAB:
    !rm -f "/content/drive/MyDrive/Colab Notebooks/SLDS/Data/gridsearch_results.csv"
    !rm -f "/content/drive/MyDrive/Colab Notebooks/SLDS/Data/gridsearch_segments.csv"
    !echo "Reset done."

In [9]:
import numpy as np
import pandas as pd
from gridsearch import pipeline_actual

In [None]:
# paths

import os


def _build_paths(root, tmp_dir):
    """Return the path table for a project rooted at ``root``.

    Both environments share one layout (``Data/`` for inputs, ``Out/`` for
    results), so the table is generated once instead of being kept in two
    hand-maintained copies.

    Args:
        root: project directory without a trailing slash.
        tmp_dir: scratch directory, with a trailing slash.

    Returns:
        A new dict with the keys ``data_excel``, ``ff_dir``, ``ff_files``,
        ``results_csv``, ``segments_parquet``, ``tmp_dir`` and
        ``segments_tmp_csv``. Directory values keep their trailing slash.
    """
    return {
        "data_excel": f"{root}/Data/bbg_data.xlsx",
        "ff_dir": f"{root}/Data/",
        # File names of the factor CSVs, looked up relative to ff_dir.
        "ff_files": {
            "ff5": "F-F_Research_Data_5_Factors_2x3_daily.csv",
            "ff3": "F-F_Research_Data_Factors_daily.csv",
            "mom": "F-F_Momentum_Factor_daily.csv",
        },
        "results_csv": f"{root}/Out/gridsearch_results.csv",
        "segments_parquet": f"{root}/Out/gridsearch_segments.parquet",
        "tmp_dir": tmp_dir,
        "segments_tmp_csv": f"{tmp_dir}segments_tmp.csv",
    }


# Colab: inputs and results on Google Drive, scratch files on the Colab-local disk.
COLAB_PATHS = _build_paths(
    "/content/drive/MyDrive/Colab Notebooks/SLDS",
    "/content/tmp_slds/",
)

# Local: everything under one project directory. The default is unchanged;
# set the SLDS_LOCAL_ROOT environment variable to run from another checkout.
_LOCAL_ROOT = os.environ.get("SLDS_LOCAL_ROOT", "/Users/chrismader/Python/SLDS").rstrip("/")
LOCAL_PATHS = _build_paths(_LOCAL_ROOT, f"{_LOCAL_ROOT}/tmp_slds/")

In [10]:
# --------------------------------------------------------------------------------------
# CONFIG
# --------------------------------------------------------------------------------------

# Single configuration dict handed to pipeline_actual(). Candidate settings are
# kept as commented-out entries; uncomment a line to add it to the search.
# NOTE(review): the recorded run reports "combo_total= 3" per model family with
# one batch window, one dim_latent and three K values — presumably the grid is
# the product of batch_grid x K_grid x dim_latent; confirm in gridsearch.
CONFIG = {
    
    # Core defaults
    "n_jobs": -1,  # multi-threading
    "dt": 1.0 / 252.0,  # presumably one trading day expressed in years — TODO confirm
    # NOTE(review): recorded output shows 10-step ELBO bars for the unrestricted
    # fits but 1-step bars for the restricted fits — confirm how n_iters is applied.
    "n_iters": 10,
    "h_z": 3.0,  # CUSUM parameter
    
    # Batch windows
    # Each entry is passed along as {'train_window': ..., 'overlap_window': ...}
    # (visible in the run log); units are presumably observations/days — TODO confirm.
    "batch_grid": [
        {"train_window": 756, "overlap_window": 5},
        # {"train_window": 256, "overlap_window": 63},
        # {"train_window": 504, "overlap_window": 63},
        # {"train_window": 756, "overlap_window": 63},
        # {"train_window": 1260, "overlap_window": 63},
    ],

    # Number of regimes
    # Appears as 'n_regimes' in the per-combination log lines.
    "K_grid": [2, 3, 4],
    
    # Unrestricted models: 
    # "channels" names the observed series, "dim_latent" lists the latent
    # dimensions to try for that channel set.
    "unrestricted_models": [
        {"label": "[y]",         "channels": ["y"],                "dim_latent": [1]},
        # {"label": "[y,h]",       "channels": ["y","h"],            "dim_latent": [2]},
        # {"label": "[g,v]",       "channels": ["g","v"],            "dim_latent": [2]},
        # {"label": "[g,v,h]",     "channels": ["g","v","h"],        "dim_latent": [2,3]},
        # {"label": "[y,g,v,h]",   "channels": ["y","g","v","h"],    "dim_latent": [3,4]},
    ],

    # Restricted models: 
    # Same fields as above plus "C_type", which selects the restriction scheme;
    # the run log shows the resulting fixed 'C' / 'd' / 'b_pattern' values.
    "restricted_models": [
        # {"label": "fund1",        "channels": ["y"],                 "dim_latent": [2],    "C_type": "fund1"},
        # {"label": "fund1_vix",    "channels": ["y","h"],             "dim_latent": [3],    "C_type": "fund1_vix"},
        # {"label": "fund2",        "channels": ["y","g"],             "dim_latent": [2],    "C_type": "fund2"},
        # {"label": "fund2_vix",    "channels": ["y","g","h"],         "dim_latent": [3],    "C_type": "fund2_vix"},
        # {"label": "fund3",        "channels": ["y","v","g"],         "dim_latent": [2],    "C_type": "fund3"},
        # {"label": "fund3_vix",    "channels": ["y","v","g","h"],     "dim_latent": [3],    "C_type": "fund3_vix"},   

        # {"label": "factor1",      "channels": ["y"],                 "dim_latent": [2],    "C_type": "factor1"},
        # {"label": "factor1_vix",  "channels": ["y","h"],             "dim_latent": [3],    "C_type": "factor1_vix"},

        {"label": "factor2_ff3",   "channels": ["y","mkt","smb","hml"],                   "dim_latent": [3], "C_type": "factor2"},
        # {"label": "factor2_ff3mom","channels": ["y","mkt","smb","hml","mom"],             "dim_latent": [4], "C_type": "factor2"},
        # {"label": "factor2_ff5",   "channels": ["y","mkt","smb","hml","rmw","cma"],       "dim_latent": [5], "C_type": "factor2"},
        # {"label": "factor2_ff5mom","channels": ["y","mkt","smb","hml","rmw","cma","mom"], "dim_latent": [6], "C_type": "factor2"},
    ],

    # Model selection
    # Switches for the two model families listed above.
    "run_unrestricted": True,
    "run_restricted": True,

    # Output
    "verbose": True,
    "display": False,
}

# Merge the path table for the active environment into CONFIG, so path keys such
# as "results_csv" and "data_excel" sit alongside the model settings.
# COLAB_PATHS / LOCAL_PATHS and IN_COLAB must already be defined when this runs.
CONFIG.update(COLAB_PATHS if IN_COLAB else LOCAL_PATHS)

In [11]:
# --------------------------------------------------------------------------------------
# Execute
# --------------------------------------------------------------------------------------

def main():
    """Run the grid-search pipeline for every ticker not yet in the results CSV.

    Reads ``CONFIG["results_csv"]``. When that file exists and is non-empty,
    every ticker of the master list that already appears in its ``security``
    column is skipped; the remaining tickers are passed to ``pipeline_actual``
    together with ``CONFIG``. Progress is reported via ``print``.

    Returns:
        None.

    Raises:
        AssertionError: if the results CSV exists but has no ``security`` column.
    """
    import os
    import pandas as pd

    # IO from CONFIG
    csv_path = CONFIG["results_csv"]

    # Full universe — swap with the short list below to run everything.
    # securities_master = [
    #     "MSFT","NVDA","AAPL","AVGO","GOOGL","ORCL","IBM","CSCO","CRM","AMD","INTU","NOW","TXN","QCOM",
    #     "ADBE","AMAT","PLTR","ACN","META","NFLX","GOOGL","DIS","VZ","T","UBER","AMZN","TSLA","HD",
    #     "MCD","BKNG","COST","WMT","PG","KO","PM","PEP","BRK/B","JPM","V","MA","BAC","WFC","GS","MS","SPGI",
    #     "SCHW","AXP","BLK","C","PGR","LLY","JNJ","ABBV","UNH","ABT","MRK","ISRG","BSX","TMO","AMGN","RTX",
    #     "XOM","CVX","GE","CAT","BA","HON","LIN","NEE","DUK","SO","AEP","D","AMT","PLD","EQIX","O","CBRE",]

    securities_master = ["MSFT","NVDA","AAPL","AVGO","GOOGL","ORCL","IBM","CSCO"]

    # Drop repeated tickers (order preserved) so no security is fitted twice;
    # the full universe above lists "GOOGL" two times.
    securities_master = list(dict.fromkeys(securities_master))

    # resume if CSV exists; otherwise start from beginning
    has_results = os.path.exists(csv_path) and os.path.getsize(csv_path) > 0
    if has_results:
        results = pd.read_csv(csv_path)
        # Explicit raise instead of `assert`, so the check survives `python -O`.
        if "security" not in results.columns:
            raise AssertionError("results_csv missing 'security' column")
        done_set = set(results["security"].dropna().astype(str))
        # NOTE(review): a ticker counts as done as soon as it has any row in the
        # CSV. If the pipeline writes rows before a ticker is fully processed,
        # an interrupted ticker would be skipped on resume — confirm in gridsearch.
        done = [s for s in securities_master if s in done_set]
        securities = [s for s in securities_master if s not in done_set]
        print("Resuming from CSV:", csv_path)
        print("Already completed:", done)
    else:
        # Copy, so the pipeline never receives an alias of the master list.
        securities = list(securities_master)
        print("Resuming from: START (no/empty CSV)")

    print("Remaining tickers:", len(securities), securities)

    if len(securities) == 0:
        print("Nothing to do.")
        return

    _ = pipeline_actual(securities=securities, CONFIG=CONFIG)

if __name__ == "__main__":
    main()


Resuming from CSV: /Users/chrismader/Python/SLDS/Out/gridsearch_results.csv
Already completed: {'MSFT', 'NVDA'}
Remaining tickers: 6 ['AAPL', 'AVGO', 'GOOGL', 'ORCL', 'IBM', 'CSCO']


AAPL
combo_total= 3


------------------------------------------------------------------------
(1/3) unrestricted | Params: {'n_regimes': 2, 'dim_latent': 1, 'single_subspace': True};{'train_window': 756, 'overlap_window': 5}
------------------------------------------------------------------------


------------------------------------------------------------------------
(3/3) unrestricted | Params: {'n_regimes': 4, 'dim_latent': 1, 'single_subspace': True};{'train_window': 756, 'overlap_window': 5}
------------------------------------------------------------------------


------------------------------------------------------------------------
(2/3) unrestricted | Params: {'n_regimes': 3, 'dim_latent': 1, 'single_subspace': True};{'train_window': 756, 'overlap_window': 5}
--------------------------------

ELBO: 1631.1: 100%|██████████| 10/10 [00:00<00:00, 43.65it/s]
ELBO: 1674.4: 100%|██████████| 10/10 [00:00<00:00, 38.39it/s]
ELBO: 1609.0: 100%|██████████| 10/10 [00:00<00:00, 35.60it/s]
ELBO: 1702.8: 100%|██████████| 10/10 [00:00<00:00, 44.76it/s]
ELBO: 1726.3: 100%|██████████| 10/10 [00:00<00:00, 42.42it/s]
ELBO: 1717.7: 100%|██████████| 10/10 [00:00<00:00, 42.21it/s]
ELBO: 1612.4: 100%|██████████| 10/10 [00:00<00:00, 48.00it/s]
ELBO: 1610.3: 100%|██████████| 10/10 [00:00<00:00, 43.20it/s]
ELBO: 1614.8: 100%|██████████| 10/10 [00:00<00:00, 44.04it/s]
ELBO: 1643.3: 100%|██████████| 10/10 [00:00<00:00, 48.93it/s]
ELBO: 1647.0: 100%|██████████| 10/10 [00:00<00:00, 44.39it/s]
ELBO: 1636.8: 100%|██████████| 10/10 [00:00<00:00, 42.23it/s]
ELBO: 1084.7: 100%|██████████| 10/10 [00:00<00:00, 66.43it/s]
ELBO: 1070.5: 100%|██████████| 10/10 [00:00<00:00, 57.53it/s]
ELBO: 1040.7: 100%|██████████| 10/10 [00:00<00:00, 58.10it/s]



fits succeeded: 15

LEADERBOARD:
 rank    score  n_regimes  dim_latent  single_subspace
    1 -0.00599          4           1             True
    2 -0.02881          2           1             True
    3 -0.02881          3           1             True
combo_total= 3


------------------------------------------------------------------------
(2/3) factor2_ff3 | Params: {'n_regimes': 3, 'dim_latent': 3, 'single_subspace': True, 'restrictions': {'C': array([[ 0.01155257, -0.00295532, -0.00344376],
       [ 1.        ,  0.        ,  0.        ],
       [ 0.        ,  1.        ,  0.        ],
       [ 0.        ,  0.        ,  1.        ]]), 'd': array([0.00016178, 0.        , 0.        , 0.        ]), 'b_pattern': ['mu_form', 'mu_form', 'mu_form']}, 'model_name': 'factor2_ff3'};{'train_window': 756, 'overlap_window': 5}
------------------------------------------------------------------------


ELBO: -8081.1: 100%|██████████| 1/1 [00:00<00:00, 21.40it/s]
ELBO: -7912.0: 100%|██████████| 1/1 [00:00<00:00, 14.54it/s]
ELBO: -7785.0: 100%|██████████| 1/1 [00:00<00:00, 29.80it/s]
ELBO: -7779.4: 100%|██████████| 1/1 [00:00<00:00, 25.64it/s]
ELBO: -7736.8: 100%|██████████| 1/1 [00:00<00:00, 32.46it/s]
ELBO: -7710.8: 100%|██████████| 1/1 [00:00<00:00, 29.30it/s]
ELBO: -7684.8: 100%|██████████| 1/1 [00:00<00:00, 32.19it/s]
ELBO: -7710.7: 100%|██████████| 1/1 [00:00<00:00, 33.18it/s]
ELBO: -7669.8: 100%|██████████| 1/1 [00:00<00:00, 31.50it/s]
ELBO: -7666.5: 100%|██████████| 1/1 [00:00<00:00, 31.67it/s]
ELBO: -7631.0: 100%|██████████| 1/1 [00:00<00:00, 33.53it/s]
ELBO: -7655.9: 100%|██████████| 1/1 [00:00<00:00, 32.33it/s]
ELBO: -7622.8: 100%|██████████| 1/1 [00:00<00:00, 34.02it/s]
ELBO: -7648.3: 100%|██████████| 1/1 [00:00<00:00, 31.36it/s]
ELBO: -7635.8: 100%|██████████| 1/1 [00:00<00:00, 32.07it/s]
ELBO: -7641.6: 100%|██████████| 1/1 [00:00<00:00, 33.72it/s]
ELBO: -7641.3: 100%|████



------------------------------------------------------------------------
(1/3) factor2_ff3 | Params: {'n_regimes': 2, 'dim_latent': 3, 'single_subspace': True, 'restrictions': {'C': array([[ 0.01155257, -0.00295532, -0.00344376],
       [ 1.        ,  0.        ,  0.        ],
       [ 0.        ,  1.        ,  0.        ],
       [ 0.        ,  0.        ,  1.        ]]), 'd': array([0.00016178, 0.        , 0.        , 0.        ]), 'b_pattern': ['mu_form', 'mu_form', 'mu_form']}, 'model_name': 'factor2_ff3'};{'train_window': 756, 'overlap_window': 5}
------------------------------------------------------------------------


------------------------------------------------------------------------
(3/3) factor2_ff3 | Params: {'n_regimes': 4, 'dim_latent': 3, 'single_subspace': True, 'restrictions': {'C': array([[ 0.01155257, -0.00295532, -0.00344376],
       [ 1.        ,  0.        ,  0.        ],
       [ 0.        ,  1.        ,  0.        ],
       [ 0.        ,  0.        ,  1. 

ELBO: -7767.0: 100%|██████████| 1/1 [00:00<00:00, 37.32it/s]
ELBO: -7754.1: 100%|██████████| 1/1 [00:00<00:00, 30.59it/s]
ELBO: -7447.1: 100%|██████████| 1/1 [00:00<00:00, 32.68it/s]
ELBO: -7766.8: 100%|██████████| 1/1 [00:00<00:00, 34.59it/s]
ELBO: -7817.3: 100%|██████████| 1/1 [00:00<00:00, 30.06it/s]
ELBO: -7469.5: 100%|██████████| 1/1 [00:00<00:00, 35.05it/s]
ELBO: -7764.5: 100%|██████████| 1/1 [00:00<00:00, 40.28it/s]
ELBO: -7726.3: 100%|██████████| 1/1 [00:00<00:00, 30.78it/s]
ELBO: -7424.4: 100%|██████████| 1/1 [00:00<00:00, 32.24it/s]
ELBO: -7680.7: 100%|██████████| 1/1 [00:00<00:00, 34.18it/s]
ELBO: -7701.3: 100%|██████████| 1/1 [00:00<00:00, 30.48it/s]
ELBO: -7484.3: 100%|██████████| 1/1 [00:00<00:00, 35.21it/s]
ELBO: -7670.8: 100%|██████████| 1/1 [00:00<00:00, 40.51it/s]
ELBO: -7719.0: 100%|██████████| 1/1 [00:00<00:00, 38.32it/s]
ELBO: -7366.8: 100%|██████████| 1/1 [00:00<00:00, 36.98it/s]
ELBO: -7690.1: 100%|██████████| 1/1 [00:00<00:00, 34.45it/s]
ELBO: -7677.6: 100%|████

KeyboardInterrupt: 