<a href="https://colab.research.google.com/github/yorkjong/vistock/blob/feature%2Fibd/notebooks/ibd_rs_rating.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

### Stock Analysis and Ranking with IBD RS Rating, inspired by the Investor's Business Daily (IBD) methodology.

### Install and Setup

#### Install Packages

In [1]:
%pip install "git+https://github.com/yorkjong/vistock.git@feature/ibd"
%pip install requests-cache

Collecting git+https://github.com/yorkjong/vistock.git@feature/ibd
  Cloning https://github.com/yorkjong/vistock.git (to revision feature/ibd) to /tmp/pip-req-build-wbxxl65d
  Running command git clone --filter=blob:none --quiet https://github.com/yorkjong/vistock.git /tmp/pip-req-build-wbxxl65d
  Running command git checkout -b feature/ibd --track origin/feature/ibd
  Switched to a new branch 'feature/ibd'
  Branch 'feature/ibd' set up to track remote branch 'feature/ibd' from 'origin'.
  Resolved https://github.com/yorkjong/vistock.git to commit 396e54c463cebba93b85e7870f86b0d3a83b4f11
  Preparing metadata (setup.py) ... [?25l[?25hdone
Collecting mplfinance (from vistock==0.5.0)
  Downloading mplfinance-0.12.10b0-py3-none-any.whl.metadata (19 kB)
Downloading mplfinance-0.12.10b0-py3-none-any.whl (75 kB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m75.0/75.0 kB[0m [31m2.1 MB/s[0m eta [36m0:00:00[0m
[?25hBuilding wheels for collected packages: vistock
  Buildin

#### Setup and Configuration

In [2]:
# @title Enable DataFrame Formatter
from google.colab import data_table
data_table.enable_dataframe_formatter()

In [3]:
# @title Enable Requests Cache
import requests_cache
requests_cache.install_cache('ibd_cache', expire_after=3600)

In [4]:
# @title Initialize Widgets
import ipywidgets as widgets
output = widgets.Output()

In [5]:
# @title GitHub
import base64
import requests
import pandas as pd
from io import StringIO


class GitHub:
    def __init__(self, repo_owner, repo_name, token, dir='', branch='main'):
        base = 'https://api.github.com/repos'
        dir = dir.strip('/')
        if dir:
            self.base_url = f'{base}/{repo_owner}/{repo_name}/contents/{dir}'
        else:
            self.base_url = f'{base}/{repo_owner}/{repo_name}/contents'
        self.branch = branch
        self.token = token

    def _request(self, method, url, headers=None, params=None, json=None):
        response = requests.request(method, url, headers=headers,
                                    params=params, json=json)
        if response.status_code in [200, 201]:
            return response.json()
        else:
            print(f"Request failed: {response.status_code} - {response.json()}")
            return None

    def file_exists(self, file_path):
        url = f'{self.base_url}/{file_path}'
        headers = {
            'Authorization': f'token {self.token}',
            'Accept': 'application/vnd.github.v3+json',
        }
        response = requests.get(url, headers=headers,
                                params={'ref': self.branch})
        if response.status_code == 200:
            return True
        elif response.status_code == 404:
            return False
        else:
            print(f"Request failed: {response.status_code} - {response.json()}")
            return None

    def list_filenames(self, dir_path=''):
        url = f'{self.base_url}/{dir_path}'
        headers = {
            'Authorization': f'token {self.token}',
            'Accept': 'application/vnd.github.v3+json',
        }
        response = requests.get(url, headers=headers,
                                params={'ref': self.branch})
        if response.status_code == 200:
            files = response.json()
            return [item['name'] for item in files]
        else:
            print(f"Request failed: {response.status_code} - {response.json()}")
            return []

    def download_file(self, file_path):
        if not self.file_exists(file_path):
            print(f"File '{file_path}' does not exist. Cannot download.")
            return None

        url = f'{self.base_url}/{file_path}'
        headers = {
            'Authorization': f'token {self.token}',
            'Accept': 'application/vnd.github.v3+json',
        }

        file_info = self._request('GET', url, headers=headers)
        if file_info:
            download_url = file_info['download_url']
            response = requests.get(download_url)
            if response.status_code == 200:
                return StringIO(response.text)
            else:
                print(f"Failed to download file: "
                      f"{response.status_code} - {response.text}")
                return None
        return None

    def download_csv(self, file_path):
        file_content = self.download_file(file_path)
        if file_content:
            return pd.read_csv(file_content)
        else:
            return pd.DataFrame()

    def upload_file(self, file_path, content):
        url = f'{self.base_url}/{file_path}'
        headers = {
            'Authorization': f'token {self.token}',
            'Accept': 'application/vnd.github.v3+json'
        }

        encoded_content = base64.b64encode(content.encode()).decode()
        payload = {
            'message': 'Uploading file',
            'content': encoded_content,
            'branch': self.branch
        }
        self._request('PUT', url, headers=headers, json=payload)

    def upload_df_as_csv(self, file_path, df):
        """Upload a DataFrame to a CSV file."""
        if not file_path.endswith('.csv'):
            file_path += '.csv'
        csv_content = df.to_csv(index=False)
        self.upload_file(file_path, csv_content)

    def remove_file(self, file_path):
        if not self.file_exists(file_path):
            print(f"File '{file_path}' does not exist. Skipping deletion.")
            return

        url = f'{self.base_url}/{file_path}'
        headers = {
            'Authorization': f'token {self.token}',
            'Accept': 'application/vnd.github.v3+json'
        }

        # Fetch the file info to get the SHA needed for deletion
        file_info = self._request('GET', url, headers=headers)
        if file_info:
            sha = file_info['sha']
            payload = {
                'message': 'Deleting file',
                'sha': sha,
                'branch': self.branch
            }
            self._request('DELETE', url, headers=headers, json=payload)

#-------------------------------------------------------------------------------

from google.colab import userdata

github = GitHub(
    repo_owner='YorkJong',
    repo_name='stock-reports',
    token=userdata.get('GithubToken.stock-reports'),
    dir='ibd',
)

In [6]:
# @title Update and Filter DataFrame

def update_tickers_with_names(df, ticker_column, name_separator=','):
    """
    Update ticker codes in a DataFrame with their corresponding stock names.

    Parameters:
    - df: The DataFrame containing ticker codes.
    - ticker_column: The name of the column containing ticker codes.
    - name_separator: Separator used to join names (default is comma for multiple tickers).

    This function updates the specified column with the stock names instead of ticker codes.
    """
    # Iterate over the specified column in the DataFrame
    for index, row in df.iterrows():
        tickers = row[ticker_column].split(name_separator)  # Split the tickers string into a list
        stock_names = [tw.stock_name(ticker) for ticker in tickers]  # Get stock names for each ticker
        # Update the stock names back to the DataFrame
        df.at[index, ticker_column] = name_separator.join(stock_names)  # Join the names back into a string


def remove_ticker_suffix(df, ticker_column):
    """
    Remove the '.TW' or '.TWO' suffix from ticker codes in a DataFrame.

    Parameters:
    - df: The DataFrame containing ticker codes.
    - ticker_column: The name of the column containing ticker codes.
    """
    # Apply string replacement for each ticker in the specified column
    df[ticker_column] = df[ticker_column].str.replace('.TWO', '', regex=False)
    df[ticker_column] = df[ticker_column].str.replace('.TW', '', regex=False)


def filter_increasing_relative_strength(df):
    """
    Filter stocks with increasing Relative Strength over different time periods.

    This function filters the DataFrame to include only those stocks where:
    - Relative Strength is above 100.
    - Relative Strength has increased over the past 1 month, 3 months, and 6 months.
    Optionally, you can add a condition to check if Percentile is above 90.
    """
    return df[
        (df["Relative Strength"] > 100)
        & (df["Relative Strength"] > df["1 Month Ago"])
        & (df["1 Month Ago"] > df["3 Months Ago"])
        & (df["3 Months Ago"] > df["6 Months Ago"])
        # & (df["Percentile"] > 90)  # Uncomment to include Percentile filter
    ]


In [7]:
# @title Rank Function

import os
from datetime import datetime

from vistock import ibd
from vistock import tw
from vistock.stock_indices import get_tickers

def rank(code, period='2y', tickers_getter=get_tickers,
         ticker_ref='^GSPC', out_dir='out'):
    tickers = tickers_getter(code)

    output.clear_output()
    with output:
        rank_stock, rank_indust = ibd.rankings(tickers, period=period,
                                               ticker_ref=ticker_ref)
    if rank_stock.empty or rank_indust.empty:
        print("Not enough data to generate rankings.")
        return

    # Update the stock names back to the DataFrame
    #update_tickers_with_names(rank_stock, 'Ticker')
    #update_tickers_with_names(rank_indust, 'Tickers')

    # Remove the '.TW' or '.TWO' suffix
    remove_ticker_suffix(rank_stock, 'Ticker')
    remove_ticker_suffix(rank_indust, 'Tickers')

    # Save to CSV
    print("\n\n***")
    os.makedirs(out_dir, exist_ok=True)
    today = datetime.now().strftime('%Y%m%d')
    for df, kind in zip([rank_stock, rank_indust],
                           ['stocks', 'industries']):
        filename = f'{code}_{kind}_{period}_{today}.csv'
        github.upload_df_as_csv(filename, df)
        df.to_csv(os.path.join(out_dir, filename), index=False)
        print(f'Your "{filename}" is in the "{out_dir}" folder.')
    print("***\n")

    return rank_stock, rank_indust

### Glossary of Terms

source (The source of stocks to analyze):
- This could include stocks traded on exchanges or components of a specific index.
- Common abbreviation(s) for the exchange or market sector.  
  - For Taiwan Markets, possible values include:
    - `TWSE`: Taiwan Stock Exchange (台灣上市股票交易所）
    - `TPEX`: Taipei Exchange （上櫃交易所）
    - `ESB`: Emerging Stock Board （興櫃交易所）
  - Can also be combined with '+' (e.g., `TWSE+TPEX`, `TWSE+TPEX+ESB`)
  - For America Markets, possible values include:
    - `SPX`: S&P 500 (標普五百指數)
    - `DJIA`: Dow Jones Industrial Average (道瓊指數)
    - `NDX`: NASDAQ-100 (納斯達克一百指數)
    - `SOX`: PHLX Semiconductor Index （費半指數）
  - Multiple indices can be combined using '+' (e.g., `SPX+DJIA+NDX+SOX`)

period (Historical Data Time Range)：
- The time range for which to fetch historical data.
- `2y` means 2 years
- `6mo` means 6 monthes

RS (Relative Strength)
- Relative Strength (RS) is a metric used to evaluate the performance of a stock relative to a benchmark index.
  - A higher RS rating indicates that the stock has outperformed the index, while a lower RS rating suggests underperformance.
- The IBD RS calculates the performance of the last year, with the most recent quarter weighted double.

min_percentile (最小百分位)
- The minimum percentile for a stock to be included in the rankings.

### Error Messages

In [None]:
display(output)

Output()

### RS Rating and Ranking

In [8]:
source = "All Indices" #@param ["S&P 500", "Dow Jones Industrial Average", "NASDAQ 100", "PHLX Semiconductor", "All Indices"]
period = "2y" # @param ["6mo","1y","ytd","2y"]

code_from_name = {
    'S&P 500': 'SPX',
    'Dow Jones Industrial Average': 'DJIA',
    'NASDAQ 100': 'NDX',
    'PHLX Semiconductor': 'SOX',
    'All Indices': 'SPX+DJIA+NDX+SOX',
}

rank_stock, rank_indust = rank(code_from_name[source], period)
for df in (rank_stock, rank_indust):
    display(data_table.DataTable(df, include_index=False, num_rows_per_page=10))



***
Request failed: 422 - {'message': 'Invalid request.\n\n"sha" wasn\'t supplied.', 'documentation_url': 'https://docs.github.com/rest/repos/contents#create-or-update-file-contents', 'status': '422'}
Your "SPX+DJIA+NDX+SOX_stocks_2y_20240824.csv" is in the "out" folder.
Request failed: 422 - {'message': 'Invalid request.\n\n"sha" wasn\'t supplied.', 'documentation_url': 'https://docs.github.com/rest/repos/contents#create-or-update-file-contents', 'status': '422'}
Your "SPX+DJIA+NDX+SOX_industries_2y_20240824.csv" is in the "out" folder.
***



Unnamed: 0,Ticker,Sector,Industry,Relative Strength,1 Month Ago,3 Months Ago,6 Months Ago,Percentile,1 Month Ago.1,3 Months Ago.1,6 Months Ago.1,Rank
435,NVDA,Technology,Semiconductors,164.49,183.79,181.03,190.04,99,99,99,99,1
147,VST,Utilities,Utilities - Independent Power Producers,155.58,166.81,246.18,147.77,99,99,99,99,2
380,COHR,Technology,Scientific & Technical Instruments,146.00,140.59,124.96,138.20,99,99,94,97,3
242,IRM,Real Estate,REIT - Specialty,142.10,129.65,109.91,112.32,99,97,83,85,4
308,NRG,Utilities,Utilities - Independent Power Producers,137.09,130.04,170.19,116.86,99,97,99,90,5
...,...,...,...,...,...,...,...,...,...,...,...,...
17,MDB,Technology,Software - Infrastructure,55.94,58.98,82.77,122.43,0,0,15,94,517
328,DXCM,Healthcare,Medical Devices,55.68,80.43,98.47,89.85,0,14,57,35,518
314,INTC,Technology,Semiconductors,51.21,76.90,70.78,109.15,0,8,2,80,519
465,WBA,Healthcare,Pharmaceutical Retailers,45.93,44.76,58.60,70.94,0,0,0,3,520


Unnamed: 0,Industry,Sector,Relative Strength,1 Month Ago,3 Months Ago,6 Months Ago,Tickers,Percentile,1 Month Ago.1,3 Months Ago.1,6 Months Ago.1,Rank
68,Utilities - Independent Power Producers,Utilities,146.34,148.43,208.18,132.32,"VST,NRG",98,98,99,97,1
57,Medical Care Facilities,Healthcare,121.10,106.49,105.23,106.25,"UHS,HCA,DVA",97,91,81,81,2
89,Residential Construction,Consumer Cyclical,119.52,112.04,105.04,115.88,"DHI,PHM,NVR,LEN",96,96,80,95,3
47,Banks - Regional,Financial Services,114.08,109.99,105.91,96.57,"CFG,FITB,KEY,TFC,PNC,RF,MTB,HBAN,USB",95,95,84,50,4
84,REIT - Healthcare Facilities,Real Estate,114.06,100.87,96.60,80.45,"VTR,DOC",94,77,55,5,5
...,...,...,...,...,...,...,...,...,...,...,...,...
40,Oil & Gas Equipment & Services,Energy,83.48,82.45,87.49,81.62,"BKR,SLB,HAL",4,9,9,7,91
67,Auto Parts,Consumer Cyclical,81.79,76.04,83.34,77.79,"GPC,BWA,LKQ,APTV",3,0,2,2,92
51,Steel,Basic Materials,81.64,87.53,98.77,102.30,"STLD,NUE",2,18,59,63,93
9,Airlines,Industrials,78.83,79.81,94.90,94.73,"LUV,DAL,UAL,AAL",1,4,46,42,94


In [None]:
# @title Top Percentile Stocks
min_percentile = 90 # @param {"type":"slider","min":1,"max":99,"step":1}
top_stocks = rank_stock[rank_stock[ibd.TITLE_PERCENTILE] >= min_percentile]
num_rows, _ = top_stocks.shape
print(f'\nnumber of filtered tickers: {num_rows}')
top_stock_list = list(top_stocks["Ticker"])
print(top_stock_list)


number of filtered tickers: 52
['NVDA', 'VST', 'COHR', 'IRM', 'NRG', 'GDDY', 'HWM', 'MMM', 'FICO', 'MHK', 'UHS', 'AXON', 'TRGP', 'KKR', 'NTAP', 'MPWR', 'AVGO', 'CFG', 'ANET', 'GE', 'DHI', 'K', 'TSM', 'NEM', 'PGR', 'LLY', 'PHM', 'ISRG', 'FITB', 'CBRE', 'GRMN', 'KEY', 'NVR', 'IP', 'SYF', 'GS', 'TT', 'VTR', 'META', 'RCL', 'EXR', 'HCA', 'GM', 'AFL', 'EFX', 'URI', 'DVA', 'CEG', 'COST', 'LEN', 'MSI', 'REGN']


In [None]:
# @title Filtered Stocks with Increasing RS > 100
filtered_rank_stock = filter_increasing_relative_strength(rank_stock)
data_table.DataTable(filtered_rank_stock, include_index=False, num_rows_per_page=10)

Unnamed: 0,Ticker,Sector,Industry,Relative Strength,1 Month Ago,3 Months Ago,6 Months Ago,Percentile,1 Month Ago.1,3 Months Ago.1,6 Months Ago.1,Rank
6,TRGP,Energy,Oil & Gas Midstream,130.08,124.88,117.91,103.72,97,95,91,68,13
126,CFG,Financial Services,Banks - Regional,125.1,118.91,110.99,93.27,96,94,84,44,18
334,NEM,Basic Materials,Gold,121.99,106.02,103.15,67.84,95,79,67,1,24
207,VTR,Real Estate,REIT - Healthcare Facilities,116.88,103.18,96.09,84.7,92,73,50,19,38
150,EXR,Real Estate,REIT - Industrial,116.59,108.55,94.13,89.21,92,84,44,32,41
185,MSI,Technology,Communication Equipment,114.78,107.08,104.71,96.75,90,81,71,51,51
362,PNC,Financial Services,Banks - Regional,114.41,110.63,104.93,98.2,89,87,71,55,53
125,WMT,Consumer Defensive,Discount Stores,114.28,108.07,106.62,98.5,89,84,76,55,54
132,WELL,Real Estate,REIT - Healthcare Facilities,114.22,107.96,103.73,98.8,89,83,68,56,55
171,TYL,Technology,Software - Application,113.39,109.68,105.29,96.87,88,86,73,52,60


### RS Rating and Ranking for Taiwan Stocks

In [None]:
from vistock import tw

source = "上市+上櫃" #@param ["上市", "上櫃", "上市+上櫃", "興櫃", "全部"]
period = "2y" # @param ["6mo","1y","ytd","2y"]

code_from_name = {
    '上市': 'TWSE',
    '上櫃': 'TPEX',
    '上市+上櫃': 'TWSE+TPEX',
    '興櫃': 'ESB',
    '全部': 'TWSE+TPEX+ESB'
}

tw_stocks, tw_industries = rank(code_from_name[source], period,
     tickers_getter=tw.get_tickers, ticker_ref='^TWII')
for df in (tw_stocks, tw_industries):
    display(data_table.DataTable(df, include_index=False, num_rows_per_page=10))



***
Request failed: 422 - {'message': 'Invalid request.\n\n"sha" wasn\'t supplied.', 'documentation_url': 'https://docs.github.com/rest/repos/contents#create-or-update-file-contents', 'status': '422'}
Your "TWSE+TPEX_stocks_2y_20240824.csv" is in the "out" folder.
Request failed: 422 - {'message': 'Invalid request.\n\n"sha" wasn\'t supplied.', 'documentation_url': 'https://docs.github.com/rest/repos/contents#create-or-update-file-contents', 'status': '422'}
Your "TWSE+TPEX_industries_2y_20240824.csv" is in the "out" folder.
***



Unnamed: 0,Ticker,Sector,Industry,Relative Strength,1 Month Ago,3 Months Ago,6 Months Ago,Percentile,1 Month Ago.1,3 Months Ago.1,6 Months Ago.1,Rank
790,6144,Communication Services,Entertainment,551.25,418.14,127.34,84.52,99,99,92,21,1
296,1799,Healthcare,Drug Manufacturers—Specialty & Generic,451.91,354.75,268.75,194.15,99,99,99,98,2
1205,6640,Technology,Semiconductors,418.13,371.68,240.75,217.75,99,99,99,98,3
1413,6442,Technology,Electronic Components,388.79,433.97,183.51,219.09,99,99,98,98,4
620,8374,Industrials,Industrial Distribution,356.81,348.68,103.01,82.73,99,99,78,16,5
...,...,...,...,...,...,...,...,...,...,...,...,...
1600,5227,Industrials,Electrical Equipment & Parts,55.67,63.15,57.40,70.69,0,1,0,1,2001
486,1256,Consumer Defensive,Beverages—Non-Alcoholic,55.50,61.00,65.15,85.63,0,0,3,25,2002
77,6958,Financial Services,Credit Services,55.46,70.14,72.97,88.75,0,7,12,38,2003
331,2740,Consumer Cyclical,Restaurants,54.62,57.12,67.92,79.67,0,0,6,10,2004


Unnamed: 0,Industry,Sector,Relative Strength,1 Month Ago,3 Months Ago,6 Months Ago,Tickers,Percentile,1 Month Ago.1,3 Months Ago.1,6 Months Ago.1,Rank
68,Industrial Distribution,Industrials,152.04,150.14,88.85,88.68,837491160831142373,99,99,56,30,1
60,Entertainment,Communication Services,142.67,124.74,92.46,94.68,614448066596844684506184662564646856,98,94,68,61,2
86,Utilities—Renewable,Utilities,139.56,143.16,98.57,111.78,6869687368068087,97,98,81,92,3
2,Real Estate—Development,Real Estate,133.10,130.09,120.39,107.18,"2524,5508,3188,5455,2537,1436,2718,6171,3489,6...",96,96,98,82,4
55,Real Estate—Diversified,Real Estate,124.37,128.11,121.33,115.29,1438621999462520254555122547,95,95,99,95,5
...,...,...,...,...,...,...,...,...,...,...,...,...
38,Credit Services,Financial Services,75.95,72.77,72.29,86.73,"9941A,6592A,9941,6592,5871,6958",4,2,4,20,91
17,Travel Services,Consumer Cyclical,75.81,78.37,92.06,85.60,2745273157062743271962422734,3,13,67,15,92
59,Pharmaceutical Retailers,Healthcare,72.51,68.48,70.28,85.38,417341756469,2,0,2,14,93
66,Auto Manufacturers,Consumer Cyclical,71.82,72.98,78.15,95.33,15992206222722042201,1,3,14,63,94


In [None]:
# @title Top Percentile Taiwan Stocks
min_percentile = 95 # @param {"type":"slider","min":1,"max":99,"step":1}

top_stocks = tw_stocks[tw_stocks[ibd.TITLE_PERCENTILE] >= min_percentile]
num_rows, _ = top_stocks.shape
print(f'\nnumber of filtered tickers: {num_rows}')
top_stock_list = list(top_stocks["Ticker"])
top_stock_list = [tw.stock_name(ticker) for ticker in top_stock_list]
print(top_stock_list)


number of filtered tickers: 101
['得利影', '易威', '均華', '光聖', '羅昇', '穎漢', '昆盈', '慧友', '福裕', '康全電訊', '錦明', '京城', '晶彩科', '新復興', '均豪', '皇昌', '擎亞', '福大', '海悅', '彬台', '欣巴巴', '所羅門', '弘塑', '天方能源', '志聖', '弘憶股', '翔耀', '新門', '東捷', '旺矽', '福懋油', '天揚', '順藥', '系微', '精湛', '高鋒', '太普高', '鑫科', '天品', '世紀', '訊舟', '昇陽半導體', '花王', '永信建', '合騏', '慶騰', '雲豹能源', '晟銘電', '聯鈞', '安國', '鈊象', '訊聯基因', '精材', '鏵友益', '鑫龍騰', '德晉', '峰源-KY', '錸德', '藝舍-KY', '萬潤', '華景電', '友威科', '東科-KY', '全譜', '昇益', '聯上發', '鈺邦', '力麗店', '喬福', '南仁湖', '泓德能源-創', '華城', '三地開發', '和椿', '及成', '達能', '上詮', '波力-KY', '華友聯', '惠特', '蜜望實', '泰谷', '泰金-KY', '迎廣', '藥華藥', '華義', '勝昱', '京晨科', '亞力', '德律', '亞光', '岱稜', '晶悅', '信紘科', '加捷生醫', '辛耘', '雷科', '信驊', '大城地產', '大量', '益登']


In [None]:
# @title Filtered Taiwan Stocks with Increasing RS > 100

def convert_to_list(value):
    if isinstance(value, str):
        return value.split(',')
    return value

filtered_tw_stocks = filter_increasing_relative_strength(tw_stocks)
update_tickers_with_names(filtered_tw_stocks, 'Ticker')

filtered_tw_industries = filter_increasing_relative_strength(tw_industries)
update_tickers_with_names(filtered_tw_industries, 'Tickers')
#filtered_tw_industries.loc[:, 'Tickers'] = filtered_tw_industries['Tickers'].apply(convert_to_list)

for df in (filtered_tw_stocks, filtered_tw_industries):
    display(data_table.DataTable(df, include_index=False, num_rows_per_page=10))

Unnamed: 0,Ticker,Sector,Industry,Relative Strength,1 Month Ago,3 Months Ago,6 Months Ago,Percentile,1 Month Ago.1,3 Months Ago.1,6 Months Ago.1,Rank
790,得利影,Communication Services,Entertainment,551.25,418.14,127.34,84.52,99,99,92,21,1
296,易威,Healthcare,Drug Manufacturers—Specialty & Generic,451.91,354.75,268.75,194.15,99,99,99,98,2
1205,均華,Technology,Semiconductors,418.13,371.68,240.75,217.75,99,99,99,98,3
620,羅昇,Industrials,Industrial Distribution,356.81,348.68,103.01,82.73,99,99,78,16,5
1946,穎漢,Industrials,Specialty Industrial Machinery,312.38,297.73,148.56,87.89,99,99,96,33,6
...,...,...,...,...,...,...,...,...,...,...,...,...
279,臻鼎-KY,Technology,Electronic Components,103.46,100.12,93.49,81.78,76,75,66,14,472
1392,東鹼,Basic Materials,Chemicals,103.11,88.13,83.97,81.41,76,56,44,13,480
1756,臺企銀,Financial Services,Banks—Regional,102.85,99.87,99.84,88.03,75,75,75,34,487
956,展宇,Basic Materials,Chemicals,101.29,81.63,80.42,76.73,74,40,33,6,522


Unnamed: 0,Industry,Sector,Relative Strength,1 Month Ago,3 Months Ago,6 Months Ago,Tickers,Percentile,1 Month Ago.1,3 Months Ago.1,6 Months Ago.1,Rank
68,Industrial Distribution,Industrials,152.04,150.14,88.85,88.68,"羅昇,明輝-DR,好德,震旦行",99,99,56,30,1
2,Real Estate—Development,Real Estate,133.1,130.09,120.39,107.18,"京城,永信建,鑫龍騰,昇益,聯上發,華友聯,晶悅,大城地產,森寶,新潤,理銘,富宇,坤悅,達...",96,96,98,82,4
24,Real Estate Services,Real Estate,112.39,112.21,111.52,104.12,"海悅,愛山林,綠意,台火,名軒,鉅陞,上曜,富裔,華建,全坤建,昇陽,宏璟,潤隆,亞昕,怡華...",89,91,96,80,11
69,Insurance—Life,Financial Services,101.12,90.58,85.99,84.49,"三商,新光金,三商壽,富邦金,新光金甲特,新光金乙特,國泰金,開發金,開發金乙特,國泰特,富...",77,63,44,8,22


### Remove files in GitHub Repository

In [None]:
# @title CSV Deleter
import re
import ipywidgets as widgets

# Example filenames
with requests_cache.disabled():
    all_filenames = github.list_filenames()

# Function to extract unique dates from filenames
def extract_dates(filenames):
    date_pattern = r'\d{8}'
    dates = set()
    for fn in filenames:
        match = re.search(date_pattern, fn)
        if match:
            dates.add(match.group(0))
    return sorted(dates, reverse=True)  # Sort dates from newest to oldest

# Function to remove a file (replace with your actual implementation)
def remove_file(filename):
    print(f"Removing file: {filename}")
    with requests_cache.disabled():
        github.remove_file(filename)
    all_filenames.remove(filename)

#-------------------------------------------------------------------------------

# Update file selector options based on selected date
def update_file_selector(change):
    def selector_width(filenames):
        max_filename_length = max(len(fn) for fn in filenames)
        return f'{max_filename_length * 10}px'  # 10px width per character

    selected_date = change['new']
    lst_fns = [fn for fn in all_filenames if selected_date in fn]
    file_selector_widget.options = lst_fns
    file_selector_widget.rows = len(file_selector_widget.options)
    file_selector_widget.layout=widgets.Layout(width=selector_width(lst_fns))

# Function to delete selected files
def delete_files(button):
    selected_files = file_selector_widget.value
    for file in selected_files:
        remove_file(file)
    update_widgets()    # Update widgets after deletion

# Update widgets to reflect current state
def update_widgets():
    # Refresh the date selector
    dates = extract_dates(all_filenames)
    selected_date = date_selector_widget.value
    if selected_date not in dates:
        i = date_selector_widget.options.index(selected_date)
        if i > len(dates) - 1:
            selected_date = dates[-1]
        else:
            selected_date = dates[i]
    date_selector_widget.options = dates
    date_selector_widget.value = selected_date
    if not dates:
        file_selector_widget.options = []
        return
    update_file_selector({'new': date_selector_widget.value})

#-------------------------------------------------------------------------------

# Create a widget for selecting dates
def create_date_selector(dates):
    return widgets.Dropdown(
        options=dates,
        value = dates[0],
        description='Date:',
        disabled=False
    )

# Create a widget for selecting files
def create_file_selector(filenames):

    return widgets.SelectMultiple(
        options=[],
        value=[],
        description='Files',
        disabled=False,
    )

# Create widgets
dates = extract_dates(all_filenames)
date_selector_widget = create_date_selector(dates)
file_selector_widget = create_file_selector(all_filenames)
delete_button = widgets.Button(description="Delete Selected Files")
delete_button.on_click(delete_files)

# Initialize the file selector with the latest date
update_widgets()

# Set up the observer to update file selector when date is changed
date_selector_widget.observe(update_file_selector, names='value')

# Display widgets
display(date_selector_widget)
display(file_selector_widget)
display(delete_button)


Dropdown(description='Date:', options=('20240824', '20240818', '20240813'), value='20240824')

SelectMultiple(description='Files', layout=Layout(width='430px'), options=('SPX+DJIA+NDX+SOX_industries_2y_202…

Button(description='Delete Selected Files', style=ButtonStyle())