<a href="https://colab.research.google.com/github/yorkjong/vistock/blob/main/notebooks/rsm_rating.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

### Stock Analysis and Ranking with RSM (Mansfield Relative Strength) Rating

### Install and Config

#### Install Required Packages

In [1]:
%pip install "git+https://github.com/yorkjong/vistock.git"
%pip install requests-cache

Collecting git+https://github.com/yorkjong/vistock.git
  Cloning https://github.com/yorkjong/vistock.git to /tmp/pip-req-build-mu0u_3jf
  Running command git clone --filter=blob:none --quiet https://github.com/yorkjong/vistock.git /tmp/pip-req-build-mu0u_3jf
  Resolved https://github.com/yorkjong/vistock.git to commit e10a3e1fba2226937200a5024216bab63f030208
  Preparing metadata (setup.py) ... [?25l[?25hdone
Collecting mplfinance (from vistock==0.5.2)
  Downloading mplfinance-0.12.10b0-py3-none-any.whl.metadata (19 kB)
Downloading mplfinance-0.12.10b0-py3-none-any.whl (75 kB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m75.0/75.0 kB[0m [31m2.2 MB/s[0m eta [36m0:00:00[0m
[?25hBuilding wheels for collected packages: vistock
  Building wheel for vistock (setup.py) ... [?25l[?25hdone
  Created wheel for vistock: filename=vistock-0.5.2-py3-none-any.whl size=83598 sha256=468ae36b77b20d84ab580cbb338843479b2a12fed24bb57986d5c51e4bb41465
  Stored in directory: /tmp/pi

#### Setup and Configuration

In [2]:
# @title Enable DataFrame Formatter
from google.colab import data_table
# Switch on Colab's DataFrame formatter for the rest of the notebook
# (presumably renders DataFrames as interactive tables -- see Colab docs).
data_table.enable_dataframe_formatter()

In [3]:
# @title Enable Requests Cache
import requests_cache
# Install a requests cache named 'ibd_cache' with expire_after=3600
# (seconds, per the requests-cache docs). Later cells wrap calls in
# requests_cache.disabled() when they need uncached responses.
requests_cache.install_cache('ibd_cache', expire_after=3600)

In [4]:
# @title GitHub
import base64
import requests
import pandas as pd
from io import StringIO


class GitHub:
    """Small client for the GitHub repository "contents" REST API.

    Every path given to a method is relative to the directory chosen at
    construction time, and every request targets the configured branch.
    Failures are reported with ``print`` and signalled through the return
    value (``None``, ``False``, ``[]`` or an empty DataFrame) instead of
    being raised.
    """

    def __init__(self, repo_owner, repo_name, token, dir='', branch='main'):
        """Remember the repository location and credentials.

        Parameters:
        - repo_owner: Owner (user or organisation) of the repository.
        - repo_name: Name of the repository.
        - token: Access token sent in the ``Authorization`` header.
        - dir: Optional base directory inside the repository; leading and
          trailing slashes are ignored.
        - branch: Branch that reads, writes and deletions operate on.
        """
        base = 'https://api.github.com/repos'
        dir = dir.strip('/')
        self.base_url = f'{base}/{repo_owner}/{repo_name}/contents'
        if dir:
            self.base_url += f'/{dir}'
        self.branch = branch
        self.token = token

    def _headers(self):
        """Return the request headers shared by every API call."""
        return {
            'Authorization': f'token {self.token}',
            'Accept': 'application/vnd.github.v3+json',
        }

    def _url(self, path=''):
        """Return the API URL for *path*; an empty path is the base dir."""
        path = path.strip('/')
        # Avoid a dangling '/' when addressing the base directory itself.
        return f'{self.base_url}/{path}' if path else self.base_url

    @staticmethod
    def _error_detail(response):
        """Return the decoded JSON error body, or the raw text if not JSON."""
        try:
            return response.json()
        except ValueError:
            # Error bodies are not guaranteed to be JSON (e.g. proxy pages).
            return response.text

    def _report_failure(self, response):
        """Print the status code and body of a failed response."""
        print(f"Request failed: {response.status_code} - "
              f"{self._error_detail(response)}")

    def _request(self, method, url, headers=None, params=None, json=None):
        """Send a request and return its decoded JSON body.

        Returns the parsed JSON for status 200/201 and ``None`` otherwise.
        A 404 is treated as a normal "not found" and is not printed; any
        other failure is printed.
        """
        response = requests.request(method, url, headers=headers,
                                    params=params, json=json)
        if response.status_code in (200, 201):
            return response.json()
        if response.status_code != 404:
            self._report_failure(response)
        return None

    def file_exists(self, file_path):
        """Return True if *file_path* exists on the branch, False on 404.

        Any other status is printed and ``None`` is returned.
        """
        response = requests.get(self._url(file_path), headers=self._headers(),
                                params={'ref': self.branch})
        if response.status_code == 200:
            return True
        if response.status_code == 404:
            return False
        self._report_failure(response)
        return None

    def list_filenames(self, dir_path=''):
        """Return the entry names found in *dir_path* on the branch.

        Returns an empty list (after printing the error) when the request
        fails.
        """
        response = requests.get(self._url(dir_path), headers=self._headers(),
                                params={'ref': self.branch})
        if response.status_code != 200:
            self._report_failure(response)
            return []
        entries = response.json()
        if isinstance(entries, dict):
            # The path named a single file, so the API returned one object
            # rather than a directory listing.
            entries = [entries]
        return [entry['name'] for entry in entries]

    def download_file(self, file_path):
        """Return the text of *file_path* wrapped in a ``StringIO``.

        Returns ``None`` (after printing the reason) when the file is
        missing, has no download URL, or the download fails.
        """
        file_info = self._request('GET', self._url(file_path),
                                  headers=self._headers(),
                                  params={'ref': self.branch})
        if not file_info:
            print(f"File '{file_path}' does not exist. Cannot download.")
            return None

        # Directory listings (a list) and some entries carry no download URL.
        download_url = (file_info.get('download_url')
                        if isinstance(file_info, dict) else None)
        if not download_url:
            print(f"'{file_path}' has no download URL. Cannot download.")
            return None

        response = requests.get(download_url)
        if response.status_code == 200:
            return StringIO(response.text)
        print(f"Failed to download file: "
              f"{response.status_code} - {response.text}")
        return None

    def download_csv(self, file_path):
        """Download *file_path* and parse it as CSV.

        Returns an empty DataFrame when the file cannot be downloaded or
        contains no data.
        """
        file_content = self.download_file(file_path)
        if file_content is None:
            return pd.DataFrame()
        try:
            return pd.read_csv(file_content)
        except pd.errors.EmptyDataError:
            return pd.DataFrame()

    def upload_file(self, file_path, content):
        """Create or update *file_path* on the branch with text *content*."""
        url = self._url(file_path)
        headers = self._headers()

        payload = {
            'message': 'Uploading file',
            # The contents API expects the file body base64-encoded.
            'content': base64.b64encode(content.encode()).decode(),
            'branch': self.branch,
        }

        # Updating an existing file requires its current blob SHA.
        # NOTE(review): if a requests cache is active, this lookup may return
        # a stale SHA -- confirm whether callers should bypass the cache.
        file_info = self._request('GET', url, headers=headers,
                                  params={'ref': self.branch})
        if file_info:
            payload['sha'] = file_info.get('sha')

        self._request('PUT', url, headers=headers, json=payload)

    def upload_df_as_csv(self, file_path, df):
        """Upload a DataFrame to a CSV file."""
        if not file_path.endswith('.csv'):
            file_path += '.csv'
        csv_content = df.to_csv(index=False)
        self.upload_file(file_path, csv_content)

    def remove_file(self, file_path):
        """Delete *file_path* from the branch; do nothing if it is absent."""
        url = self._url(file_path)
        headers = self._headers()

        # One lookup serves both as the existence check and as the source of
        # the SHA required for deletion. It must query the same branch the
        # deletion targets, otherwise the SHA may belong to another branch.
        file_info = self._request('GET', url, headers=headers,
                                  params={'ref': self.branch})
        if not file_info:
            print(f"File '{file_path}' does not exist. Skipping deletion.")
            return

        payload = {
            'message': 'Deleting file',
            'sha': file_info['sha'],
            'branch': self.branch,
        }
        self._request('DELETE', url, headers=headers, json=payload)

#-------------------------------------------------------------------------------

from google.colab import userdata

# Shared client used by the cells below. It points at the 'weinstein'
# directory of yorkjong/stock-reports (default branch argument), and the
# token is read from Colab's user data under 'GithubToken.stock-reports'.
github = GitHub(
    repo_owner='yorkjong',
    repo_name='stock-reports',
    token=userdata.get('GithubToken.stock-reports'),
    dir='weinstein',
)

In [5]:
# @title DataFrame Operations

def is_taiwan_stock_df(df):
    """Return True if the first ticker in ``df['Ticker']`` looks Taiwanese.

    A ticker counts as Taiwanese when it carries a '.TW' or '.TWO' suffix,
    or when it consists of digits only (suffix already removed). Only the
    first row is inspected. An empty DataFrame yields False.
    """
    if df.empty:
        return False
    # str() also covers numeric codes, e.g. a column parsed from CSV as ints.
    ticker = str(df['Ticker'].iloc[0])
    if ticker.endswith(('.TW', '.TWO')):
        # Codes such as '00636K.TW' contain letters, so the suffix decides.
        return True
    return ticker.isdigit()

def add_name_column(df):
    """Return *df* with a 'Name' column placed right after 'Ticker'.

    The names come from ``tw.stock_name`` applied to each ticker. The input
    is returned unchanged when it already has a 'Name' column, has no
    'Ticker' column, is empty, or does not hold Taiwan stocks. Otherwise a
    new DataFrame is returned and the input is left untouched.
    """
    column_names = df.columns.tolist()
    if 'Name' in column_names:
        return df
    if 'Ticker' not in column_names:
        return df
    if df.empty:
        return df
    if not is_taiwan_stock_df(df):
        return df

    # Work on a copy: avoids adding a column to the caller's DataFrame and
    # avoids assigning into a slice of it.
    result = df.copy()
    names = result['Ticker'].apply(tw.stock_name)
    result.insert(column_names.index('Ticker') + 1, 'Name', names)
    return result


def remove_ticker_suffix(df, ticker_column):
    """
    Remove the '.TW' or '.TWO' suffix from ticker codes in a DataFrame.

    The column is modified in place and nothing is returned. Only a
    trailing '.TW'/'.TWO' is removed; the same text elsewhere in a ticker
    is left alone.

    Parameters:
    - df: The DataFrame containing ticker codes.
    - ticker_column: The name of the column containing ticker codes.
    """
    # Anchor at the end of the string so that only a real suffix matches;
    # 'O?' covers both '.TW' and '.TWO' in one pass.
    df[ticker_column] = df[ticker_column].str.replace(
        r'\.TWO?$', '', regex=True)

In [6]:
# @title Rank Function

import os
from datetime import datetime

from vistock import rsm
from vistock import tw
from vistock.stock_indices import get_tickers


def remove_failed_tickers(tickers):
    """Return *tickers* without the symbols listed below as failing.

    Duplicates are dropped and the first-seen order of the remaining
    tickers is preserved, so the result is deterministic.
    """
    delisted = ['BRK.B', 'LEN.B', 'BF.B', 'UHAL.B', 'BF.A', 'CWEN.A', 'HEI.A']
    invalid = ['GEV', 'SOLV', 'VLTO', 'SW', 'ARM', 'CART', 'AS', 'BIRK',
               'VSTS', 'LOAR', 'ALAB', 'GRAL', 'SEG']
    invalid += ['00945B.TW', '6928.TW', '6914.TW', '6771.TW', '00944.TW',
                '8162.TW', '1563.TW', '00946.TW', '00941.TW', '6423.TW',
                '00940.TW', '00939.TW', '4949.TW', '00943.TW', '8487.TW',
                '6794.TW', '6949.TW', '4771.TW']
    invalid += ['00936.TW', '6805.TW', '2254.TW', '6658.TW', '00935.TW',
                '6592B.TW', '6526.TW', '6906.TW', '4736.TW', '00636K.TW',
                '6968.TWO', '4442.TWO', '6534.TW', '6901.TW', '00934.TW',
                '00657K.TW', '6472.TW', '2258.TW', '6916.TW', '2762.TW',
                '6933.TW']
    invalid += ['02001R.TW', '020031.TW', '020039.TW', '020016.TW',
                '02001L.TW', '020019.TW', '020028.TW', '020020.TW',
                '02001S.TW', '020018.TW', '020038.TW', '020034.TW',
                '020011.TW', '020030.TW', '020012.TW', '020036.TW',
                '020029.TW', '020000.TW', '020015.TW', '020037.TW']
    invalid += ['6890.TW', '00951.TW', '3150.TW', '6957.TW', '00947.TW',
                '00949.TW']
    invalid += ['6838.TW', '00953B.TW', '00956.TW', '00954.TW']

    excluded = set(delisted) | set(invalid)
    # dict.fromkeys de-duplicates while keeping the caller's ordering.
    return [t for t in dict.fromkeys(tickers) if t not in excluded]

def rank(code, period='2y', ma="EMA", ticker_ref='^GSPC', out_dir='out'):
    """Build the RSM ranking table for *code* and publish it as a CSV.

    The tickers for *code* are ranked with ``rsm.ranking``. A 'Name' column
    is added where ``add_name_column`` applies, and '.TW'/'.TWO' suffixes
    are removed from the 'Ticker' column. The table is then uploaded through
    the module-level ``github`` client and written to *out_dir*.

    Parameters:
    - code: Identifier passed to ``get_tickers``; also used in the filename.
    - period: Passed to ``rsm.ranking`` and used in the filename.
    - ma: Moving-average type passed to ``rsm.ranking``.
    - ticker_ref: Reference ticker passed to ``rsm.ranking``.
    - out_dir: Local output directory, created if missing.

    Returns the ranking DataFrame, or None when the ranking is empty.
    """
    symbols = get_tickers(code)
    # Filtering through remove_failed_tickers() is intentionally disabled:
    #symbols = remove_failed_tickers(symbols)

    table = rsm.ranking(symbols, period=period, ticker_ref=ticker_ref, ma=ma)
    if table.empty:
        print("Not enough data to generate rankings.")
        return None

    table = add_name_column(table)
    remove_ticker_suffix(table, 'Ticker')  # strips '.TW' / '.TWO' in place

    # Publish: GitHub first, then the local copy.
    print("\n\n***")
    os.makedirs(out_dir, exist_ok=True)
    stamp = datetime.now().strftime('%Y%m%d')
    filename = f'{code}_stocks_{period}_{ma}_{stamp}.csv'
    github.upload_df_as_csv(filename, table)
    local_path = os.path.join(out_dir, filename)
    table.to_csv(local_path, index=False)
    print(f'Your "{filename}" is in the "{out_dir}" folder.')
    print("***\n")

    return table

### RS Rating and Ranking

In [8]:
# Colab form fields: which index/market to rank and the moving-average type.
source = "U.S. Listed Stocks" #@param ["S&P 500", "Dow Jones Industrial Average", "NASDAQ 100", "Russell 1000", "Russell 2000", "PHLX Semiconductor", "U.S. Listed Stocks"]
ma = "SMA" # @param ["EMA","SMA"]

# Maps the display name chosen in the form to the code passed to rank().
code_from_name = {
    'S&P 500': 'SPX',
    'Dow Jones Industrial Average': 'DJIA',
    'NASDAQ 100': 'NDX',
    'Russell 1000': 'RUI',
    'Russell 2000': 'RUT',
    'PHLX Semiconductor': 'SOX',
    'U.S. Listed Stocks': 'U.S.Listed',
}

# Uses rank()'s default reference ticker ('^GSPC') and default period.
# NOTE(review): rank() returns None when the ranking is empty, so `df` may be
# None when it reaches DataTable below.
df = rank(code_from_name[source], ma=ma)
data_table.DataTable(df, include_index=False, num_rows_per_page=20)

[**********************100%**********************]  5442 of 5442 info downloaded


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['Volume'] = df['Volume'].fillna(0).astype(np.int64)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['Volume'] = df['Volume'].fillna(0).astype(np.int64)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['Volume'] = df['Volume'].fillna(0).astype(np.int64)
A value is trying to be set on a copy of

Num of downloaded stocks: 5442
[                        0%                      ]  18 of 5441 financials downloaded
[                        1%                      ]  29 of 5441 financials downloaded
[                        1%                      ]  32 of 5441 financials downloaded
[                        1%                      ]  33 of 5441 financials downloaded

[                        1%                      ]  43 of 5441 financials downloaded
[                        1%                      ]  50 of 5441 financials downloaded
[                        1%                      ]  51 of 5441 financials downloaded
[                        1%                      ]  73 of 5441 financials downloaded
[                        1%                      ]  81 of 5441 financials downloaded
[                        2%                      ]  90 of 5441 financials downloaded
[                        2%                      ]  101 of 5441 financials downloaded
[                        2%     

Unnamed: 0,Ticker,Sector,Industry,RS (%),1 Week Ago,1 Month Ago,3 Months Ago,6 Months Ago,9 Months Ago,RS Rank (%),Price,MA10,MA30,Volume / VMA10,EPS RS (%),TTM EPS,Rev RS (%),TTM RPS,TTM PE
2807,LASE,Industrials,Specialty Industrial Machinery,503.21,494.18,84.39,3.37,-26.65,-62.63,100.00,16.31,6.78,3.55,0.24,173.20,-0.65,-47.13,0.389,
4783,TIL,Healthcare,Biotechnology,314.69,335.41,23.75,-6.91,-7.82,-38.56,99.98,67.32,35.82,19.40,0.07,394.70,-18.39,0.53,,
1516,DUO,Real Estate,Real Estate Services,302.16,73.14,-48.42,-63.48,-91.82,-92.75,99.96,3.10,0.77,0.65,3.52,,-3.20,,73.309,
3344,NEON,Technology,Electronic Components,202.52,244.05,217.51,-10.56,-65.09,-60.18,99.94,9.10,6.54,3.60,0.10,238.15,-0.67,28.99,0.289,
4451,SMMT,Healthcare,Biotechnology,197.14,199.86,144.41,108.97,48.74,10.28,99.92,21.90,17.02,9.69,0.13,178.15,-0.11,0.53,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5418,ZJK,,,,,,,,,,,,,,,,,,38.46
5420,ZK,Consumer Cyclical,Auto Manufacturers,,,,,,,,,,,,224.12,-4.98,0.53,314.047,
5421,ZKH,Consumer Cyclical,Internet Retail,,,,,,,,,,,,738.70,-0.37,2.70,82.533,
5426,ZOOZ,Consumer Cyclical,Specialty Retail,,,,,,,,,,,,,-22.44,,0.069,


### RS Rating and Ranking for Taiwan Stocks

In [7]:
from vistock import tw

# Colab form fields: which Taiwan market(s) to rank and the moving-average
# type.
source = "上市+上櫃" #@param ["上市", "上櫃", "上市+上櫃", "興櫃", "全部"]
ma = "SMA" # @param ["EMA","SMA"]

# Maps the display name chosen in the form to the code passed to rank();
# combined markets are joined with '+'.
code_from_name = {
    '上市': 'TWSE',
    '上櫃': 'TPEX',
    '上市+上櫃': 'TWSE+TPEX',
    '興櫃': 'ESB',
    '全部': 'TWSE+TPEX+ESB'
}

# Rank against '^TWII' instead of rank()'s default reference ticker.
# NOTE(review): rank() returns None when the ranking is empty, so `df_tw` may
# be None when it reaches DataTable below.
df_tw = rank(code_from_name[source], ma=ma, ticker_ref='^TWII')
data_table.DataTable(df_tw, include_index=False, num_rows_per_page=20)

[**********************100%**********************]  2087 of 2087 info downloaded


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['Volume'] = df['Volume'].fillna(0).astype(np.int64)
[*********************100%***********************]  1889 of 1889 completed
ERROR:yfinance:
33 Failed downloads:
ERROR:yfinance:['6928.TW', '6957.TW', '6423.TW', '3150.TW', '6794.TW', '1563.TW', '6771.TW', '6890.TW', '4949.TW', '6914.TW']: YFInvalidPeriodError("%ticker%: Period '2y' is invalid, must be one of ['1d', '5d', '1mo', '3mo', '6mo', 'ytd', 'max']")
ERROR:yfinance:['6526.TW', '6916.TW', '6906.TW', '8487.TW', '6933.TW', '6949.TW', '4771.TW', '6534.TW', '8162.TW', '6472.TW', '6805.TW', '6658.TW', '2258.TW', '2762.TW', '4736.TW', '4442.TWO', '2254.TW']: YFInvalidPeriodError("%ticker%: Period '2y' is invalid, must be one of ['1d', '5d', '1mo', '3mo', '6mo', '1y', 'ytd

Num of downloaded stocks: 1889

[                        0%                      ]  2 of 1888 financials downloaded
[***                     7%                      ]  123 of 1888 financials downloaded
[********               17%                      ]  330 of 1888 financials downloaded
[*************          28%                      ]  534 of 1888 financials downloaded
[*************          28%                      ]  538 of 1888 financials downloaded
[*************          29%                      ]  546 of 1888 financials downloaded
[*************          29%                      ]  547 of 1888 financials downloaded
[*************          29%                      ]  548 of 1888 financials downloaded
[*************          29%                      ]  550 of 1888 financials downloaded
[**************         29%                      ]  551 of 1888 financials downloaded
[**************         29%                      ]  554 of 1888 financials downloaded
[**************         

Unnamed: 0,Ticker,Name,Sector,Industry,RS (%),1 Week Ago,1 Month Ago,3 Months Ago,6 Months Ago,9 Months Ago,RS Rank (%),Price,MA10,MA30,Volume / VMA10,EPS RS (%),TTM EPS,Rev RS (%),TTM RPS,TTM PE
1300,6144,得利影,Communication Services,Entertainment,198.74,202.71,238.07,109.39,2.71,-12.81,100.00,115.5,98.65,53.72,0.78,-22.18,-0.44,-17.51,5.190,
708,3230,錦明,Technology,Electronic Components,198.22,192.65,210.13,12.90,-19.79,-28.14,99.95,57.5,41.95,23.71,0.10,507.88,3.69,-40.84,10.307,15.58
1065,4909,新復興,Technology,Electronic Components,123.96,127.17,78.69,98.14,143.27,35.77,99.89,190.0,140.30,110.01,0.69,12.98,3.96,42.32,11.834,47.98
269,2070,精湛,Industrials,Specialty Industrial Machinery,122.82,127.66,92.67,0.85,1.85,-13.19,99.84,111.5,87.48,55.85,0.72,23.87,3.60,-3.15,19.149,30.97
1828,8937,合騏,Consumer Cyclical,Recreational Vehicles,116.85,124.34,130.26,-15.53,-14.76,-0.32,99.78,69.2,55.43,34.57,0.30,46.85,1.12,46.76,1.649,61.79
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1655,6949,沛爾生醫-創,Healthcare,Biotechnology,,,,,,,,,,,,739.69,-7.87,1.43,0.346,
1659,6957,裕慶-KY,Consumer Cyclical,"Furnishings, Fixtures & Appliances",,,,,,,,,,,,-110.47,13.48,-29.50,68.984,17.28
1663,6969,成信實業*-創,,,,,,,,,,,,,,,,,,
1730,8162,微矽電子-創,Technology,Semiconductors,,,,,,,,,,,,-907.89,0.66,-15.55,15.150,52.42


### Remove files in GitHub Repository

In [None]:
# @title CSV Deleter
import re
import ipywidgets as widgets

# Fetch the current filenames from the GitHub directory, with the requests
# cache disabled for the call. The widget callbacks below read and mutate
# this module-level list.
with requests_cache.disabled():
    all_filenames = github.list_filenames()

# Function to extract unique dates from filenames
def extract_dates(filenames):
    """Return the distinct 8-digit date strings found in *filenames*.

    The first run of eight digits in each filename is taken as its date;
    filenames without one are ignored. The result is sorted in descending
    order, so the newest date comes first.
    """
    matches = (re.search(r'\d{8}', name) for name in filenames)
    unique_dates = {found.group(0) for found in matches if found}
    return sorted(unique_dates, reverse=True)

# Remove a file from the GitHub repository and from the local filename list
def remove_file(filename):
    """Delete *filename* through the GitHub client and forget it locally.

    The GitHub call runs with the requests cache disabled. Afterwards the
    name is removed from the module-level ``all_filenames`` list.
    """
    print(f"Removing file: {filename}")
    uncached = requests_cache.disabled()
    with uncached:
        github.remove_file(filename)
    all_filenames.remove(filename)

#-------------------------------------------------------------------------------

# Update file selector options based on selected date
def update_file_selector(change):
    """Show the files whose name contains the newly selected date.

    *change* is a trait-change mapping; only ``change['new']`` is read. When
    no date is selected (``None``) or nothing matches, the file list is
    emptied instead of raising.
    """
    selected_date = change['new']
    if selected_date:
        matching = [fn for fn in all_filenames if selected_date in fn]
    else:
        # The dropdown value is None once no dated file is left.
        matching = []

    file_selector_widget.options = matching
    file_selector_widget.rows = len(matching)
    if matching:
        # Rough sizing: 10px of width per character of the longest name.
        longest = max(len(fn) for fn in matching)
        file_selector_widget.layout = widgets.Layout(width=f'{longest * 10}px')


# Function to delete selected files
def delete_files(button):
    """Button callback: remove every selected file, then refresh widgets."""
    selected_files = file_selector_widget.value
    for file in selected_files:
        remove_file(file)
    update_widgets()    # Update widgets after deletion


# Update widgets to reflect current state
def update_widgets():
    """Re-sync the date dropdown and the file list with ``all_filenames``.

    If the selected date no longer exists, the date at the same position in
    the new list is chosen, or the last one if that position is gone. When
    no dates remain, both widgets are emptied.
    """
    dates = extract_dates(all_filenames)
    if not dates:
        # Nothing left to choose: clear both widgets. Do not re-assign the
        # old value, which would no longer be a valid dropdown option.
        date_selector_widget.options = []
        file_selector_widget.options = []
        return

    selected_date = date_selector_widget.value
    if selected_date not in dates:
        previous = list(date_selector_widget.options)
        # Fall back to the first date when there was no prior selection.
        i = previous.index(selected_date) if selected_date in previous else 0
        selected_date = dates[min(i, len(dates) - 1)]

    date_selector_widget.options = dates
    date_selector_widget.value = selected_date
    # Refresh explicitly: the observer is not registered yet on the first
    # call, and the value may be unchanged on later ones.
    update_file_selector({'new': selected_date})

#-------------------------------------------------------------------------------

# Create a widget for selecting dates
def create_date_selector(dates):
    """Return a 'Date:' dropdown over *dates*, preselecting the first one.

    With no dates the dropdown starts without a selection (value None).
    """
    initial = dates[0] if dates else None
    selector = widgets.Dropdown(
        options=dates,
        value=initial,
        description='Date:',
        disabled=False,
    )
    return selector

# Create a widget for selecting files
def create_file_selector(filenames):
    """Return an empty multi-select list labelled 'Files'.

    *filenames* is accepted but not used here; the options are filled in
    later by the update callbacks.
    """
    selector_config = {
        'options': [],
        'value': [],
        'description': 'Files',
        'disabled': False,
    }
    return widgets.SelectMultiple(**selector_config)

# Create widgets
# Build the three widgets from the filenames fetched above and hook the
# button up to the deletion callback.
dates = extract_dates(all_filenames)
date_selector_widget = create_date_selector(dates)
file_selector_widget = create_file_selector(all_filenames)
delete_button = widgets.Button(description="Delete Selected Files")
delete_button.on_click(delete_files)

# Initialize the file selector with the latest date (dates are sorted newest
# first). This runs before the observer below is registered.
update_widgets()

# Set up the observer to update file selector when date is changed
date_selector_widget.observe(update_file_selector, names='value')

# Display widgets
display(date_selector_widget, file_selector_widget, delete_button)