## SILVER TO GOLD LAYER

### Gold Layer - Holdings


In [None]:
# Import common utility functions

import pandas as pd
from PortfolioTracker import GlobalPath, Portfolio

In [None]:
# Import necessary libraries and utility functions
%run ../COMMON/common_utility.ipynb

In [None]:
# Wrap every data file used by this notebook in a GlobalPath, grouped by layer.

# SILVER layer: files read by this notebook
tradehistory_silver_file_path = GlobalPath(
    "DATA/SILVER/TradeHistory/TradeHistory_data.csv"
)
stockprice_silver_file_path = GlobalPath(
    "DATA/SILVER/StockPrice/StockPrice_data.csv"
)
symbol_silver_file_path = GlobalPath("DATA/SILVER/Symbol/Symbol_data.csv")

# GOLD layer: files written by this notebook
current_holding_records_file_path = GlobalPath(
    "DATA/GOLD/Holdings/CurrentHoldings_data.csv"
)
holdingshistory_gold_file_path = GlobalPath(
    "DATA/GOLD/Holdings/HoldingsHistory_data.csv"
)

# SOURCE layer: per-symbol holding date ranges written by the last cell
holdingshistory_source_layer_path = GlobalPath(
    "DATA/SOURCE/Holdings/HoldingsHistory_data.csv"
)

### Data Processing

- Read and sort trade history data.
- Apply portfolio trade logic.


In [None]:
# Load the SILVER layer trade history.
df_trade_history = pd.read_csv(tradehistory_silver_file_path)

# Keep only rows whose segment is 'EQ' (Equity) or 'MF' (Mutual Funds).
# The explicit copy makes the filtered result an independent frame, so the
# column assignment below never writes into a slice of the original frame
# (which would raise SettingWithCopyWarning and may silently not stick).
df_trade_history = df_trade_history[
    df_trade_history["segment"].isin(["EQ", "MF"])
].copy()

# Convert 'datetime' to datetime type
df_trade_history["datetime"] = pd.to_datetime(df_trade_history["datetime"])

# Sort chronologically. A stable sort keeps trades that share a timestamp in
# their original file order, so the replay order is deterministic.
df_trade_history = df_trade_history.sort_values(by="datetime", kind="stable")

print(
    f"Read SILVER Layer trade history data from: {tradehistory_silver_file_path}"
)

### Portfolio Logic Application

- Instantiate Portfolio and apply trade logic.
- Handle expired stocks


In [None]:
# Feed every trade, in the row order of df_trade_history, into a fresh Portfolio.
portfolio = Portfolio()
trade_records = df_trade_history.to_dict(orient="records")
for trade_record in trade_records:
    portfolio.trade(trade_record)

# Let the portfolio deal with expired instruments once all trades are applied.
# NOTE(review): exact handling lives in Portfolio.check_expired_stocks - confirm there.
# expired_stocks example : df_trade_history["scrip_name"] == "NIFTY-PE-24650-18JUL2024"
portfolio.check_expired_stocks()

### Final Processing and Export

- Select and sort relevant columns.
- Save the processed data as a CSV file in the Gold layer.


In [None]:
# Build the current-holdings table from the positions reported by the portfolio
df_holding_records = pd.DataFrame(portfolio.get_current_holdings())

# Drop the "open_" marker from column names so they match the plain names
# ("side", "quantity", "price", "amount", ...) selected further down
df_holding_records = df_holding_records.rename(
    columns={
        col: col.replace("open_", "") for col in df_holding_records.columns
    }
)

# Sort the DataFrame
df_holding_records = df_holding_records.sort_values(
    by=[
        "segment",
        "exchange",
        "symbol",
        "scrip_name",
        "datetime",
    ]
)

# Round the numeric values to two decimal places
df_holding_records = df_holding_records.round(2)

# Reset index to ensure it starts from 0
df_holding_records = df_holding_records.reset_index(drop=True)

# Select and reorder the columns for the final DataFrame
df_holding_records = df_holding_records[
    [
        "scrip_name",
        "symbol",
        "exchange",
        "segment",
        "datetime",
        "side",
        "quantity",
        "price",
        "amount",
    ]
]

# Save the final DataFrame to a CSV file. `index` is documented as a bool,
# so pass False explicitly instead of relying on None being falsy.
df_holding_records.to_csv(current_holding_records_file_path, index=False)

print("GOLD Layer CSV file for Current Holdings successfully created at:")
print(current_holding_records_file_path)

# Display summary information about the DataFrame
df_holding_records.info()

In [None]:
# Holdings history returned by the portfolio, rounded to two decimal places
df_holdings = pd.DataFrame(portfolio.get_holdings_history()).round(2)

# Calendar date of each record, used as the per-day grouping key
df_holdings = df_holdings.assign(date=df_holdings["datetime"].dt.date)

# For every (scrip_name, date) pair keep only the row with the latest
# timestamp, i.e. one record per scrip per day
idx = df_holdings.groupby(["scrip_name", "date"])["datetime"].idxmax()
df_holdings = df_holdings.loc[idx].reset_index(drop=True)

In [None]:
# Create a function to expand the date range for each stock


def expand_dates(stock_df, end_date=None):
    """
    Expands the rows of a single stock to one row per calendar day, from the
    stock's earliest date up to ``end_date``, forward filling the days that
    have no record of their own.

    Parameters:
    stock_df (pd.DataFrame): DataFrame containing data for a single stock.
        Must have a 'date' column with at most one row per date.
    end_date (optional): Last day of the expanded range; anything accepted by
        ``pd.Timestamp``. Defaults to today, which is the original behaviour.

    Returns:
    pd.DataFrame: DataFrame with a datetime 'date' column covering the full
        daily range and all other columns forward-filled.
    """
    # Convert explicitly so label matching in reindex() works on real
    # timestamps instead of relying on implicit date -> datetime promotion.
    dates = pd.to_datetime(stock_df["date"])

    # Upper bound of the range: caller-supplied, or "today" when omitted
    end = pd.to_datetime("today") if end_date is None else pd.Timestamp(end_date)

    # One entry per day from the first recorded date to the end date
    date_range = pd.date_range(start=dates.min(), end=end)

    # Align the stock rows on the full daily range; days without a record
    # become all-NaN rows
    expanded = stock_df.assign(date=dates).set_index("date").reindex(date_range)

    # Carry the last known values forward and turn the index back into a
    # 'date' column
    return expanded.ffill().rename_axis("date").reset_index()


# Expand each scrip's rows to a continuous daily series. The grouping key is
# excluded from the frames handed to expand_dates and comes back as an index
# level, which reset_index() turns into a regular column again.
holdings_by_scrip = df_holdings.groupby("scrip_name")
df_holdings = holdings_by_scrip.apply(
    expand_dates, include_groups=False
).reset_index()

In [None]:
# Read the SILVER layer stock prices and parse 'date' so it has the same
# datetime type as the 'date' column of the expanded holdings
df_stockprice = pd.read_csv(stockprice_silver_file_path)
df_stockprice["date"] = pd.to_datetime(df_stockprice["date"])

print(
    f"Loaded SILVER Layer stock price data from: {stockprice_silver_file_path}"
)

# Attach the price columns to each holding row; the left join keeps holding
# rows that have no matching price for that date and symbol
df_holdings = df_holdings.merge(
    df_stockprice,
    how="left",
    on=["date", "symbol"],
)

In [None]:
# Calculate the OHLC value of holdings
col_names = ["open", "high", "low", "close"]

# Forward fill days that have no price row, but only within the same scrip.
# The rows are laid out scrip after scrip, so a frame-wide ffill would copy
# the last price of the previous scrip into a scrip whose first days (or
# whole history) have no price data.
fill_cols = [col for col in df_holdings.columns if col != "scrip_name"]
df_holdings[fill_cols] = df_holdings.groupby("scrip_name", dropna=False)[
    fill_cols
].ffill()

# Derive price and amount columns after the fill, so each day's amount uses
# that day's holding quantity with the last known price
for col_name in col_names:
    df_holdings[f"{col_name}_price"] = df_holdings[col_name]
    df_holdings[f"{col_name}_amount"] = (
        df_holdings[col_name] * df_holdings["holding_quantity"]
    )

# Filter out rows with zero holding quantity
df_holdings = df_holdings[df_holdings["holding_quantity"] != 0]

# Round the numeric values to two decimal places
df_holdings = df_holdings.round(2)

In [None]:
# Sort the DataFrame for organized output
df_holdings = df_holdings.sort_values(
    by=[
        "date",
        "segment",
        "exchange",
        "symbol",
        "scrip_name",
    ]
)

# Reset index to ensure it starts from 0
df_holdings = df_holdings.reset_index(drop=True)

# Select and reorder the columns for the final DataFrame
df_holdings = df_holdings[
    [
        "date",
        "segment",
        "exchange",
        "symbol",
        "scrip_name",
        "holding_quantity",
        "avg_price",
        "holding_amount",
        "open_price",
        "open_amount",
        "high_price",
        "high_amount",
        "low_price",
        "low_amount",
        "close_price",
        "close_amount",
    ]
]

# Save the final processed DataFrame to a new CSV file. `index` is documented
# as a bool, so pass False explicitly instead of relying on None being falsy.
df_holdings.to_csv(holdingshistory_gold_file_path, index=False)

print(
    f"GOLD Layer CSV file for Holdings successfully created at: {holdingshistory_gold_file_path}"
)

# Display summary information about the final DataFrame
df_holdings.info()

In [None]:
# Load the symbol data used to attach an ISIN to each held symbol
df_symbol = pd.read_csv(symbol_silver_file_path)
print(f"Loaded data from: {symbol_silver_file_path}")

# Collapse the daily holdings to one row per (segment, exchange, symbol)
# carrying the first and last date on which it was held
df_holdings = (
    df_holdings.groupby(["segment", "exchange", "symbol"])
    .agg(min_date=("date", "min"), max_date=("date", "max"))
    .reset_index()
)

# Attach the ISIN for each symbol. Exact duplicate (symbol, isin) rows are
# dropped first so they cannot multiply the holding rows in the join.
df_holdings = df_holdings.merge(
    df_symbol[["symbol", "isin"]].drop_duplicates(),
    on="symbol",
    how="left",
)


# Save the date ranges to the SOURCE layer file. `index` is documented as a
# bool, so pass False explicitly instead of relying on None being falsy.
df_holdings.to_csv(holdingshistory_source_layer_path, index=False)

# The file is written to the SOURCE layer path, so the message says so
print(
    f"SOURCE Layer CSV file for Holdings successfully created at: {holdingshistory_source_layer_path}"
)

# Display summary information about the final DataFrame
df_holdings.info()