This notebook contains code for implementing the Heston model and calibrating model parameters, followed by Monte Carlo simulations to validate the model.

# Importing Libraries

In [23]:
import os
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import time
import warnings
import plotly.graph_objects as go

from scipy.integrate import quad
from scipy.optimize import minimize
from datetime import datetime as dt

from nelson_siegel_svensson.calibrate import calibrate_nss_ols

# Implementing Heston Model
Heston model known parameters (from market data):
- initial asset price (S0) 
- risk-free interest rate (r) 
- time to maturity(T) 
- strike price (K)

unknown parameters (determined through optimization algorithms and calibration techniques):
- initial volatility (v0),
- speed of mean-reversion (kappa)
- long term mean of volatility (theta)
- volatility of volatility (sigma)
- correlation between the two wiener processes for asset price and volatility (rho)

Heston equations (SDEs, PDE, characteristic function) are from this paper:
https://www.maths.univ-evry.fr/pages_perso/crepey/Finance/051111_mikh%20heston.pdf

In [24]:
# Defining heston model characteristic function
# Characteristic function derived by assuming form and substituting into Heston PDE (from )

def heston_char_func(phi, S0, K, v0, tau, r, sigma, rho, kappa, theta, lambd):

    # commonly used term
    rspi = rho*sigma*phi*1j

    # constants
    a = kappa*theta
    b = kappa+lambd

    # d and g parameter in heston characteristic function
    d = np.sqrt((rspi - b)**2 + sigma**2 * (phi*1j+phi**2))
    g = (b-rspi+d) / (b-rspi-d)

    exp1 = np.exp(r*phi*1j*tau)
    term1 = S0**(1j*phi) * ((1-g*np.exp(d*tau))/(1-g))**(-2*a/sigma**2)
    exp2 = np.exp(a*tau/sigma**2 * (b-rspi+d) + v0/sigma**2 * (b-rspi+d)*((1-np.exp(d*tau))/(1-g*np.exp(d*tau))))

    return exp1*term1*exp2

In [25]:
# Using numerical integration to simplify the process of finding price
def heston_call_price(S0, K, v0, tau, r, sigma, rho, kappa, theta, lambd):
    args = (S0, K, v0, tau, r, sigma, rho, kappa, theta, lambd)
    
    # 10000 steps and range of 1-100, each step (dphi) is 0.01
    P, umax, N = 0, 100, 10000
    dphi=umax/N 
    
    # Loop through all the steps and summing the value of integral at each step
    for i in range (1,N):
        phi = dphi * (2*i + 1)/2
        
        # P is 0 intially, and the value of the integral * dphi is added to P each step 
        P += ((np.exp(r*tau)*heston_char_func(phi-1j,*args) - K * heston_char_func(phi,*args)) / (1j*phi*K**(1j*phi))) * dphi

    # Substituting the value of the integral into equation for cost and taking the real value
    return np.real((S0 - K*np.exp(-r*tau))/2 + P/np.pi)

In [26]:
S0 = 105
K = 110
v0 = 0.04
tau = 0.1
r = 0.05
sigma = 0.6
rho = -0.8
kappa = 3
theta = 0.04
lambd = 0.8

heston_call_price(S0, K, v0, tau, r, sigma, rho, kappa, theta, lambd)

np.float64(0.5687456253728729)

# Getting Real World Data
## Risk Free Interest Rate

In [146]:
rates_df = pd.read_csv('/Users/wongmarco/Downloads/daily-treasury-rates.csv')
rates_df['Date'] = pd.to_datetime(rates_df['Date'], format='%m/%d/%Y')
rates_df

Unnamed: 0,Date,1 Mo,2 Mo,3 Mo,4 Mo,6 Mo,1 Yr,2 Yr,3 Yr,5 Yr,7 Yr,10 Yr,20 Yr,30 Yr
0,2023-12-29,5.60,5.59,5.40,5.41,5.26,4.79,4.23,4.01,3.84,3.88,3.88,4.20,4.03
1,2023-12-28,5.57,5.55,5.45,5.42,5.28,4.82,4.26,4.02,3.83,3.84,3.84,4.14,3.98
2,2023-12-27,5.55,5.53,5.44,5.42,5.26,4.79,4.20,3.97,3.78,3.81,3.79,4.10,3.95
3,2023-12-26,5.53,5.52,5.45,5.44,5.28,4.83,4.26,4.05,3.89,3.91,3.89,4.20,4.04
4,2023-12-22,5.54,5.52,5.44,5.45,5.31,4.82,4.31,4.04,3.87,3.92,3.90,4.21,4.05
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
245,2023-01-09,4.37,4.58,4.70,4.74,4.83,4.69,4.19,3.93,3.66,3.60,3.53,3.83,3.66
246,2023-01-06,4.32,4.55,4.67,4.74,4.79,4.71,4.24,3.96,3.69,3.63,3.55,3.84,3.67
247,2023-01-05,4.30,4.55,4.66,4.75,4.81,4.78,4.45,4.18,3.90,3.82,3.71,3.96,3.78
248,2023-01-04,4.20,4.42,4.55,4.69,4.77,4.71,4.36,4.11,3.85,3.79,3.69,3.97,3.81


In [28]:
# Unused code: we are simplifying it by using only the 1 Month par yield curve rates to look at options with short maturitities
# This can be used in the future for a range of maturities and for better accuracy (curving it so it is more accurate daily)

# Using Nelson Siegel Svennson model (parametric) to analyse yield curve using ordinary least squares
# maturities = rates_df.columns.astype(float).to_numpy()
# rates_df['curve_fit'] = rates_df.apply(lambda row: calibrate_nss_ols(maturities, row.values)[0], axis=1)

## Option data
Option data is downloaded from optionsdx in form of CSV files (This project doesn't require real time quoting of option data)

In [142]:
# File path below contains EOD option data for NVDA in 2023 (we will be using 2023 Jan to Nov data to estimate option prices for Dec 2023 )
file_path = ['/Users/wongmarco/Downloads/nvda_eod_2023q1-0x56e5/nvda_eod_202301.txt','/Users/wongmarco/Downloads/nvda_eod_2023q1-0x56e5/nvda_eod_202302.txt','/Users/wongmarco/Downloads/nvda_eod_2023q1-0x56e5/nvda_eod_202303.txt','/Users/wongmarco/Downloads/nvda_eod_2023q2-miyyse/nvda_eod_202304.txt','/Users/wongmarco/Downloads/nvda_eod_2023q2-miyyse/nvda_eod_202305.txt','/Users/wongmarco/Downloads/nvda_eod_2023q2-miyyse/nvda_eod_202306.txt','/Users/wongmarco/Downloads/nvda_eod_2023q3-vzquiq/nvda_eod_202307.txt','/Users/wongmarco/Downloads/nvda_eod_2023q3-vzquiq/nvda_eod_202308.txt','/Users/wongmarco/Downloads/nvda_eod_2023q3-vzquiq/nvda_eod_202309.txt','/Users/wongmarco/Downloads/nvda_eod_2023q4-jf5cdq/nvda_eod_202310.txt','/Users/wongmarco/Downloads/nvda_eod_2023q4-jf5cdq/nvda_eod_202311.txt']


dataframes = []
for file in file_path:
    df = pd.read_csv(file)  # Use pd.read_excel() for Excel files, etc.
    dataframes.append(df)

# Concatenate all DataFrames into a single DataFrame
options_df = pd.concat(dataframes, ignore_index=True)


Columns (29) have mixed types. Specify dtype option on import or set low_memory=False.


Columns (8,9,10,11,12,15,17,18,20,21,23,24,25,26,27,28) have mixed types. Specify dtype option on import or set low_memory=False.



Data Cleaning and Transformation

In [143]:
pd.set_option('display.max_columns', 33)
options_df.columns = options_df.columns.str.replace('[\[\] ]', '', regex=True)
options_df['QUOTE_DATE'] = pd.to_datetime(options_df['QUOTE_DATE'])
options_df['EXPIRE_DATE'] = pd.to_datetime(options_df['EXPIRE_DATE'])
options_df = options_df.replace(' ',np.nan )
options_df[['C_VOLUME','C_ASK','C_BID']] = options_df[['C_VOLUME','C_ASK','C_BID']].astype(float)
options_df.dropna()
# Removing inaccurate data where days to expiry is 0
options_df = options_df[options_df['DTE'] != 0]

# Removing inaccurate data where option last trading price = 0 and trade volume is null 
options_df = options_df[(options_df['C_LAST'] != 0) & (options_df['P_LAST'] != 0)]


In [147]:
options_df
# Columns in dataframe: 
    # Time: (time in unix, quote time, quote date, quote hour of time, expire date, expire time in unix, day to expiration)
    # Greeks: Delta (Call and Put), Gamma, Vega, Theta, Rho
    # Other data (Call and Put):  implied volatility, trading volume, last traded price, size (open interest)
    # Strike: Strike price, strike distance (absolute/ percentage distance) between stock and strike price

Unnamed: 0,QUOTE_UNIXTIME,QUOTE_READTIME,QUOTE_DATE,QUOTE_TIME_HOURS,UNDERLYING_LAST,EXPIRE_DATE,EXPIRE_UNIX,DTE,C_DELTA,C_GAMMA,C_VEGA,C_THETA,C_RHO,C_IV,C_VOLUME,C_LAST,C_SIZE,C_BID,C_ASK,STRIKE,P_BID,P_ASK,P_SIZE,P_LAST,P_DELTA,P_GAMMA,P_VEGA,P_THETA,P_RHO,P_IV,P_VOLUME,STRIKE_DISTANCE,STRIKE_DISTANCE_PCT
0,1672779600,2023-01-03 16:00,2023-01-03,16.0,143.15,2023-01-06,1673038800,3.0,0.99562,0.00029,0.00165,-0.06241,0.00696,3.174680,2.0,76.9,1 x 1,78.15,78.35,65.0,0.0,0.01,0 x 43,0.02,-0.00056,0.0001,0.00035,-0.00402,0.0,2.468900,0.000000,78.2,0.546
1,1672779600,2023-01-03 16:00,2023-01-03,16.0,143.15,2023-01-06,1673038800,3.0,0.99658,0.00025,0.00138,-0.04172,0.00732,2.732770,0.0,92.25,1 x 1,73.15,73.3,70.0,0.0,0.01,0 x 43,0.04,-0.0005,0.00009,0.00026,-0.0046,0.0,2.247870,0.000000,73.2,0.511
2,1672779600,2023-01-03 16:00,2023-01-03,16.0,143.15,2023-01-06,1673038800,3.0,0.99863,0.00013,0.00059,-0.02118,0.00808,2.229220,0.0,69.26,1 x 1,68.1,68.3,75.0,0.0,0.01,0 x 43,0.01,-0.00028,0.00004,-0.00002,-0.00404,-0.00037,2.042420,0.000000,68.2,0.476
3,1672779600,2023-01-03 16:00,2023-01-03,16.0,143.15,2023-01-06,1673038800,3.0,1.0,0.0,0.0,-0.0102,0.00838,,0.0,64.21,35 x 35,61.2,64.4,80.0,0.0,0.01,0 x 43,0.01,-0.00107,0.00008,-0.00011,-0.00485,-0.00043,1.849050,0.000000,63.2,0.441
4,1672779600,2023-01-03 16:00,2023-01-03,16.0,143.15,2023-01-06,1673038800,3.0,1.0,0.0,0.0,-0.01147,0.00835,0.000050,0.0,55.5,37 x 35,57.15,59.2,85.0,0.0,0.01,0 x 31,0.02,-0.00025,0.00016,0.00074,-0.00465,0.0,1.667000,0.000000,58.2,0.406
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
468230,1701378000,2023-11-30 16:00,2023-11-30,16.0,467.70,2026-01-16,1768597200,778.0,0.29558,0.00123,2.32871,-0.07258,2.09956,0.411170,0.0,34.5,70 x 92,39.25,40.2,840.0,368.75,374.85,47 x 35,359.25,-1.0,0.0,0.0,0.0,0.0,,0.000000,372.3,0.796
468231,1701378000,2023-11-30 16:00,2023-11-30,16.0,467.70,2026-01-16,1768597200,778.0,0.2874,0.00115,2.30113,-0.07138,2.05323,0.410120,0.0,55.04,64 x 104,37.75,38.95,850.0,377.9,385.9,32 x 5,373.0,-1.0,0.0,0.0,0.0,0.0,,0.000000,382.3,0.817
468232,1701378000,2023-11-30 16:00,2023-11-30,16.0,467.70,2026-01-16,1768597200,778.0,0.28099,0.00119,2.27554,-0.07032,2.01066,0.409860,0.0,55.8,88 x 95,36.65,37.75,860.0,387.4,395.35,32 x 32,379.42,-1.0,0.0,0.0,0.0,0.0,,0.000000,392.3,0.839
468234,1701378000,2023-11-30 16:00,2023-11-30,16.0,467.70,2026-01-16,1768597200,778.0,0.26792,0.00114,2.22572,-0.06884,1.92965,0.410230,0.0,43.9,49 x 105,34.7,35.4,880.0,404.0,418.85,25 x 25,428.81,-1.0,0.0,0.0,0.0,0.0,,0.000000,412.3,0.882


In [189]:
# Data processing

# Getting a dataframe with only the parameters needed for the actively traded call options (for short maturities)
traded_options = options_df[(options_df['C_VOLUME'] > 500)&(options_df['DTE']<30)][['UNDERLYING_LAST','QUOTE_DATE','DTE','C_VOLUME','C_LAST','C_SIZE','C_BID','C_ASK','STRIKE']]

# Change DTE from days to year, and using C_BID and C_ASK to estimate market price (Bid-Ask spread)
traded_options['DTE'] = traded_options['DTE']/365
traded_options = traded_options.rename(columns={'DTE': 'MATURITIES'})
traded_options['MARKET_PRICE'] = (traded_options['C_ASK']+traded_options['C_BID'])/2

# Risk free interest rate estimation (using 1 month as we will be examining short term options) and interpolating for missing data
traded_options = pd.merge(traded_options, rates_df[['Date','1 Mo']], left_on = 'QUOTE_DATE', right_on = 'Date', how='outer')
traded_options = traded_options.rename(columns={'1 Mo': 'RISK_FREE_RATE'})
traded_options['RISK_FREE_RATE'] = traded_options['RISK_FREE_RATE']/100
traded_options['RISK_FREE_RATE'] = traded_options['RISK_FREE_RATE'].interpolate(method = 'nearest')

# Dropping unused columns and nulls
traded_options = traded_options.dropna()

traded_options


Unnamed: 0,UNDERLYING_LAST,QUOTE_DATE,MATURITIES,C_VOLUME,C_LAST,C_SIZE,C_BID,C_ASK,STRIKE,MARKET_PRICE,Date,RISK_FREE_RATE
0,143.15,2023-01-03,0.008219,814.0,4.75,48 x 113,4.70,4.80,141.0,4.750,2023-01-03,0.0417
1,143.15,2023-01-03,0.008219,933.0,4.2,423 x 26,4.10,4.20,142.0,4.150,2023-01-03,0.0417
2,143.15,2023-01-03,0.008219,1799.0,3.65,611 x 246,3.60,3.70,143.0,3.650,2023-01-03,0.0417
3,143.15,2023-01-03,0.008219,2277.0,3.19,729 x 75,3.10,3.20,144.0,3.150,2023-01-03,0.0417
4,143.15,2023-01-03,0.008219,4721.0,2.7,1 x 23,2.72,2.75,145.0,2.735,2023-01-03,0.0417
...,...,...,...,...,...,...,...,...,...,...,...,...
7763,467.70,2023-11-30,0.041096,827.0,0.46,92 x 56,0.47,0.49,540.0,0.480,2023-11-30,0.0556
7764,467.70,2023-11-30,0.041096,1035.0,0.36,58 x 111,0.33,0.35,550.0,0.340,2023-11-30,0.0556
7765,467.70,2023-11-30,0.060274,826.0,4.72,191 x 4,4.65,4.75,500.0,4.700,2023-11-30,0.0556
7766,467.70,2023-11-30,0.060274,631.0,0.38,56 x 93,0.37,0.40,565.0,0.385,2023-11-30,0.0556


In [None]:
# unused code for applying curve to interest rate
"""
# Mapping Nelson Siegel Svensson result function to date, then applying it to the list of maturities of the same date
rates_df = rates_df.reset_index()
function_mapping = dict(zip(rates_df['Date'], rates_df['curve_fit']))
traded_options = pd.merge(traded_options, rates_df[['Date','curve_fit']], left_on = 'QUOTE_DATE', right_on = 'Date', how='outer')

def apply_function(row):
    func = function_mapping.get(row['Date'])
    if func:
        return func(row['MATURITIES'])
    else:
        return np.nan 

traded_options['RISK_NEUTRAL_RATE'] = traded_options.apply(apply_function, axis=1)

# Interpolation to fill missing risk neutral rates
traded_options['RISK_NEUTRAL_RATE'] = traded_options['RISK_NEUTRAL_RATE'].interpolate(method = 'nearest')
traded_options = traded_options.drop(columns=['Date', 'curve_fit'])"""


# Calibration of data using a least squared error fit
To find the set of parameters that minimizes the square error:
sqErr(v0, kappa, theta, sigma, rho, lambd) = sum of (Market call price - heston model call price) squared 

Using Scipy (optimization) for minimizing sqErr:
- Problem 1: selecting suitable weight terms (for better calibration results: fitting to more important/reliable data) and penalty  (to avoid overfitting)

- Problem 2: given the problem (minimizing square err), what is the most suitable optimization method to use
    - non linear problem with non linear constraints -> 

- Problem 3: selecting suitable initial parameters and bounds (for convergence speed, avoiding local minima, good quality result)

The result for the parameters should be at a reasonable value, and have a low error when comparing model and real price



In [190]:
# Variables from options data
S0, K, r, tau, price = traded_options[['UNDERLYING_LAST', 'STRIKE', 'RISK_FREE_RATE', 'MATURITIES','MARKET_PRICE']].astype(float).to_numpy().T

# Parameters （Setting initial guess and upper lower bound)
params = {
    "v0": {"x0": 0.04, "lbub": [1e-3, 0.3]},
    "kappa": {"x0": 1.5, "lbub": [1e-2, 5]},
    "theta": {"x0": 0.04, "lbub": [1e-3, 0.2]},
    "sigma": {"x0": 0.3, "lbub": [1e-2, 2]},
    "rho": {"x0": -0.5, "lbub": [-1, 1]},
    "lambd": {"x0": 0.1, "lbub": [-1, 1]}
}

inverseMaturitiesSum = (1/tau).sum()

x0 = [param["x0"] for key, param in params.items()]
bnds = [param["lbub"] for key, param in params.items()]

In [191]:
def sqErr (x):
    v0, kappa, theta, sigma, rho, lambd = [param for param in x]
    
    # weight factor using inverse weighted average for maturities
    err = np.sum(1/tau/inverseMaturitiesSum*(price - heston_call_price(S0, K, v0, tau, r, sigma, rho, kappa, theta, lambd))**2)
    # Penalty term: distance to initial parameter vector
    pen = np.sum([(param-initial)**2 for param, initial in zip(x,x0)])
    
    return err + pen


In [192]:
result = minimize(sqErr, x0, tol = 1e-3, method='SLSQP', options={'maxiter': 1e4 }, bounds=bnds)
result

 message: Optimization terminated successfully
 success: True
  status: 0
     fun: 3.761969135962585
       x: [ 2.212e-01  1.498e+00  3.885e-02  2.969e-01 -4.967e-01
            9.924e-02]
     nit: 6
     jac: [ 8.872e-02  2.394e-02 -1.955e-02 -6.670e-03  9.544e-03
            2.597e-02]
    nfev: 43
    njev: 6

In [193]:
v0, kappa, theta, sigma, rho, lambd = [param for param in result.x]
v0, kappa, theta, sigma, rho, lambd

(np.float64(0.2211637508434337),
 np.float64(1.497864895949708),
 np.float64(0.03885371267404367),
 np.float64(0.2968626090380853),
 np.float64(-0.4966888686355568),
 np.float64(0.09923813948158276))

In [194]:
heston_prices = heston_call_price(S0, K, v0, tau, r, sigma, rho, kappa, theta, lambd)
traded_options['HESTON_PRICE'] = heston_prices
traded_options

Unnamed: 0,UNDERLYING_LAST,QUOTE_DATE,MATURITIES,C_VOLUME,C_LAST,C_SIZE,C_BID,C_ASK,STRIKE,MARKET_PRICE,Date,RISK_FREE_RATE,HESTON_PRICE
0,143.15,2023-01-03,0.008219,814.0,4.75,48 x 113,4.70,4.80,141.0,4.750,2023-01-03,0.0417,3.679038
1,143.15,2023-01-03,0.008219,933.0,4.2,423 x 26,4.10,4.20,142.0,4.150,2023-01-03,0.0417,3.071347
2,143.15,2023-01-03,0.008219,1799.0,3.65,611 x 246,3.60,3.70,143.0,3.650,2023-01-03,0.0417,2.528176
3,143.15,2023-01-03,0.008219,2277.0,3.19,729 x 75,3.10,3.20,144.0,3.150,2023-01-03,0.0417,2.050404
4,143.15,2023-01-03,0.008219,4721.0,2.7,1 x 23,2.72,2.75,145.0,2.735,2023-01-03,0.0417,1.637151
...,...,...,...,...,...,...,...,...,...,...,...,...,...
7763,467.70,2023-11-30,0.041096,827.0,0.46,92 x 56,0.47,0.49,540.0,0.480,2023-11-30,0.0556,0.800613
7764,467.70,2023-11-30,0.041096,1035.0,0.36,58 x 111,0.33,0.35,550.0,0.340,2023-11-30,0.0556,0.306055
7765,467.70,2023-11-30,0.060274,826.0,4.72,191 x 4,4.65,4.75,500.0,4.700,2023-11-30,0.0556,9.340522
7766,467.70,2023-11-30,0.060274,631.0,0.38,56 x 93,0.37,0.40,565.0,0.385,2023-11-30,0.0556,0.420568


In [183]:
# Visualization
fig = go.Figure(data = [go.Mesh3d(z=traded_options['MARKET_PRICE'], x=traded_options['MATURITIES'], y=traded_options['STRIKE'], colorscale='Viridis', opacity=0.55)])

# Add scatter plot
fig.add_trace(go.Scatter3d(z=traded_options['HESTON_PRICE'], x=traded_options['MATURITIES'], y=traded_options['STRIKE'], mode='markers', marker=dict(size=3, color='red', opacity=0.8)))

# Update layout
fig.update_layout(title='3D Surface Plot with Scatter Points', scene=dict(xaxis_title='Maturities', yaxis_title='Strike', zaxis_title='Price'))

# Show the figure
fig.show()

The results for parameters from optimization seems to be at a reasonable range, and the heston model price prediction overall matches decently well with the market price. It may be normal that the model doesn't fit certain points at the lower and upper end of strike prices due to low liquidity of these options, and the risk of overfitting the model. 

Still, there are many features that can be improved/ added in the future:
- Apply Jump diffusion to Heston model implementation for better calibration accuracy and speed
- Time dependant parameters if considering maturities with large time intervals
- C++ for speed
- Better calibration method for the dataset


# Model Validation using Monte Carlo methods

In [41]:
def heston_monte_carlo_prices(S0, v0, tau, r, K, sigma, rho, kappa, theta, paths, steps):
    option_values = []
    # Loop through each option (perform a monte carlo simulation for each option)
    for S, r, K, tau in zip(S0, r, K, tau):
        
        dt = tau / steps
        # Arrays to store the final asset prices
        final_prices = np.zeros(paths)

        # Loop for simulating paths 
        for i in range(paths):
            S_t = S
            v_t = v0
            for j in range(steps):
                # Generate correlated wiener processes for price and volatility
                Z1 = np.random.normal(0, 1)
                Z2 = rho * Z1 + np.sqrt(1 - rho**2) * np.random.normal(0, 1)
                
                # Applying heston discrete SDE 

                S_t = S_t*(np.exp((r- 0.5*v_t) * dt + np.sqrt(v_t) * Z1 * np.sqrt(dt)))
                v_t = np.abs(v_t + kappa * (theta - v_t) * dt + sigma * np.sqrt(v_t) * Z2 * np.sqrt(dt))
                
            final_prices[i] = S_t
            
        # Calculating option value by discounting expected payoff to present
        option_value = np.exp(-r * tau) * np.mean(np.maximum(final_prices - K, 0))
        option_values.append(option_value)
            
    return option_values

In [45]:
option_values = heston_monte_carlo_prices(S0, v0, tau, r, K, sigma, rho, kappa, theta, 500, 252)

In [178]:
traded_options['MONTE_CARLO_PRICE'] = option_values
traded_options

ValueError: Length of values (701) does not match length of index (674)

From the monte carlo simulation using the calibrated parameters, the results are close to the market price, which suggests that our calibration is done correctly and is at a good quality. Next step would be testing its performance (forward testing)

# Heston Model performance measure
Testing accuracy of calibrated parameters by comparing Black-Sholes Model and Heston Model prediction results for market price of options using performance metric RMSE.

In [185]:
# Using code above to clean and process options data
options_df_dec = pd.read_csv('/Users/wongmarco/Downloads/nvda_eod_2023q4-jf5cdq/nvda_eod_202312.txt')
options_df_dec.columns = options_df_dec.columns.str.replace('[\[\] ]', '', regex=True)
options_df_dec = options_df_dec.replace(' ',np.nan )
options_df_dec[['C_VOLUME','C_ASK','C_BID']] = options_df_dec[['C_VOLUME','C_ASK','C_BID']].astype(float)
options_df_dec.dropna()
options_df_dec = options_df_dec[options_df_dec['DTE'] != 0]
options_df_dec = options_df_dec[(options_df_dec['C_LAST'] != 0) & (options_df_dec['P_LAST'] != 0)]

traded_options_dec = options_df_dec[(options_df_dec['C_VOLUME'] > 500)&(options_df_dec['DTE']<30)][['UNDERLYING_LAST','DTE','C_BID','C_ASK','STRIKE']]
traded_options_dec['DTE'] = traded_options_dec['DTE']/365
traded_options_dec = traded_options_dec.rename(columns={'DTE': 'MATURITIES'})
traded_options_dec['MARKET_PRICE'] = (traded_options_dec['C_ASK']+traded_options_dec['C_BID'])/2
traded_options_dec['RISK_NEUTRAL_RATE'] = 0.055

In [208]:
from scipy.stats import norm
S0, K, r, tau, price = traded_options_dec[['UNDERLYING_LAST', 'STRIKE','RISK_NEUTRAL_RATE', 'MATURITIES','MARKET_PRICE']].to_numpy().T

def black_scholes(S, K, T, r, sigma):
    
    # Calculate d1 and d2
    d1 = (np.log(S/K) + (r + sigma**2/2)*T) / (sigma*np.sqrt(T))
    d2 = d1 - sigma * np.sqrt(T)
    price= S * norm.cdf(d1) - K * np.exp(-r*T)* norm.cdf(d2)
    
    return price

In [196]:
traded_options_dec['HESTON_PRICE'] = heston_call_price(S0, K, v0, tau, r, sigma, rho, kappa, theta, lambd)
traded_options_dec['BLACK-SHOLES_PRICE'] = black_scholes(S0,K,tau,r,sigma)
traded_options_dec

Unnamed: 0,UNDERLYING_LAST,MATURITIES,C_BID,C_ASK,STRIKE,MARKET_PRICE,RISK_NEUTRAL_RATE,HESTON_PRICE,BLACK-SHOLES_PRICE
173,467.65,0.019178,12.65,12.80,460.0,12.725,0.055,16.564650,12.352294
174,467.65,0.019178,9.60,9.80,465.0,9.700,0.055,13.707022,9.316115
175,467.65,0.019178,7.10,7.20,470.0,7.150,0.055,11.177497,6.792879
176,467.65,0.019178,6.00,6.10,472.5,6.050,0.055,10.035675,5.723820
177,467.65,0.019178,5.05,5.10,475.0,5.075,0.055,8.974659,4.779013
...,...,...,...,...,...,...,...,...,...
50138,497.05,0.057534,13.10,13.20,500.0,13.150,0.055,21.316864,13.461693
50141,497.05,0.057534,9.05,9.25,510.0,9.150,0.055,16.819599,9.318541
50143,497.05,0.057534,6.20,6.35,520.0,6.275,0.055,13.016548,6.199438
50145,497.05,0.057534,4.00,4.15,530.0,4.075,0.055,9.863416,3.961258


In [197]:
print(np.sqrt(np.mean((traded_options_dec['MARKET_PRICE'] - traded_options_dec['HESTON_PRICE'])**2)))
print(np.sqrt(np.mean((traded_options_dec['MARKET_PRICE'] - traded_options_dec['BLACK-SHOLES_PRICE'])**2)))

3.0353667856160005
0.8913760840744372
