In [1]:
from bs4 import BeautifulSoup as bs

import warnings
warnings.filterwarnings('ignore')

import requests
import pandas as pd
import numpy as np
import datetime as dt
import os
from scipy.stats import norm as norm

os.chdir('C:\\Users\\Fang\\Desktop\\Python Trading\\Trading\\Trading\\Modules\\DataCollection')
from yahoo_query import *
pd.options.display.float_format = '{:,.6f}'.format
%matplotlib inline
os.chdir('D:\Options Data\CBOE Manual Downloads')

In [14]:
filename = 'quotedata.dat'

vix = yahoo_query('^VIX',dt.datetime.today())
vix.minute_query()
vix = vix.minute_prices.dropna()

options_chain = pd.read_csv(filename, sep=',', header=0, skiprows=2)

i = 0
for line in open(filename,'r'):
    curr_line = [x.strip() for x in line.split(',')]
    if i == 0:
        curr_spx = float(curr_line[1])
    
    if i == 1:
        curr_time = curr_line[0].replace('@','').replace('  ',' ').replace(' ET','')
        curr_time = dt.datetime.strptime(curr_time, '%b %d %Y %H:%M')
    if i == 1:
        break
    i += 1
    
options_chain['Expiration Date'] = pd.to_datetime(options_chain['Expiration Date'])

universal_columns = ['Expiration Date','Strike']
call_columns = list(filter(lambda x: x in universal_columns or '1' not in x, options_chain.columns.tolist()))
put_columns = list(filter(lambda x: x in universal_columns or '1' in x, options_chain.columns.tolist()))

calls = options_chain[call_columns]
del calls['Calls'], calls['Puts']

a = (calls['IV']**2)/2
b = -calls['IV']*norm.ppf(calls['Delta'])
c = np.log(curr_spx/calls['Strike'])

calls['time_remaining'] = ((-b + np.sqrt(b**2 - 4*a*c))/(2*a))**2

puts = options_chain[put_columns]
puts.columns = [x.replace('.1','') for x in puts.columns.tolist()]

commissions = 0.0266

def create_spreads(spreads, contract_type = 'puts', net_delta_threshold = 0.275):

    spreads['Net Delta'] = abs(spreads['Short Delta'] - spreads['Long Delta'])
    spreads = spreads[spreads['Net Delta'] <= net_delta_threshold]
    spreads['Credit'] = spreads['Short Bid'] - spreads['Long Ask'] - commissions
    spreads['Required_Contracts'] = round(0.5/spreads['Net Delta'])
    spreads['Total Premo'] = spreads.Credit*100*spreads.Required_Contracts
    
    if contract_type == 'puts':
        spreads['Max Loss'] = (spreads['Long Strike'] - spreads['Short Strike'])*100*spreads.Required_Contracts + spreads['Total Premo']
        spreads['Break Even'] = spreads['Short Strike'] - spreads.Credit

        spreads['SPX Equiv Lower Loss'] = (spreads['Long Strike'] - curr_spx)*100
        spreads['SPX Equiv Break Even Loss'] = (spreads['Break Even'] - curr_spx)*100
        spreads['SPX Equiv Gain Level'] = curr_spx + spreads['Total Premo']/100

        spreads['Prob of Better Than ES'] = norm.cdf(spreads['SPX Equiv Gain Level']/curr_spx - 1,0,spreads['Weekly IV']) - norm.cdf(spreads['Break Even']/curr_spx - 1,0,spreads['Weekly IV']) + norm.cdf(spreads['Long Strike']/curr_spx - 1,0,spreads['Weekly IV'])

    if contract_type == 'calls':
        spreads['Max Loss'] = (spreads['Short Strike'] - spreads['Long Strike'])*100*spreads.Required_Contracts + spreads['Total Premo']
        spreads['Break Even'] = spreads['Short Strike'] + spreads.Credit

        spreads['SPX Equiv Lower Loss'] = (curr_spx - spreads['Long Strike'])*100
        spreads['SPX Equiv Break Even Loss'] = -(spreads['Break Even'] - curr_spx)*100
        spreads['SPX Equiv Gain Level'] = curr_spx - spreads['Total Premo']/100

        spreads['Prob of Better Than ES'] = norm.cdf(spreads['Break Even']/curr_spx - 1,0,spreads['Weekly IV']) - norm.cdf(spreads['SPX Equiv Gain Level']/curr_spx - 1,0,spreads['Weekly IV']) + 1 - norm.cdf(spreads['Long Strike']/curr_spx - 1,0,spreads['Weekly IV'])
    
    spreads['EV'] = np.nan
    spreads['Win Prob'] = np.nan
    stepsize = 0.05
    
    for idx, row in spreads.iterrows():
        
        if contract_type == 'puts':
            ev_df = pd.DataFrame({'SPX': np.arange(row['Long Strike'], row['Short Strike'] + stepsize, stepsize)})
            ev_df = ev_df[(ev_df['SPX'] < row['Short Strike'] + stepsize)]
            ev_df['PnL'] = ev_df['SPX'] - row['Short Strike'] + row.Credit
            
        if contract_type == 'calls':
            ev_df = pd.DataFrame({'SPX': np.arange(row['Short Strike'], row['Long Strike'] + stepsize, stepsize)})
            ev_df = ev_df[(ev_df['SPX'] < row['Long Strike'] + stepsize)]
            ev_df['PnL'] = row['Short Strike'] - ev_df['SPX'] + row.Credit
    
        ev_df['Prob'] = norm.cdf(ev_df['SPX']/curr_spx - 1,0,row['Weekly IV'])
        lb = ev_df.loc[0,'Prob']
        ub = ev_df.loc[len(ev_df) - 1,'Prob']

        ev_df['Prob'] = ev_df['Prob'].diff()
        ev_df.loc[0,'Prob'] = lb
        ev_df.loc[len(ev_df) - 1, 'Prob'] = 1 - ub

        ev_df['EV'] = ev_df.Prob*ev_df.PnL

        total_ev = sum(ev_df['EV'])
        win_prob = sum(ev_df[ev_df['PnL'] >= 0]['Prob'])

        spreads.loc[idx, 'EV'] = total_ev
        spreads.loc[idx, 'Win Prob'] = win_prob

    
    return spreads

In [25]:
day_diff = 8

bid_threshold = 0.5

net_delta_threshold = 0.5

weekly_puts = puts[(puts['Expiration Date'] - dt.datetime.today()).dt.days == day_diff]
weekly_puts = weekly_puts[(weekly_puts.Strike <= curr_spx) & 
                          (weekly_puts['Bid'] >= bid_threshold)].sort_values('Strike', ascending = False)
weekly_puts = weekly_puts.drop_duplicates(subset = ['Strike'], keep = 'last').reset_index(drop = True)

weekly_calls = calls[(calls['Expiration Date'] - dt.datetime.today()).dt.days == day_diff]
weekly_calls = weekly_calls[(weekly_calls.Strike >= curr_spx) & 
                            (weekly_calls['Bid'] >= bid_threshold)].sort_values('Strike', ascending = True)
weekly_calls = weekly_calls.drop_duplicates(subset = ['Strike'], keep = 'last').reset_index(drop = True)

time_remaining = weekly_calls.time_remaining.mean()

put_spreads_list = []
for idx, row in weekly_puts.iterrows():
    put_spreads = weekly_puts[weekly_puts.Strike < row.Strike][['Expiration Date','Strike','Ask','Delta']]
    if len(put_spreads) < 3:
        continue
    else:
        put_spreads.columns = ['Expiration Date','Long Strike','Long Ask', 'Long Delta']
        put_spreads['Short Strike'] = row.Strike
        put_spreads['Short Bid'] = row.Bid
        put_spreads['Short Delta'] = row.Delta
        put_spreads['Weekly IV'] = (vix.reset_index().loc[len(vix) - 1, '^VIX_close']/100)*np.sqrt(time_remaining)
    put_spreads_list.append(create_spreads(put_spreads, 'puts', net_delta_threshold))
    
put_spreads = pd.concat(put_spreads_list, axis = 0).dropna().reset_index(drop = True)
put_spreads = put_spreads[(put_spreads['Total Premo'] > weekly_puts.loc[0,'Bid']*100) & 
                          (put_spreads['Prob of Better Than ES'] > 0.5) & 
                          (put_spreads['Max Loss'] > -5000)].reset_index(drop = True)
put_spreads['Max Loss Differences'] = put_spreads['Max Loss'] - put_spreads['SPX Equiv Lower Loss']

put_spreads = put_spreads.sort_values('EV', ascending = False).reset_index(drop = True)
put_spreads[['Expiration Date','Long Strike','Short Strike','Required_Contracts','Credit','Total Premo','Max Loss','EV','Win Prob']]

Unnamed: 0,Expiration Date,Long Strike,Short Strike,Required_Contracts,Credit,Total Premo,Max Loss,EV,Win Prob


In [26]:
call_spreads_list = []
for idx, row in weekly_calls.iterrows():
    call_spreads = weekly_calls[weekly_calls.Strike > row.Strike][['Expiration Date','Strike','Ask','Delta']]
    if len(call_spreads) < 3:
        continue
    else:
        call_spreads.columns = ['Expiration Date','Long Strike','Long Ask', 'Long Delta']
        call_spreads['Short Strike'] = row.Strike
        call_spreads['Short Bid'] = row.Bid
        call_spreads['Short Delta'] = row.Delta
        call_spreads['Weekly IV'] = (vix.reset_index().loc[len(vix) - 1, '^VIX_close']/100)*np.sqrt(time_remaining)
    call_spreads_list.append(create_spreads(call_spreads, 'calls', net_delta_threshold))

call_spreads = pd.concat(call_spreads_list, axis = 0).dropna().reset_index(drop = True)
call_spreads = call_spreads[(call_spreads['Total Premo'] > weekly_calls.loc[0,'Bid']*100) & 
                            (call_spreads['Prob of Better Than ES'] > 0.5) &
                            (call_spreads['Max Loss'] > -5000)].reset_index(drop = True)
call_spreads['Max Loss Differences'] = call_spreads['Max Loss'] - call_spreads['SPX Equiv Lower Loss']

call_spreads = call_spreads.sort_values('EV', ascending = False).reset_index(drop = True)
call_spreads[['Expiration Date','Long Strike','Short Strike','Required_Contracts','Credit','Total Premo','Max Loss','EV','Win Prob']]

Unnamed: 0,Expiration Date,Long Strike,Short Strike,Required_Contracts,Credit,Total Premo,Max Loss,EV,Win Prob
0,2019-02-20,2740.0,2710.0,2.0,12.4734,2494.68,-3505.32,0.283464,0.578884
1,2019-02-20,2735.0,2710.0,3.0,10.7734,3232.02,-4267.98,0.240975,0.568396
2,2019-02-20,2745.0,2710.0,2.0,13.8734,2774.68,-4225.32,0.166086,0.58748
3,2019-02-20,2730.0,2710.0,3.0,8.8734,2662.02,-3337.98,0.143488,0.556616
4,2019-02-20,2740.0,2715.0,3.0,9.8734,2962.02,-4537.98,0.098882,0.593595
5,2019-02-20,2725.0,2710.0,4.0,6.8734,2749.36,-3250.64,0.095115,0.544163
6,2019-02-20,2750.0,2710.0,2.0,15.1734,3034.68,-4965.32,0.08322,0.595425
7,2019-02-20,2735.0,2715.0,3.0,8.1734,2452.02,-3547.98,0.056369,0.583187
8,2019-02-20,2745.0,2715.0,2.0,11.2734,2254.68,-3745.32,-0.01847,0.602117
9,2019-02-20,2730.0,2715.0,4.0,6.2734,2509.36,-3490.64,-0.041137,0.571486


In [5]:
stepsize = 0.05

weekly_puts['EV'] = np.nan
weekly_puts['Win Prob'] = np.nan

for idx, row in weekly_puts.iterrows():
    ev_df = pd.DataFrame({'SPX': np.arange(0, row['Strike'] + stepsize, stepsize)})
    ev_df = ev_df[(ev_df['SPX'] < row['Strike'] + stepsize)]
    ev_df['PnL'] = (row['Strike'] - ev_df['SPX'] - row.Ask)*100

    ev_df['Prob'] = norm.cdf(ev_df['SPX']/curr_spx - 1,0,
                             (vix.reset_index().loc[len(vix) - 1, '^VIX_close']/100)*np.sqrt(time_remaining))
    lb = ev_df.loc[0,'Prob']
    ub = ev_df.loc[len(ev_df) - 1,'Prob']

    ev_df['Prob'] = ev_df['Prob'].diff()
    ev_df.loc[0,'Prob'] = lb
    ev_df.loc[len(ev_df) - 1, 'Prob'] = 1 - ub

    ev_df['EV'] = ev_df.Prob*ev_df.PnL

    total_ev = sum(ev_df['EV'])
    win_prob = sum(ev_df[ev_df['PnL'] >= 0]['Prob'])
    
    weekly_puts.loc[idx, 'EV'] = total_ev
    weekly_puts.loc[idx, 'Win Prob'] = win_prob
    
weekly_puts

Unnamed: 0,Expiration Date,Strike,Last Sale,Net,Bid,Ask,Vol,IV,Delta,Gamma,Open Int,EV,Win Prob
0,2019-02-13,2705.0,11.4,-6.3,11.2,11.5,545,0.1508,-0.4699,0.0129,425,103.433126,0.345426
1,2019-02-13,2700.0,9.2,-6.1,9.3,9.6,1996,0.1547,-0.4082,0.0123,1939,69.603657,0.31177
2,2019-02-13,2695.0,7.69,-5.46,7.6,7.9,208,0.1588,-0.3516,0.0114,995,44.600009,0.278126
3,2019-02-13,2690.0,6.4,-4.85,6.3,6.5,267,0.1622,-0.2998,0.0105,945,17.267883,0.244034
4,2019-02-13,2685.0,5.18,-4.52,5.1,5.4,391,0.1651,-0.253,0.0095,659,-14.079967,0.208918
5,2019-02-13,2680.0,4.1,-4.2,4.2,4.4,291,0.1705,-0.215,0.0084,1760,-31.563684,0.176585
6,2019-02-13,2675.0,3.52,-3.63,3.4,3.6,1458,0.1743,-0.1799,0.0074,763,-47.590233,0.146252
7,2019-02-13,2670.0,3.05,-3.0,2.8,2.95,237,0.1784,-0.151,0.0064,594,-59.746068,0.118748
8,2019-02-13,2665.0,2.35,-2.85,2.3,2.4,187,0.182,-0.1251,0.0055,786,-65.663559,0.094617
9,2019-02-13,2660.0,1.91,-2.49,1.85,1.95,405,0.1859,-0.1041,0.0048,4273,-67.907717,0.073894


In [6]:
weekly_calls['EV'] = np.nan
weekly_calls['Win Prob'] = np.nan

for idx, row in weekly_calls.iterrows():
    ev_df = pd.DataFrame({'SPX': np.arange(row['Strike'], curr_spx*1.20, stepsize)})
    ev_df['PnL'] = (ev_df['SPX'] - row['Strike'] - row.Ask)*100

    ev_df['Prob'] = norm.cdf(ev_df['SPX']/curr_spx - 1,0,
                             (vix.reset_index().loc[len(vix) - 1, '^VIX_close']/100)*np.sqrt(time_remaining))
    lb = ev_df.loc[0,'Prob']
    ub = ev_df.loc[len(ev_df) - 1,'Prob']

    ev_df['Prob'] = ev_df['Prob'].diff()
    ev_df.loc[0,'Prob'] = lb
    ev_df.loc[len(ev_df) - 1, 'Prob'] = 1 - ub

    ev_df['EV'] = ev_df.Prob*ev_df.PnL

    total_ev = sum(ev_df['EV'])
    win_prob = sum(ev_df[ev_df['PnL'] >= 0]['Prob'])
    
    weekly_calls.loc[idx, 'EV'] = total_ev
    weekly_calls.loc[idx, 'Win Prob'] = win_prob
    
weekly_calls

Unnamed: 0,Expiration Date,Last Sale,Net,Bid,Ask,Vol,IV,Delta,Gamma,Open Int,Strike,time_remaining,EV,Win Prob
0,2019-02-13,11.0,1.7,10.4,10.7,3950,0.1461,0.4641,0.0133,368,2710.0,0.006449,133.34956,0.342705
1,2019-02-13,8.25,0.9,8.1,8.4,489,0.1446,0.3975,0.013,308,2715.0,0.005986,145.762909,0.313864
2,2019-02-13,6.0,0.35,6.1,6.4,380,0.1413,0.3306,0.0125,677,2720.0,0.005885,156.798891,0.283108
3,2019-02-13,4.6,0.3,4.5,4.7,559,0.1389,0.2671,0.0116,3859,2725.0,0.005825,165.174975,0.251044
4,2019-02-13,3.3,0.15,3.2,3.4,845,0.1367,0.2097,0.0103,1021,2730.0,0.005825,159.103508,0.217515
5,2019-02-13,2.2,-0.075,2.2,2.35,550,0.1346,0.1582,0.0088,377,2735.0,0.005785,151.399245,0.18475
6,2019-02-13,1.6,0.025,1.55,1.6,1348,0.134,0.1177,0.0072,871,2740.0,0.005776,134.603475,0.153136
7,2019-02-13,1.0,-0.05,1.0,1.1,297,0.1332,0.0845,0.0057,489,2745.0,0.005763,111.113163,0.123813
8,2019-02-13,0.7,-0.025,0.6,0.75,1817,0.1341,0.0614,0.0044,2407,2750.0,0.005776,88.304085,0.097897


In [None]:
stepsize = 0.01

curr_spx = 2775.54
curr_vix = 14.89/100
t = 216/365.25
curr_iv = curr_vix*np.sqrt(t)

ev_df = pd.DataFrame({'SPX': np.arange(0, 3200 + stepsize, stepsize)})

short_call_strike = 3050
long_call_strike = 3150
long_put_strike = 1825

credit = 6.20

ev_df['Put_PnL'] = long_put_strike - ev_df.SPX
ev_df.loc[ev_df['Put_PnL']<0,'Put_PnL'] = 0

ev_df['Long_Call_PnL'] = ev_df.SPX - long_call_strike
ev_df.loc[ev_df['Long_Call_PnL']<0,'Long_Call_PnL'] = 0

ev_df['Short_Call_PnL'] = ev_df.SPX - short_call_strike
ev_df.loc[ev_df['Short_Call_PnL']<0,'Short_Call_PnL'] = 0

ev_df['PnL'] = ev_df.Put_PnL + ev_df.Long_Call_PnL - ev_df.Short_Call_PnL + credit

ev_df['Prob'] = norm.cdf(ev_df['SPX']/curr_spx - 1,0, curr_iv)
lb = ev_df.loc[0,'Prob']
ub = ev_df.loc[len(ev_df) - 1,'Prob']
ev_df['Prob'] = ev_df['Prob'].diff()
ev_df.loc[0,'Prob'] = lb
ev_df.loc[len(ev_df) - 1, 'Prob'] = 1 - ub
ev_df['EV'] = ev_df.Prob*ev_df.PnL

total_ev = sum(ev_df['EV'])
win_prob = sum(ev_df[ev_df['PnL'] >= 0]['Prob'])

conditional_win = ev_df[ev_df['PnL'] >= 0]
conditional_win['Cond_Prob'] = conditional_win.Prob/sum(conditional_win.Prob)


conditional_loss = ev_df[ev_df['PnL'] < 0]
conditional_loss['Cond_Prob'] = conditional_loss.Prob/sum(conditional_loss.Prob)


print(total_ev)
print(win_prob)
print(sum(conditional_win.Cond_Prob*conditional_win.PnL))
print(sum(conditional_loss.Cond_Prob*conditional_loss.PnL))