In [1]:
import sqlite3
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from scipy import stats
from statsmodels.tsa.stattools import adfuller

# Step 1: Open the SQLite database file.
# NOTE: sqlite3.connect() creates an empty database file when the path does not
# exist; in that case the reads below fail because the tables are missing.
conn = sqlite3.connect('1_financial_data.db')

try:
    # Step 2: Load each table into its own pandas DataFrame.

    # Contents of the 'equities_data' table
    equities_data = pd.read_sql('SELECT * FROM equities_data', conn)

    # Contents of the 'volume_threshold_options_data' table
    volume_threshold_options_data = pd.read_sql('SELECT * FROM volume_threshold_options_data', conn)

    # Contents of the 'merged_data' table
    merged_data = pd.read_sql('SELECT * FROM merged_data', conn)
finally:
    # Step 3: Always release the connection, even if one of the reads raised,
    # so a failed cell does not leave an open handle in the kernel.
    conn.close()


# #INPUT DATA FROM 1_clean_download_data.ipynb

# # Define the dates
# start_year = 2020
# start_month = 1
# start_day = 1

# end_year = 2023
# end_month = 12
# end_day = 30

In [6]:
# Optional sanity check: heading followed by the first three equities rows.
print("Equities Data:", equities_data.head(3), sep="\n")

Equities Data:
   permno     cusip                 date    bid    ask       vol   shrout  \
0   10200  75991610  2020-01-02 00:00:00  93.72  93.78  313953.0  52078.0   
1   10200  75991610  2020-01-03 00:00:00  92.74  92.78  246742.0  52078.0   
2   10200  75991610  2020-01-06 00:00:00  93.89  93.90  380649.0  52078.0   

      prc      mktcap  
0  93.780  4883874.84  
1  92.740  4829713.72  
2  93.895  4889863.81  


In [7]:
# Heading (preceded by a blank line) followed by the first three option rows.
print("\nVolume Threshold Options Data:", volume_threshold_options_data.head(3), sep="\n")


Volume Threshold Options Data:
                  date ticker      exdate cp_flag  strike_price  \
0  2020-01-02 00:00:00   ABEO  2020-01-17       C        2500.0   
1  2020-01-02 00:00:00   ABEO  2020-01-17       P        2500.0   
2  2020-01-02 00:00:00   ABEO  2020-01-17       C        5000.0   

   strike_price_actual  best_bid  best_offer  volume  open_interest  \
0                 0.25      0.50        1.00    87.0         1661.0   
1                 0.25      0.05        0.15    16.0          760.0   
2                 0.50      0.05        0.10    40.0         2994.0   

   impl_volatility     delta     gamma      vega     theta  permno  
0         1.076193  0.895771  0.258311  0.117540 -1.576614   87656  
1         1.509266 -0.165591  0.253322  0.161895 -2.962448   87656  
2         1.773509  0.146708  0.199077  0.149495 -3.232589   87656  


In [8]:
# Heading (preceded by a blank line) followed by the first three merged rows.
print("\nMerged Data:", merged_data.head(3), sep="\n")


Merged Data:
   permno     cusip                 date    bid    ask       vol   shrout  \
0   10200  75991610  2020-01-02 00:00:00  93.72  93.78  313953.0  52078.0   
1   10200  75991610  2020-01-02 00:00:00  93.72  93.78  313953.0  52078.0   
2   10200  75991610  2020-01-02 00:00:00  93.72  93.78  313953.0  52078.0   

     prc      mktcap ticker  ... strike_price_actual best_bid  best_offer  \
0  93.78  4883874.84   RGEN  ...                 9.5     1.40        1.75   
1  93.78  4883874.84   RGEN  ...                 7.5     0.25        0.40   
2  93.78  4883874.84   RGEN  ...                 8.0    13.00       14.80   

   volume  open_interest  impl_volatility     delta     gamma      vega  \
0     2.0           98.0         0.310298  0.396742  0.067700  7.253972   
1    10.0          528.0         0.390420 -0.053629  0.008045  3.776815   
2     2.0          377.0         0.270031  0.953724  0.012104  3.225182   

       theta  
0 -22.242290  
1  -5.439961  
2  -2.681417  

[3 row