In [1]:
# Import Libraries
import os
import pickle

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import MinMaxScaler
from tensorflow.keras.layers import LSTM, Dense, Dropout
from tensorflow.keras.models import Sequential

# Read the raw IPO records from disk
dataset_path = "../data/IPO_dataset.csv"  # Adjust path as needed
data = pd.read_csv(dataset_path)

# Model inputs (exactly these 9 columns) and the column to predict
features = [
    'issue_price',
    'issue_size',
    'hni_subscription',
    'nii_subscription',
    'rii_subscription',
    'revenue_2',
    'revenue_1',
    'eps_2',
    'eps_1',
]
target = 'listing_gain'

# Keep only the rows where every feature and the target are present
data = data.dropna(subset=[*features, target])

# Min-max scale the feature columns only; the target stays in its original units.
# NOTE(review): the scaler is fit on every remaining row, i.e. before the
# train/test split made further down this script -- confirm that is intended.
scaler = MinMaxScaler()
X_scaled = scaler.fit_transform(data[features])
y = data[target].values

# Append the unscaled target as the last column so that windows can later be
# cut from one 2-D array (features first, target last)
data_scaled = np.column_stack((X_scaled, y))

# Create Sequences for LSTM
def create_sequences(data, time_steps=10):
    """Cut a 2-D array into overlapping windows for a sequence model.

    Every column except the last is treated as a feature and the last column
    as the target. Window ``i`` holds the feature rows
    ``i .. i + time_steps - 1`` and is paired with the target value found in
    row ``i + time_steps``.

    Args:
        data: 2-D array-like of shape ``(n_rows, n_features + 1)``.
        time_steps: Number of consecutive rows per window; must not be
            negative.

    Returns:
        A tuple ``(X, y)`` of NumPy arrays where ``X`` has shape
        ``(n_windows, time_steps, n_features)``, ``y`` has shape
        ``(n_windows,)`` and ``n_windows = max(n_rows - time_steps, 0)``.

    Raises:
        ValueError: If ``time_steps`` is negative.
    """
    if time_steps < 0:
        raise ValueError(f"time_steps must be non-negative, got {time_steps}")

    # Accept any array-like (e.g. a list of rows); an ndarray passes through.
    data = np.asarray(data)
    n_windows = len(data) - time_steps

    if n_windows <= 0:
        # Too few rows for even one window. Return empties that still carry
        # the window and feature dimensions, so that callers reading
        # X.shape[1] / X.shape[2] keep working instead of hitting a 1-D array.
        n_features = max(data.shape[1] - 1, 0) if data.ndim == 2 else 0
        return (
            np.empty((0, time_steps, n_features), dtype=data.dtype),
            np.empty((0,), dtype=data.dtype),
        )

    # Feature windows: all columns but the last, time_steps rows each.
    X = np.array([data[i:i + time_steps, :-1] for i in range(n_windows)])
    # Targets: the last column of the row that follows each window. Copy so
    # the result does not alias the caller's array.
    y = data[time_steps:, -1].copy()
    return X, y

# Build (samples, time_steps, features) windows and their targets
X, y = create_sequences(data_scaled, time_steps=10)

# Train-Test Split
# Consecutive windows share all but one of their rows, so a shuffled split
# scatters near-duplicate windows across train and test. Keeping the original
# order holds out the last 20% of windows as one contiguous block instead.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, shuffle=False
)

# Define LSTM Model: two stacked LSTM layers with dropout, one linear output
model = Sequential([
    LSTM(64, return_sequences=True, input_shape=(X_train.shape[1], X_train.shape[2])),
    Dropout(0.2),
    LSTM(32),
    Dropout(0.2),
    Dense(1)  # Predict Listing Gain
])

# Compile Model
model.compile(optimizer='adam', loss='mse', metrics=['mae'])

# Create the output directory before training, so a missing or unwritable
# path fails now rather than after all epochs have run.
os.makedirs("../models", exist_ok=True)

# Train Model
# validation_split holds out a fraction of the training data given here;
# NOTE(review): per the Keras docs it takes the last samples before shuffling,
# which with the ordered split above would be a contiguous block -- confirm.
history = model.fit(
    X_train, y_train,
    validation_split=0.2,
    epochs=20,
    batch_size=32,
    verbose=1
)

# Save Model and Scaler
# NOTE(review): Keras treats the .h5 (HDF5) format as legacy; the path is left
# unchanged here because other code may load this exact file.
model.save("../models/best_lstm_model.h5")
with open("../models/scaler.pkl", "wb") as f:
    pickle.dump(scaler, f)

print("Model and scaler saved successfully!")


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Model and scaler saved successfully!


  saving_api.save_model(
