# Imports

In [None]:
!pip uninstall deepdowmine -y
!pip install git+https://github.com/dsman1823/deepdowmine.git

In [1]:
import numpy as np
import pandas as pd
import torch

from matplotlib import pyplot as plt
from deepdowmine.data import InRAMDataset, RigidDataLoader, prepare_standard_scaler, Scale, SeqRigidDataLoader, WeeklyRigidDataLoader
from deepdowmine.losses import MeanReturns, SharpeRatio, MaximumDrawdown, StandardDeviation
from deepdowmine.nn import DenseNetFullOpti2, DenseNetMinVar2, RnnNetMinVar2, RnnNetMinVar, DenseNetFullOpti2, RnnNetFullOpti2, ConvNetFullOpti2
from deepdowmine.nn import LstmNetMinVar2, LstmNetFullOpti2, RnnNetMinVar3, RnnNetFullOpti3
from deepdowmine.experiments import Run
from deepdowmine.callbacks import EarlyStoppingCallback
from deepdowmine.visualize import generate_metrics_table, generate_weights_table, plot_metrics, plot_weight_heatmap




# Setup

In [2]:
np.random.seed(5)
returns = pd.read_csv('old_train_data_0.csv', index_col = 0).to_numpy()[1:]

In [3]:
len(returns)

2757

In [4]:
n_timesteps, n_assets = len(returns), 5#11**4, 450

#returns = np.random.normal(0, .2, size = (n_timesteps, n_assets))

lookback, gap, horizon = 50, 0, 5# 40, 0, 5   loss=-0.09645, test_loss=-0.08003]
n_samples = n_timesteps - lookback - horizon - gap + 1

indices = np.arange(n_samples)
split_ix = int(n_samples * 0.8)
indices_train = indices[:split_ix]
indices_test = indices[split_ix:]


# print('Train range: {}:{}\nTest range: {}:{}'.format(indices_train[0], indices_train[-1],
#                                                      indices_test[0], indices_test[-1]))

In [5]:
def transform_returns_to_Xy_tensors(returns, lookback, n_timesteps, horizon, gap):
    X_list, y_list = [], []

    for i in range(lookback, n_timesteps - horizon - gap + 1):
        X_list.append(returns[i - lookback: i, :])
        y_list.append(returns[i + gap: i + gap + horizon, :])

    X = np.stack(X_list, axis=0)[:, None, ...]
    y = np.stack(y_list, axis=0)[:, None, ...]

    return X, y

In [6]:

#returns = np.random.normal(0, .2, size = (n_timesteps, n_assets))

# X_list, y_list = [], []

# for i in range(lookback, n_timesteps - horizon - gap + 1):
#     X_list.append(returns[i - lookback: i, :])
#     y_list.append(returns[i + gap: i + gap + horizon, :])

# X = np.stack(X_list, axis=0)[:, None, ...]
# y = np.stack(y_list, axis=0)[:, None, ...]
X, y = transform_returns_to_Xy_tensors(returns, lookback, n_timesteps, horizon, gap)
#print('X: {}, y: {}'.format(X.shape, y.shape))

# means, stds = prepare_standard_scaler(X, indices=indices_train)
# print('mean: {}, std: {}'.format(means, stds))

dataset = InRAMDataset(X, y)
#, transform=Scale(means, stds))

torch.manual_seed(32)

dataloader_train = RigidDataLoader(dataset,
                                   indices=indices_train,
                                   batch_size=32)

dataloader_test = SeqRigidDataLoader(dataset,
                                  indices=indices_test,
                                  batch_size=32)

dataloader_train_for_retrain = RigidDataLoader(dataset,
                                  indices=indices_test,
                                  batch_size=32)
dataloader_test_for_retrain = SeqRigidDataLoader(dataset,
                                   indices=indices_train,
                                   batch_size=32)


# Network setup

In [7]:
network = DenseNetMinVar2(1, 50, 5,  max_weight=1, p=0.2)
print(network)
network = network.train()
loss = SharpeRatio()
run = Run(network,
          loss,
          dataloader_train,
          val_dataloaders={
              'test': dataloader_test,
              'train': dataloader_train
              },
          optimizer=torch.optim.Adam(network.parameters(), amsgrad=True, lr=0.001),
          callbacks=[EarlyStoppingCallback(metric_name='loss',
                                           dataloader_name='test',
                                           patience=5)]) #15 # patience controlls amount offffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffrfvd

DenseNetMinVar2(
  (norm_layer): BatchNorm1d(250, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (dropout_layer): Dropout(p=0.2, inplace=False)
  (linear_for_cov): Linear(in_features=250, out_features=750, bias=True)
  (covariance_layer): CovarianceMatrix()
  (portfolio_opt_layer): ThesisMarkowitzMinVar(
    (cvxpylayer): CvxpyLayer()
  )
)


# Train start

In [8]:
history = run.launch(200)
torch.save(network.state_dict(), 'network.pth')

Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md

Epoch 0: 100%|█████████████████| 68/68 [00:50<00:00,  1.35it/s, loss=-0.07489, test_loss=-0.08515, train_loss=-0.14565]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md

Epoch 1: 100%|█████████████████| 68/68 [00:53<00:00,  1.26it/s

Epoch 10: 100%|████████████████| 68/68 [01:02<00:00,  1.08it/s, loss=-0.43183, test_loss=-0.43727, train_loss=-0.56842]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md

Epoch 11: 100%|████████████████| 68/68 [00:58<00:00,  1.17it/s, loss=-0.45627, test_loss=-0.45733, train_loss=-0.60676]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github

Epoch 21: 100%|████████████████| 68/68 [01:06<00:00,  1.03it/s, loss=-0.55190, test_loss=-0.54495, train_loss=-0.72379]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md

Epoch 22: 100%|████████████████| 68/68 [00:59<00:00,  1.14it/s, loss=-0.58614, test_loss=-0.54375, train_loss=-0.73952]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github

Epoch 32: 100%|████████████████| 68/68 [00:57<00:00,  1.19it/s, loss=-0.67691, test_loss=-0.58934, train_loss=-0.81971]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md

Epoch 33: 100%|████████████████| 68/68 [00:55<00:00,  1.22it/s, loss=-0.68050, test_loss=-0.60301, train_loss=-0.84295]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github

Training interrupted
Training stopped early because there was no improvement in test_loss for 5 epochs


In [9]:
network

DenseNetMinVar2(
  (norm_layer): BatchNorm1d(250, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (dropout_layer): Dropout(p=0.2, inplace=False)
  (linear_for_cov): Linear(in_features=250, out_features=750, bias=True)
  (covariance_layer): CovarianceMatrix()
  (portfolio_opt_layer): ThesisMarkowitzMinVar(
    (cvxpylayer): CvxpyLayer()
  )
)

## Retrain the model on validation set with limited amount of epochs, and limited learning rate

In [11]:
network_retrained =  DenseNetMinVar2(1, 50, 5,  max_weight=1, p=0.2)
network_retrained.load_state_dict(network.state_dict())

##!!!!!!!!!!!!!!!!!!!!!!!!
# state_dict = torch.load('min_var_1.pth')
# network_retrained.load_state_dict(state_dict)
# ####


print(network_retrained)
network_retrained = network_retrained.train()
loss = SharpeRatio()
run = Run(network_retrained,
          loss,
          dataloader_train_for_retrain,
          val_dataloaders={
              'train': dataloader_train_for_retrain,
              'test': dataloader_test_for_retrain
              },
          optimizer=torch.optim.Adam(network_retrained.parameters(), amsgrad=True, lr=0.0005),
)

DenseNetMinVar2(
  (norm_layer): BatchNorm1d(250, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (dropout_layer): Dropout(p=0.2, inplace=False)
  (linear_for_cov): Linear(in_features=250, out_features=750, bias=True)
  (covariance_layer): CovarianceMatrix()
  (portfolio_opt_layer): ThesisMarkowitzMinVar(
    (cvxpylayer): CvxpyLayer()
  )
)


In [12]:
history_retrain = run.launch(20)
torch.save(network_retrained.state_dict(), 'network_retrained.pth')

Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md

Epoch 0: 100%|█████████████████| 17/17 [00:32<00:00,  1.94s/it, loss=-0.13171, test_loss=-0.89458, train_loss=-0.24655]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md

Epoch 1: 100%|█████████████████| 17/17 [00:30<00:00,  1.82s/it

Epoch 10: 100%|████████████████| 17/17 [00:30<00:00,  1.81s/it, loss=-0.61003, test_loss=-0.83114, train_loss=-0.74325]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md

Epoch 11: 100%|████████████████| 17/17 [00:30<00:00,  1.81s/it, loss=-0.62244, test_loss=-0.82674, train_loss=-0.78274]
Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github

In [None]:
network.gamma

# Check model perfomance

In [None]:
  # network = LstmNetMinVar(5)
  # network.load_state_dict(torch.load(fr'network_2.pth'))

In [14]:
per_epoch_results = history.metrics.groupby(['dataloader', 'metric', 'model', 'epoch'])['value']


KeyboardInterrupt



In [None]:
mean_test_loss = per_epoch_results.mean()['test']['loss']['network'] # tmp

# Plotting the mean test loss per epoch
mean_test_loss.plot()

# Finding the epoch with the minimum test loss
min_loss_epoch = mean_test_loss.idxmin()
min_loss_value = mean_test_loss.min()

# Adding a red vertical line at the epoch with minimum test loss
plt.axvline(x=min_loss_epoch, color='r', linestyle='--', label=f'Min Loss at Epoch {min_loss_epoch}')

# Adding some labels and title for clarity
plt.xlabel('Epoch')
plt.ylabel('Test Loss')
plt.title('Validation Loss per Epoch')
plt.legend()

# Show the plot
plt.show()

In [None]:
per_epoch_results.mean()['test']['loss']['network'].mean()

In [None]:
mean_train_loss = per_epoch_results.mean()['train']['loss']['network']

# Plotting the mean test loss per epoch
mean_train_loss.plot()



# Adding some labels and title for clarity
plt.xlabel('Epoch')
plt.ylabel('Train Loss')
plt.title('Train Loss per Epoch')
plt.axvline(x=min_loss_epoch, color='r', linestyle='--', label=f'The best model {min_loss_epoch}')

# Show the plot
plt.show()

In [None]:
network.tmp['output'].shape

# Compute validation factor

In [19]:
X_tensor = torch.tensor(X[indices_test], dtype=torch.float32)
y_tensor = torch.tensor(y[indices_test], dtype=torch.float32)

In [20]:
weights = network(X_tensor)
ewp = weights.new_full(weights.shape, 0.2)

Found Intel OpenMP ('libiomp') and LLVM OpenMP ('libomp') loaded at
the same time. Both libraries are known to be incompatible and this
can cause random crashes or deadlocks on Linux when loaded in the
same Python program.
Using threadpoolctl may cause crashes or deadlocks. For more
information and possible workarounds, please see
    https://github.com/joblib/threadpoolctl/blob/master/multiple_openmp.md



In [21]:
loss(weights, y_tensor).mean()  /  loss(ewp, y_tensor).mean()

tensor(1.5299, grad_fn=<DivBackward0>)

In [27]:
SPY_long = torch.zeros(742, 5)
SPY_long[:, 1] = 1
loss(weights, y_tensor).mean()  /  loss(SPY_long, y_tensor).mean()

tensor(0.8629, grad_fn=<DivBackward0>)

In [None]:
loss(SPY_long, y_tensor).mean()