In [2]:
%pip install torch
%pip install numpy
%pip install pandas
%pip install scikit-learn
%pip install coremltools

Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.
Note: you may need to restart the kernel to use updated packages.


In [7]:
import os
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import DataLoader, TensorDataset
from torch.optim import Adam
from sklearn.model_selection import train_test_split
import numpy as np
import pandas as pd
from numpy import genfromtxt
from sklearn.preprocessing import LabelEncoder

In [8]:
# Set up the paths
HOME_PATH = os.path.expanduser('~')
MODELS_PATH = f'{HOME_PATH}/Developer/BU/research/models'
DATASET_PATH = f'../../../data/'
data_features = f'{DATASET_PATH}/WISDM_x.csv'
data_labels = f'{DATASET_PATH}/WISDM_y.csv'

In [9]:
# Load Data
x = genfromtxt(data_features, delimiter=',')
y_df = pd.read_csv(data_labels)
y = y_df.values.flatten()  # Flatten if y is 2D

# Encode labels
label_encoder = LabelEncoder()
y_encoded = label_encoder.fit_transform(y)

# Function to create time series dataset
def create_series(x, y, timestep, overlap):
    slide_step = int(timestep * (1 - overlap))
    data_num = int((len(x) / slide_step) - 1)
    dataset = np.ndarray(shape=(data_num, timestep, x.shape[1]))
    labels = []

    for i in range(data_num):
        labels.append(y[slide_step * (i + 1) - 1])
        for j in range(timestep):
            dataset[i, j, :] = x[slide_step * i + j, :]

    return dataset, np.array(labels)

# Create time series
timestep = 16  # Replace with your value
overlap = 0.5  # Replace with your value
X_series, y_series = create_series(x, y_encoded, timestep, overlap)

In [10]:
# Split into train and test sets
X_train, X_test, y_train, y_test = train_test_split(X_series, y_series, test_size=0.2, random_state=42)

# Convert to PyTorch tensors
x_train_tensor = torch.tensor(X_train, dtype=torch.float32)
x_test_tensor = torch.tensor(X_test, dtype=torch.float32)
y_train_tensor = torch.tensor(y_train, dtype=torch.long)
y_test_tensor = torch.tensor(y_test, dtype=torch.long)



In [11]:
class LSTMNet(nn.Module):
    def __init__(self, input_size, hidden_size1, hidden_size2, output_size, n_steps):
        super(LSTMNet, self).__init__()
        self.hidden_size1 = hidden_size1
        self.hidden_size2 = hidden_size2
        self.lstm1 = nn.LSTM(input_size, hidden_size1, batch_first=True)
        self.dropout1 = nn.Dropout(0.2)
        self.lstm2 = nn.LSTM(hidden_size1, hidden_size2, batch_first=True)
        self.dropout2 = nn.Dropout(0.2)
        self.fc = nn.Linear(hidden_size2, output_size)

    def forward(self, x):
        # Initialize hidden state and cell state
        h0 = torch.zeros(1, x.size(0), self.hidden_size1).to(x.device)
        c0 = torch.zeros(1, x.size(0), self.hidden_size1).to(x.device)
        
        # First LSTM layer
        out, _ = self.lstm1(x, (h0, c0))
        out = self.dropout1(out)
        
        # Second LSTM layer
        h1 = torch.zeros(1, x.size(0), self.hidden_size2).to(x.device)
        c1 = torch.zeros(1, x.size(0), self.hidden_size2).to(x.device)
        out, _ = self.lstm2(out, (h1, c1))
        out = self.dropout2(out)

        # Dense layer
        out = self.fc(out[:, -1, :]) # Taking the last time step
        return out


In [12]:
# Parameters
input_size = 3  # Number of features
hidden_size1 = 50
hidden_size2 = 25
output_size = 6
n_steps = 16

# Create the model
model = LSTMNet(input_size, hidden_size1, hidden_size2, output_size, n_steps)

# Training setup (for demonstration)
# Define your dataset here
train_dataset = TensorDataset(torch.tensor(X_train, dtype=torch.float32), torch.tensor(y_train, dtype=torch.int64))
train_loader = DataLoader(train_dataset, batch_size=64, shuffle=True)

loss_fn = nn.CrossEntropyLoss()
optimizer = torch.optim.Adam(model.parameters(), lr=0.001)


In [13]:
def train(model, train_loader, loss_fn, optimizer, epochs=0):
    for epoch in range(epochs):
        model.train()
        running_loss = 0.0
        correct = 0
        total = 0

        for X_batch, y_batch in train_loader:
            optimizer.zero_grad()
            y_pred = model(X_batch)
            loss = loss_fn(y_pred, y_batch)
            loss.backward()
            optimizer.step()

            running_loss += loss.item()
            _, predicted = torch.max(y_pred.data, 1)
            total += y_batch.size(0)
            correct += (predicted == y_batch).sum().item()

        avg_loss = running_loss / len(train_loader)
        accuracy = 100 * correct / total
        print(f"Epoch [{epoch+1}/{epochs}], Loss: {avg_loss:.4f}, Accuracy: {accuracy:.2f}%")

train(model, train_loader, loss_fn, optimizer, epochs=20)


Epoch [1/20], Loss: 0.5909, Accuracy: 79.51%
Epoch [2/20], Loss: 0.3590, Accuracy: 87.68%
Epoch [3/20], Loss: 0.2889, Accuracy: 90.30%
Epoch [4/20], Loss: 0.2527, Accuracy: 91.64%
Epoch [5/20], Loss: 0.2293, Accuracy: 92.49%
Epoch [6/20], Loss: 0.2120, Accuracy: 93.09%
Epoch [7/20], Loss: 0.1968, Accuracy: 93.65%
Epoch [8/20], Loss: 0.1863, Accuracy: 93.96%
Epoch [9/20], Loss: 0.1772, Accuracy: 94.30%
Epoch [10/20], Loss: 0.1698, Accuracy: 94.55%
Epoch [11/20], Loss: 0.1624, Accuracy: 94.74%
Epoch [12/20], Loss: 0.1567, Accuracy: 94.90%
Epoch [13/20], Loss: 0.1509, Accuracy: 95.11%
Epoch [14/20], Loss: 0.1462, Accuracy: 95.32%
Epoch [15/20], Loss: 0.1399, Accuracy: 95.44%
Epoch [16/20], Loss: 0.1378, Accuracy: 95.54%
Epoch [17/20], Loss: 0.1345, Accuracy: 95.66%
Epoch [18/20], Loss: 0.1300, Accuracy: 95.85%
Epoch [19/20], Loss: 0.1265, Accuracy: 95.95%
Epoch [20/20], Loss: 0.1239, Accuracy: 96.02%


In [14]:
test_dataset = TensorDataset(torch.tensor(X_test, dtype=torch.float32), torch.tensor(y_test, dtype=torch.int64))
test_loader = DataLoader(test_dataset, batch_size=64, shuffle=False)
def evaluate(model, test_loader, loss_fn):
    model.eval()
    total_loss = 0
    correct = 0
    total = 0
    with torch.no_grad():
        for X_batch, y_batch in test_loader:
            y_pred = model(X_batch)
            total_loss += loss_fn(y_pred, y_batch).item()
            _, predicted = torch.max(y_pred.data, 1)
            total += y_batch.size(0)
            correct += (predicted == y_batch).sum().item()

    avg_loss = total_loss / len(test_loader)
    accuracy = correct / total
    return avg_loss, accuracy

avg_loss, accuracy = evaluate(model, test_loader, loss_fn)
print(f"Test Loss: {avg_loss:.4f}, Test Accuracy: {accuracy:.4f}")



Test Loss: 0.1556, Test Accuracy: 0.9512


In [16]:
model_path = f'{MODELS_PATH}/lstm_base.pth'
torch.save(model.state_dict(), model_path)

### Convert to Coreml

In [21]:
import coremltools as ct
example_input = torch.rand(1,16, 3) 

model.eval()
traced_model = torch.jit.trace(model, example_input)
out = traced_model(example_input)

# Convert to Core ML program using the Unified Conversion API.
mlp_coreml_model = ct.convert(
    traced_model,
    convert_to="mlprogram",
    inputs=[ct.TensorType(shape=example_input.shape)]
 )

# Save the converted model.
mlp_coreml_model.save(f'{MODELS_PATH}/lstm.mlpackage')

Converting PyTorch Frontend ==> MIL Ops:  99%|█████████▉| 113/114 [00:00<00:00, 10060.63 ops/s]
Running MIL frontend_pytorch pipeline: 100%|██████████| 5/5 [00:00<00:00, 3572.05 passes/s]
Running MIL default pipeline: 100%|██████████| 71/71 [00:00<00:00, 1915.76 passes/s]
Running MIL backend_mlprogram pipeline: 100%|██████████| 12/12 [00:00<00:00, 7937.49 passes/s]


### Define Coreml Metrics

In [30]:
from pathlib import Path

def coreml_metrics(model_name, X_test, y_test, model_path):
    predictions = []
    for id in range(len(X_test)):
        X_test_new = np.expand_dims(X_test[id], axis=0)
        output_dict = model_name.predict({'x': X_test_new})
        pred_class = np.argmax(output_dict['linear_0'])
        predictions.append(pred_class)
    
    accuracy = np.sum(predictions == y_test) / len(predictions)
    print("Accuracy:", accuracy)
    
    model_file = Path(model_path)
    
    # Size in bytes
    model_size_bytes = model_file.stat().st_size
    
    # Convert size to kilobytes (optional)
    model_size_kb = model_size_bytes / 1024
    print(f"Size of the model: {model_size_kb:.2f} KB")

In [31]:
import coremltools as ct
import coremltools.optimize.coreml as cto

lstm_coreml_model = ct.models.MLModel(f'{MODELS_PATH}/lstm.mlpackage')

In [32]:
model_name = lstm_coreml_model
model_path = f'{MODELS_PATH}/lstm.mlpackage'

coreml_metrics(model_name, X_test, y_test, model_path)

Accuracy: 0.9512474250400549
Size of the model: 0.12 KB


## Post Training Optimization

In [36]:
from coremltools.optimize.coreml import (
    OpThresholdPrunerConfig,
    OpMagnitudePrunerConfig,
    OpPalettizerConfig,
    OpLinearQuantizerConfig,
    OptimizationConfig,
    prune_weights,
)

### Quantization

In [37]:
op_config = OpLinearQuantizerConfig(
    mode="linear_symmetric", weight_threshold=512
)
config = OptimizationConfig(global_config=op_config)

compressed_8_bit_model = cto.linear_quantize_weights(lstm_coreml_model, config=config)

Running compression pass linear_quantize_weights: 100%|██████████| 11/11 [00:00<00:00, 3076.85 ops/s]
Running MIL frontend_milinternal pipeline: 0 passes [00:00, ? passes/s]
Running MIL default pipeline: 100%|██████████| 69/69 [00:00<00:00, 2681.46 passes/s]
Running MIL backend_mlprogram pipeline: 100%|██████████| 12/12 [00:00<00:00, 5464.30 passes/s]


In [38]:
compressed_8_bit_model.save(f'{MODELS_PATH}/lstm_8bitQuantized_mlmodel.mlpackage')

In [39]:
model_name = compressed_8_bit_model
model_path = f'{MODELS_PATH}/lstm_8bitQuantized_mlmodel.mlpackage'

coreml_metrics(model_name, X_test, y_test, model_path)

Accuracy: 0.9509040970473792
Size of the model: 0.12 KB


### Pruning

#### a) OpMagnitudePrunerConfig: Prune the weights with a constant sparsity percentile

In [40]:
op_config = OpMagnitudePrunerConfig(
    target_sparsity=0.6,
    weight_threshold=1024,
)
config = OptimizationConfig(global_config=op_config)
lstm_magnitude_pruner = prune_weights(lstm_coreml_model, config=config)


Running compression pass prune_weights: 100%|██████████| 11/11 [00:00<00:00, 2459.74 ops/s]
Running MIL frontend_milinternal pipeline: 0 passes [00:00, ? passes/s]
Running MIL default pipeline: 100%|██████████| 69/69 [00:00<00:00, 2707.27 passes/s]
Running MIL backend_mlprogram pipeline: 100%|██████████| 12/12 [00:00<00:00, 5454.82 passes/s]


In [41]:
lstm_magnitude_pruner.save(f'{MODELS_PATH}/lstm_magnitude_pruner.mlpackage')

In [42]:
model_name = lstm_magnitude_pruner
model_path = f'{MODELS_PATH}/lstm_magnitude_pruner.mlpackage'

coreml_metrics(model_name, X_test, y_test, model_path)

Accuracy: 0.7891203173876554
Size of the model: 0.12 KB


#### b) OpThresholdPrunerConfig: Sets all weight values below a certain value.

In [43]:
op_config = OpThresholdPrunerConfig(
    threshold=0.001,
    minimum_sparsity_percentile=0.01,
    weight_threshold=1024,
)

config = OptimizationConfig(global_config=op_config)
lstm_threshold_pruner = prune_weights(lstm_coreml_model, config=config)

Running compression pass prune_weights:   0%|          | 0/11 [00:00<?, ? ops/s]weight value has sparsity of 0.0024 < minimum_sparsity_percentile 0.01. Skipped.
weight value has sparsity of 0.0028 < minimum_sparsity_percentile 0.01. Skipped.
weight value has sparsity of 0.0052 < minimum_sparsity_percentile 0.01. Skipped.
Running compression pass prune_weights: 100%|██████████| 11/11 [00:00<00:00, 7519.12 ops/s]
Running MIL frontend_milinternal pipeline: 0 passes [00:00, ? passes/s]
Running MIL default pipeline: 100%|██████████| 69/69 [00:00<00:00, 3322.58 passes/s]
Running MIL backend_mlprogram pipeline: 100%|██████████| 12/12 [00:00<00:00, 6826.48 passes/s]


In [44]:
lstm_threshold_pruner.save(f'{MODELS_PATH}/lstm_threshold_pruner.mlpackage')

In [45]:
model_name = lstm_threshold_pruner
model_path = f'{MODELS_PATH}/lstm_threshold_pruner.mlpackage'

coreml_metrics(model_name, X_test, y_test, model_path)

Accuracy: 0.9512474250400549
Size of the model: 0.12 KB


### Palletization

In [46]:
op_config = OpPalettizerConfig(
    mode="kmeans", 
    nbits=6
)

config = OptimizationConfig(global_config=op_config)
lstm_palettizer = cto.palettize_weights(lstm_coreml_model, config=config)

Running compression pass palettize_weights: 100%|██████████| 11/11 [00:00<00:00, 30.84 ops/s]
Running MIL frontend_milinternal pipeline: 0 passes [00:00, ? passes/s]
Running MIL default pipeline: 100%|██████████| 69/69 [00:00<00:00, 2198.99 passes/s]
Running MIL backend_mlprogram pipeline: 100%|██████████| 12/12 [00:00<00:00, 2636.82 passes/s]


In [47]:
lstm_palettizer.save(f'{MODELS_PATH}/lstm_palettizer.mlpackage')

In [48]:
model_name = lstm_palettizer
model_path = f'{MODELS_PATH}/lstm_palettizer.mlpackage'

coreml_metrics(model_name, X_test, y_test, model_path)

Accuracy: 0.9506752117189288
Size of the model: 0.12 KB
