In [1]:
import pandas as pd
import yaml
import argparse
import torch
from model import YNet
from easydict import EasyDict

In [2]:
# Enable IPython's autoreload extension; mode 2 re-imports all loaded modules before each
# cell executes, so edits to local modules are picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

#### Load config file and print hyperparameters

In [3]:
# Registry mapping the `model.name` value from the config to the class that gets instantiated.
model_dict = {
    'ynet': YNet,
}
CONFIG_FILE_PATH = 'config/sdd_trajnet.yaml'  # yaml config file containing all the hyperparameters

# Read the config as UTF-8 explicitly so decoding does not depend on the platform's locale default.
# NOTE(review): yaml.FullLoader can build more than plain scalars/lists/dicts; if a config could
# ever come from an untrusted source, switch to yaml.safe_load.
with open(CONFIG_FILE_PATH, encoding='utf-8') as file:
    params = yaml.load(file, Loader=yaml.FullLoader)
params = EasyDict(params)  # enables attribute access such as params.batch_size

# Name derived from the config path: 'config/sdd_trajnet.yaml' -> 'sdd_trajnet'.
# NOTE(review): the later cells use params.experiment_name rather than this value — confirm which is intended.
experiment_name = CONFIG_FILE_PATH.split('.yaml')[0].split('config/')[1]
params  # last expression: display the loaded hyperparameters



{'resize': 0.33,
 'batch_size': 8,
 'viz_epoch': 10,
 'learning_rate': 0.0001,
 'num_epochs': 300,
 'temperature': 1.8,
 'loss_scale': 1000,
 'kernlen': 31,
 'nsig': 4,
 'unfreeze': 100,
 'use_TTST': True,
 'rel_threshold': 0.002,
 'use_CWS': True,
 'CWS_params': {'sigma_factor': 6, 'ratio': 2, 'rot': True},
 'dataset_name': 'ind',
 'train_data_path': '../dataset/inD/train.pkl',
 'train_image_path': '../dataset/inD/train',
 'val_data_path': '../dataset/inD/test.pkl',
 'val_image_path': '../dataset/inD/test',
 'num_goals': 20,
 'num_traj': 1,
 'experiment_name': 'ind_longterm',
 'waypoints': [14, 29],
 'model': {'name': 'ynet',
  'kwargs': {'obs_len': 5,
   'pred_len': 30,
   'segmentation_model_fp': 'segmentation_models/inD_segmentation.pth',
   'use_features_only': False,
   'semantic_classes': 6,
   'encoder_channels': [32, 32, 64, 64, 64],
   'decoder_channels': [64, 64, 64, 32, 32],
   'waypoints': [14, 29]}}}

#### Some hyperparameters and settings

In [4]:
# Run identity: EXPERIMENT_NAME is an arbitrary label for this experiment.
EXPERIMENT_NAME, DATASET_NAME = params.experiment_name, params.dataset_name

# Data files and image paths for the training and validation splits.
TRAIN_DATA_PATH, TRAIN_IMAGE_PATH = params.train_data_path, params.train_image_path
VAL_DATA_PATH, VAL_IMAGE_PATH = params.val_data_path, params.val_image_path

# Observation / prediction lengths are not read here; the config carries obs_len and
# pred_len under model.kwargs (see the printed params).

# Number of sampled goals (K_e) and trajectories (K_a).
NUM_GOALS, NUM_TRAJ = params.num_goals, params.num_traj

BATCH_SIZE = params.batch_size


#### Load preprocessed Data

In [5]:
# Both splits are stored as pickles and are loaded the same way, training split first.
# NOTE(review): unpickling can execute arbitrary code — only load files from a trusted source.
df_train, df_val = (
    pd.read_pickle(split_path) for split_path in (TRAIN_DATA_PATH, VAL_DATA_PATH)
)

In [6]:
# Preview the first five rows of the training table (5 is the pandas default, made explicit).
df_train.head(n=5)

Unnamed: 0,trackId,frame,x,y,sceneId,metaId,frame_diff,recId
0,31,2217,256.721335,69.443387,scene2,0,1.0,7
1,31,2242,267.350942,79.050983,scene2,0,1.0,7
2,31,2267,276.964578,91.597359,scene2,0,1.0,7
3,31,2292,287.502662,104.240274,scene2,0,1.0,7
4,31,2317,297.761057,116.633497,scene2,0,1.0,7


#### Initialize model

In [7]:
# Resolve the model class from the registry by its configured name, then build it
# with the keyword arguments given in the config's `model.kwargs` section.
model_cfg = params.model
model_cls = model_dict[model_cfg.name]
model = model_cls(**model_cfg.kwargs)



#### Start training
Note: the validation ADE and FDE reported during training are computed without TTST and CWS to save time, so they will be worse than the final evaluation values.

In [8]:
# Launch training on the loaded splits with the settings taken from the config.
model.train(
    df_train,
    df_val,
    params,
    train_image_path=TRAIN_IMAGE_PATH,
    val_image_path=VAL_IMAGE_PATH,
    experiment_name=EXPERIMENT_NAME,
    batch_size=BATCH_SIZE,
    num_goals=NUM_GOALS,
    num_traj=NUM_TRAJ,
    device=None,  # NOTE(review): presumably lets the model choose the device — confirm in model.py
    dataset_name=DATASET_NAME,
)

Preprocess data


Prepare Dataset: 100%|████████████████████████| 24/24 [00:00<00:00, 759.13it/s]
  return np.array(trajectories), meta, scene_list
Prepare Dataset: 100%|█████████████████████████| 1/1 [00:00<00:00, 1091.70it/s]


Start training


  return torch.Tensor(trajectories).squeeze(0), meta, scene[0]
  return _VF.meshgrid(tensors, **kwargs)  # type: ignore[attr-defined]
Epoch:   0%|                                           | 0/300 [00:15<?, ?it/s]


KeyboardInterrupt: 