In [1]:
import os
import pickle

# Location of the pickled database that the rest of the notebook splits.
data_folder = "./Data"
file_path = os.path.join(data_folder, "pytorch_database_short_seq.pkl")

# NOTE(review): pickle.load can execute arbitrary code while unpickling;
# only load this file if it comes from a trusted source.
with open(file_path, mode="rb") as database_file:
    loaded_data = pickle.load(database_file)


In [2]:
# Show which top-level entries the loaded dictionary provides.
loaded_data.keys()

dict_keys(['sim_tensor', 'file_names', 'mode_descriptions'])

In [3]:
# Count how many mode descriptions the loaded data holds.
len(loaded_data['mode_descriptions'])

15000

In [4]:
# Mode pairs held out for testing: every ordered pairing of the two modes below.
test_modes = [
    (first_mode, second_mode)
    for first_mode in ('Conduction2', 'Keyhole2')
    for second_mode in ('Conduction2', 'Keyhole2')
]

In [5]:
mode_descriptions = loaded_data['mode_descriptions']

# Positions of every entry whose mode description is one of the test modes.
# NOTE(review): the comparison is exact. The train listing printed further down
# shows labels such as ('Conduction 2', 'Conduction 2') (with a space); these do
# not equal ('Conduction2', 'Conduction2') and therefore stay in the train
# split -- confirm that this is intended.
test_indexes = list(
    filter(
        lambda position: mode_descriptions[position] in test_modes,
        range(len(mode_descriptions)),
    )
)

# Display the size of the test split and its share of all entries.
(len(test_indexes), len(test_indexes) / len(mode_descriptions))

(4500, 0.3)

In [6]:
# Identify indexes for train data: every position that is not a test index.
total_indexes = set(range(len(mode_descriptions)))
# Set iteration order is not guaranteed by the language, so sort the difference
# to keep the train entries in ascending (original dataset) order on every run.
train_indexes = sorted(total_indexes - set(test_indexes))

# Function to extract sub-tensors based on indexes
def extract_sub_tensors(tensor, indexes):
    """Return the part of ``tensor`` selected by ``indexes``.

    Args:
        tensor: Object that supports indexing with ``indexes``.
        indexes: Index expression passed unchanged to ``tensor[...]``.

    Returns:
        The result of ``tensor[indexes]``.
    """
    selected = tensor[indexes]
    return selected

# Allocate data to train and test dictionaries
def _build_split(indexes):
    """Collect the sub-tensor, file names and mode descriptions at ``indexes``.

    Reads from the notebook-level ``loaded_data`` dictionary and returns a new
    dictionary with the keys "seq_tensor", "file_names" and "mode_descriptions".
    """
    return {
        "seq_tensor": extract_sub_tensors(loaded_data["sim_tensor"], indexes),
        "file_names": [loaded_data["file_names"][idx] for idx in indexes],
        "mode_descriptions": [loaded_data["mode_descriptions"][idx] for idx in indexes],
    }


train_data = _build_split(train_indexes)
test_data = _build_split(test_indexes)


In [7]:
# Function to print file names and modes for a given dataset
def print_file_info(dataset, dataset_name, max_rows=None):
    """Print the file name and mode of the entries in a dataset.

    Args:
        dataset: Mapping with "file_names" and "mode_descriptions" entries;
            the two are paired up position by position.
        dataset_name: Label shown in the header line.
        max_rows: Optional non-negative cap on the number of entries printed.
            ``None`` (the default) prints every entry, which can be thousands
            of lines for a full split.
    """
    print(f"Files in {dataset_name}:")
    pairs = zip(dataset["file_names"], dataset["mode_descriptions"])
    for row, (file_name, mode) in enumerate(pairs):
        if max_rows is not None and row >= max_rows:
            # Only reached when at least one more entry exists beyond the cap.
            print(f"... (output truncated at max_rows={max_rows})")
            break
        print(f"File Name: {file_name}, Mode: {mode}")
    # print() appends its own newline, so this leaves two blank lines after the list.
    print("\n")


In [8]:
# Print the file name and mode of every entry in the train set
print_file_info(train_data, "Train Data")


Files in Train Data:
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conduction 2')
File Name: File_0, Mode: ('Conduction 2', 'Conducti

File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name: File_132, Mode: ('Conduction1', 'Keyhole1')
File Name:

File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: File_312, Mode: ('Keyhole1', 'Keyhole1')
File Name: F

In [9]:
# Print the file name and mode of every entry in the test set
print_file_info(test_data, "Test Data")

Files in Test Data:
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: File_70, Mode: ('Conduction2', 'Conduction2')
File Name: 

File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: File_347, Mode: ('Keyhole2', 'Keyhole2')
File Name: F

In [10]:
import torch

# Persist both splits with torch.save, train first and then test.
for split_path, split_payload in (
    ('./Data/train_classification_short_seq', train_data),
    ('./Data/test_classification_short_seq', test_data),
):
    torch.save(split_payload, split_path)