# AE on proteins in SA representation

In [1]:
import glob
import os
from collections import Counter
import string
from keras import Input
from keras.layers import Dense, Lambda, Conv1D
import keras.backend as K
from keras.models import Model
from keras.objectives import binary_crossentropy, mse
import os
import random
import numpy as np
import NotebookLoader
from keras.optimizers import RMSprop, Adam
from keras.utils.np_utils import to_categorical
from sklearn.model_selection import train_test_split
from keras.callbacks import ModelCheckpoint, TensorBoard
from keras.models import load_model
from tempfile import TemporaryFile
import csv

Using TensorFlow backend.


In [2]:
import Preprocessing as pre

importing Jupyter notebook from Preprocessing.ipynb


### Configs

In [3]:
lengths = {}
for f in pre.families:
    proteins = glob.glob(os.path.join(pre.family_paths[f], "*.out"))
    print("Proteins for family %s" %f)
    for p in proteins:
        print(p)
    lengths[f] = len(p)
total = sum([lengths[f] for f in pre.families])

Proteins for family fam_1
../dataset/families/fam_1/2EBN.lf_str.out
../dataset/families/fam_1/1JFX.lf_str.out
../dataset/families/fam_1/1ITX.lf_str.out
../dataset/families/fam_1/1NAR.lf_str.out
../dataset/families/fam_1/1KFW.lf_str.out
../dataset/families/fam_1/1B1Y.lf_str.out
../dataset/families/fam_1/1VFF.lf_str.out
../dataset/families/fam_1/1EDG.lf_str.out
../dataset/families/fam_1/1CNV.lf_str.out
Proteins for family fam_2
../dataset/families/fam_2/1HLB.lf_str.out
../dataset/families/fam_2/2LHB.lf_str.out
../dataset/families/fam_2/1DLW.lf_str.out
../dataset/families/fam_2/1ITH.lf_str.out
../dataset/families/fam_2/1ECA.lf_str.out
../dataset/families/fam_2/1ASH.lf_str.out
../dataset/families/fam_2/1MBA.lf_str.out
../dataset/families/fam_2/2HBG.lf_str.out
Proteins for family fam_3
../dataset/families/fam_3/2SAS.lf_str.out
../dataset/families/fam_3/1OMR.lf_str.out
../dataset/families/fam_3/1SRA.lf_str.out
../dataset/families/fam_3/1CB1.lf_str.out
../dataset/families/fam_3/1IQ3.lf_str.ou

In [4]:
padding = True
num_classes = 25
categorical = False
use_angles = True
max_length = 668
flatten = True

In [5]:
batch_size = 64
intermediate_dim = 25
epochs = 20
learning_rate = 0.001

### Build the autoencoder

In [6]:
def create_checkpoints(f):
    checkpoints_path = os.path.join("models", f)
    tensorboard_path = os.path.join("logs", f)
    cp_cb = ModelCheckpoint(filepath=os.path.join(checkpoints_path, "model" + f + ".hdf5"), monitor='val_loss',
                            save_best_only=True)
    tb_cb = TensorBoard(log_dir=tensorboard_path)
    return [cp_cb, tb_cb]

In [7]:
#autoencoder
def get_ae():
    if categorical:
        if not flatten:
            model_input = Input(shape=(None,num_classes))
        else:
            model_input = Input(shape=(max_length*num_classes,))
    elif use_angles:
        model_input = Input(shape=(max_length*3,))
    else:
        model_input = Input(shape=(max_length,))
    #x=Conv1D(intermediate_dim, activation='sigmoid', kernel_size=3, padding='same', dilation_rate=1)(model_input)
    #encoded=Conv1D(intermediate_dim, activation='sigmoid', kernel_size=3, padding='same', dilation_rate=1, name="encoded")(x)
    #x=Conv1D(num_classes, activation='sigmoid', kernel_size=3, padding='same', dilation_rate=1)(encoded)
    encoded= Dense(intermediate_dim, activation='sigmoid')(model_input)
    if categorical:
        if not flatten:
            x = Dense(num_classes, activation='sigmoid')(encoded)
        else:
            x = Dense(max_length*num_classes, activation='sigmoid')(encoded)
    elif use_angles:
        x = Dense(max_length*3, activation='sigmoid')(encoded)
    else:
        x = Dense(max_length, activation='sigmoid')(encoded)
    ae=Model(inputs=model_input, outputs=[x])
    opt=RMSprop(lr=learning_rate)
    ae.compile(optimizer=opt, loss='binary_crossentropy', metrics=['mean_absolute_error'])
    ae.summary()
    return ae

### Train and evaluate the autoencoder for specific classes

In [8]:
models = {"fam_1": "models/fam_1/modelfam_1.hdf5",
          "fam_2": "models/fam_2/modelfam_2.hdf5",
          "fam_3": "models/fam_3/modelfam_3.hdf5",
          "fam_4": "models/fam_4/modelfam_4.hdf5",
          "fam_5": "models/fam_5/modelfam_5.hdf5",
          "fam_6": "models/fam_6/modelfam_6.hdf5",
          "fam_7": "models/fam_7/modelfam_7.hdf5",
          "fam_8": "models/fam_8/modelfam_8.hdf5",
          "fam_9": "models/fam_9/modelfam_9.hdf5"}

In [9]:
path = '/tmp/data_serialized_proteins'
#for r in range(1, 10):
#    os.makedirs(os.path.join(path, 'fam_%d' % r))

In [10]:
def evaluate_for_fam(f):
    print("Test for autoencoder on fam %s" %f)
    train_filename = os.path.join(path, f, "train.npy")
    train = np.load(train_filename)
    ae = load_model(models[f])
    ae.summary()
    losses_train = []
    for t in train:
        losses_train.append(ae.evaluate(np.array([t]),np.array([t]), verbose=0)[1])
    max_l = max(losses_train)
    losses_test = []
    del train
    tp, tn, fp, fn = 0, 0, 0, 0
    tp_p, tn_p, fp_p, fn_p = 0, 0, 0, 0
    for ft in pre.families:
        print("Test for fam %s" %ft)
        test_filename = os.path.join(path, ft, "test.npy")
        test = np.load(test_filename)
        for t in test:
            loss=ae.evaluate(np.array([t]),np.array([t]), verbose=0)[1]
            if loss > max_l:
                # predict other family
                if ft == f:
                    fn+=1
                else:
                    tn+=1
            else:
                # predict current family
                if ft == f:
                    tp+=1 
                else:
                    fp+=1
            # compute the probability
            if loss > max_l:
                pr = 1 - (max_l / (2 * loss))
            else:
                pr = loss / (2 * max_l)
            if pr >= 0.5:
                # predict other family
                if ft == f:
                    fn_p+=1
                else:
                    tn_p+=1
            else:
                # predict current family
                if ft == f:
                    tp_p+=1 
                else:
                    fp_p+=1  
        del test
    return [tp, tn, fp, fn], [tp_p, tn_p, fp_p, fn_p]

In [11]:
# %%capture output

res_fam = open('res_fam_conf.csv', mode='w')
res_avg = open('res_avg_conf.csv', mode='w')
writer_fam = csv.writer(res_fam, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
writer_fam.writerow(['Iteration', 'Superfamily', 'TP', 'TN', 'FP', 'FN', 'Prec', 'Recall', 'Spec', 'AUC'])
writer_avg = csv.writer(res_avg, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
writer_avg.writerow(['Iteration', 'Prec', 'Recall', 'Spec', 'AUC'])
for i in range(0,20):
    for f in pre.families:
        families_conf = pre.load_family(f)
        test_size = int(0.25 * len(families_conf))
        val_size =  int(0.15 * len(families_conf))
        train_all, test = train_test_split(families_conf, test_size=test_size, random_state=i)
        del families_conf
        train, val = train_test_split(train_all, test_size = val_size, random_state=i)
        del train_all
        train_filename = os.path.join(path, f, "train.npy")
      
        train = pre.process_conf(train, categorical=categorical, use_angles=use_angles, padding=padding, max_length=max_length, flatten=flatten)  
        print("train: " + repr(train.shape))
        np.save(train_filename, train)
        del train
        
        val = pre.process_conf(val, categorical=categorical, use_angles=use_angles, padding=padding, max_length=max_length, flatten=flatten)  
        print("val: " + repr(val.shape))
        val_filename = os.path.join(path, f, "val.npy")
        np.save(val_filename, val)
        del val
        
        test = pre.process_conf(test, categorical=categorical, use_angles=use_angles, padding=padding, max_length=max_length, flatten=flatten)  

        print("test: " + repr(test.shape))
        test_filename = os.path.join(path, f, "test.npy")
        np.save(test_filename, test)
        del test
        
    for f in pre.families:
        print("Training for family %s" %f)
        train_filename = os.path.join(path, f, "train.npy")
        test_filename = os.path.join(path, f, "val.npy")
        train = np.load(train_filename)
        test = np.load(test_filename)
        print("train: " + repr(train.shape))
        print("test" + repr(test.shape))
        ae = get_ae()
        ae.fit(train, train,
               shuffle=True,
               epochs=epochs,
               batch_size=batch_size,
               validation_data=(test, test),
               callbacks=create_checkpoints(f),
               verbose=1)    
        del train
        del test
    # evaluate
    tp, tn, fp, fn = {}, {}, {}, {}
    tp_p, tn_p, fp_p, fn_p = {}, {}, {}, {}
    prec, recall, spec, auc = {}, {}, {}, {}
    prec_p, recall_p, spec_p, auc_p = {}, {}, {}, {}
    for f in pre.families:
        print("Evaluating family %s" %f)
        [tp[f], tn[f], fp[f], fn[f]], [tp_p[f], tn_p[f], fp_p[f], fn_p[f]] = evaluate_for_fam(f)
        prec_p[f] = (1.0* tp_p[f] / (tp_p[f] + fp_p[f]))
        recall_p[f] = (1.0* tp_p[f] / (tp_p[f] + fn_p[f]))
        spec_p[f] = (1.0* tn_p[f] / (tn_p[f] + fp_p[f]))
        auc_p[f] = (recall_p[f] + spec_p[f]) / 2
        # write to csv 
        print([i, f, tp_p[f], tn_p[f], fp_p[f], tn_p[f], prec_p[f], recall_p[f], spec_p[f], auc_p[f]])
        writer_fam.writerow([i, f, tp_p[f], tn_p[f], fp_p[f], tn_p[f], prec_p[f], recall_p[f], spec_p[f], auc_p[f]])
    prec_wavg_p, recall_wavg_p, spec_wavg_p, auc_wavg_p = 0, 0, 0, 0
    for f in pre.families:
        prec_wavg_p += lengths[f] * prec_p[f] / total
        recall_wavg_p += lengths[f] * recall_p[f] / total
        spec_wavg_p += lengths[f] * spec_p[f] / total
        auc_wavg_p += lengths[f] * auc_p[f] / total
    # write to csv
    print([i, prec_wavg_p, recall_wavg_p, spec_wavg_p, auc_wavg_p])
    writer_avg.writerow([i, prec_wavg_p, recall_wavg_p, spec_wavg_p, auc_wavg_p])
res_fam.close()
res_avg.close()

Proteins for family fam_1
../dataset/families/fam_1/2EBN.lf_str.out
../dataset/families/fam_1/1JFX.lf_str.out
../dataset/families/fam_1/1ITX.lf_str.out
../dataset/families/fam_1/1NAR.lf_str.out
../dataset/families/fam_1/1KFW.lf_str.out
../dataset/families/fam_1/1B1Y.lf_str.out
../dataset/families/fam_1/1VFF.lf_str.out
../dataset/families/fam_1/1EDG.lf_str.out
../dataset/families/fam_1/1CNV.lf_str.out
Counter({282: 10000, 214: 10000, 416: 10000, 286: 10000, 432: 10000, 497: 10000, 420: 10000, 377: 10000, 280: 10000})
(54000, 668, 3)
(54000, 2004)
train: (54000, 2004)
(13500, 668, 3)
(13500, 2004)
val: (13500, 2004)
(22500, 668, 3)
(22500, 2004)
test: (22500, 2004)
Proteins for family fam_2
../dataset/families/fam_2/1HLB.lf_str.out
../dataset/families/fam_2/2LHB.lf_str.out
../dataset/families/fam_2/1DLW.lf_str.out
../dataset/families/fam_2/1ITH.lf_str.out
../dataset/families/fam_2/1ECA.lf_str.out
../dataset/families/fam_2/1ASH.lf_str.out
../dataset/families/fam_2/1MBA.lf_str.out
../datas

Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_2 (InputLayer)         (None, 2004)              0         
_________________________________________________________________
dense_3 (Dense)              (None, 25)                50125     
_________________________________________________________________
dense_4 (Dense)              (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 

Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_4 (InputLayer)         (None, 2004)              0         
_________________________________________________________________
dense_7 (Dense)              (None, 25)                50125     
_________________________________________________________________
dense_8 (Dense)              (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16

Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_6 (InputLayer)         (None, 2004)              0         
_________________________________________________________________
dense_11 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_12 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14

Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_8 (InputLayer)         (None, 2004)              0         
_________________________________________________________________
dense_15 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_16 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/2

Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_1 (InputLayer)         (None, 2004)              0         
_________________________________________________________________
dense_1 (Dense)              (None, 25)                50125     
_________________________________________________________________
dense_2 (Dense)              (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam f

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[0, 'fam_6', 12500, 122518, 2482, 122518, 0.8343345347750634, 1.0, 0.980144, 0.9900720000000001]
Evaluating family fam_7
Test for autoencoder on fam fam_7
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_7 (InputLayer)         (None, 2004)              0         
_________________________________________________________________
dense_13 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_14 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_

Train on 54000 samples, validate on 13500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_11 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_21 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_22 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoc

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_13 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_25 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_26 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_15 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_29 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_30 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_17 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_33 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_34 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_10 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_19 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_20 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test 

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[1, 'fam_5', 12500, 125000, 0, 125000, 1.0, 1.0, 1.0, 1.0]
Evaluating family fam_6
Test for autoencoder on fam fam_6
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_15 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_29 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_30 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_

Proteins for family fam_8
../dataset/families/fam_8/1AF7.lf_str.out
../dataset/families/fam_8/1Y8C.lf_str.out
../dataset/families/fam_8/1DUS.lf_str.out
../dataset/families/fam_8/1F3L.lf_str.out
../dataset/families/fam_8/1YUB.lf_str.out
Counter({271: 10000, 243: 10000, 191: 10000, 318: 10000, 242: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Proteins for family fam_9
../dataset/families/fam_9/1EE6.lf_str.out
../dataset/families/fam_9/1VBL.lf_str.out
../dataset/families/fam_9/1BHE.lf_str.out
../dataset/families/fam_9/1RU4.lf_str.out
../dataset/families/fam_9/1QCX.lf_str.out
Counter({194: 10000, 413: 10000, 373: 10000, 397: 10000, 356: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Training for family fam_1
train: (54000, 2004)
test(13500, 2004)
_____________________________

Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_21 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_41 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_42 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_23 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_45 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_46 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17

Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_7
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_25 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_49 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_50 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15

Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_9
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_27 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_53 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_54 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[2, 'fam_2', 20000, 44976, 72524, 44976, 0.21616013142535992, 1.0, 0.3827744680851064, 0.6913872340425532]
Evaluating family fam_3
Test for autoencoder on fam fam_3
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_21 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_41 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_42 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test fo

(54000, 668, 3)
(54000, 2004)
train: (54000, 2004)
(13500, 668, 3)
(13500, 2004)
val: (13500, 2004)
(22500, 668, 3)
(22500, 2004)
test: (22500, 2004)
Proteins for family fam_2
../dataset/families/fam_2/1HLB.lf_str.out
../dataset/families/fam_2/2LHB.lf_str.out
../dataset/families/fam_2/1DLW.lf_str.out
../dataset/families/fam_2/1ITH.lf_str.out
../dataset/families/fam_2/1ECA.lf_str.out
../dataset/families/fam_2/1ASH.lf_str.out
../dataset/families/fam_2/1MBA.lf_str.out
../dataset/families/fam_2/2HBG.lf_str.out
Counter({144: 20000, 154: 10000, 146: 10000, 113: 10000, 279: 10000, 133: 10000, 143: 10000})
(48000, 668, 3)
(48000, 2004)
train: (48000, 2004)
(12000, 668, 3)
(12000, 2004)
val: (12000, 2004)
(20000, 668, 3)
(20000, 2004)
test: (20000, 2004)
Proteins for family fam_3
../dataset/families/fam_3/2SAS.lf_str.out
../dataset/families/fam_3/1OMR.lf_str.out
../dataset/families/fam_3/1SRA.lf_str.out
../dataset/families/fam_3/1CB1.lf_str.out
../dataset/families/fam_3/1IQ3.lf_str.out
../datas

Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_29 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_57 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_58 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(90

Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_31 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_61 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_62 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train:

Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_33 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_65 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_66 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training

Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_35 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_69 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_70 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_28 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_55 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_56 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[3, 'fam_1', 22500, 105291, 9709, 105291, 0.69856251358316, 1.0, 0.91557391

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[3, 'fam_7', 14999, 117419, 5081, 117419, 0.7469621513944223, 0.9999333333333333, 0.9585224489795918, 0.9792278911564626]
Evaluating family fam_8
Test for autoencoder on fam fam_8
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_35 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_69 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_70 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fa

Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_38 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_75 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_76 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20

Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_40 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_79 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_80 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
E

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_42 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_83 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_84 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_44 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_87 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_88 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_37 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_73 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_74 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test 

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[4, 'fam_5', 12500, 125000, 0, 125000, 1.0, 1.0, 1.0, 1.0]
Evaluating family fam_6
Test for autoencoder on fam fam_6
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_42 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_83 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_84 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_

Proteins for family fam_8
../dataset/families/fam_8/1AF7.lf_str.out
../dataset/families/fam_8/1Y8C.lf_str.out
../dataset/families/fam_8/1DUS.lf_str.out
../dataset/families/fam_8/1F3L.lf_str.out
../dataset/families/fam_8/1YUB.lf_str.out
Counter({271: 10000, 243: 10000, 191: 10000, 318: 10000, 242: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Proteins for family fam_9
../dataset/families/fam_9/1EE6.lf_str.out
../dataset/families/fam_9/1VBL.lf_str.out
../dataset/families/fam_9/1BHE.lf_str.out
../dataset/families/fam_9/1RU4.lf_str.out
../dataset/families/fam_9/1QCX.lf_str.out
Counter({194: 10000, 413: 10000, 373: 10000, 397: 10000, 356: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Training for family fam_1
train: (54000, 2004)
test(13500, 2004)
_____________________________

Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_48 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_95 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_96 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_50 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_99 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_100 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17

Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_7
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_52 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_103 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_104 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15

Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_9
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_54 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_107 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_108 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[5, 'fam_2', 20000, 45057, 72443, 45057, 0.2163495343076274, 1.0, 0.38346382978723403, 0.691731914893617]
Evaluating family fam_3
Test for autoencoder on fam fam_3
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_48 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_95 (Dense)             (None, 25)                50125     
_________________________________________________________________
dense_96 (Dense)             (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for

(54000, 668, 3)
(54000, 2004)
train: (54000, 2004)
(13500, 668, 3)
(13500, 2004)
val: (13500, 2004)
(22500, 668, 3)
(22500, 2004)
test: (22500, 2004)
Proteins for family fam_2
../dataset/families/fam_2/1HLB.lf_str.out
../dataset/families/fam_2/2LHB.lf_str.out
../dataset/families/fam_2/1DLW.lf_str.out
../dataset/families/fam_2/1ITH.lf_str.out
../dataset/families/fam_2/1ECA.lf_str.out
../dataset/families/fam_2/1ASH.lf_str.out
../dataset/families/fam_2/1MBA.lf_str.out
../dataset/families/fam_2/2HBG.lf_str.out
Counter({144: 20000, 154: 10000, 146: 10000, 113: 10000, 279: 10000, 133: 10000, 143: 10000})
(48000, 668, 3)
(48000, 2004)
train: (48000, 2004)
(12000, 668, 3)
(12000, 2004)
val: (12000, 2004)
(20000, 668, 3)
(20000, 2004)
test: (20000, 2004)
Proteins for family fam_3
../dataset/families/fam_3/2SAS.lf_str.out
../dataset/families/fam_3/1OMR.lf_str.out
../dataset/families/fam_3/1SRA.lf_str.out
../dataset/families/fam_3/1CB1.lf_str.out
../dataset/families/fam_3/1IQ3.lf_str.out
../datas

Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_56 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_111 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_112 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(90

Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_58 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_115 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_116 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train:

Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_60 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_119 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_120 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training

Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_62 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_123 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_124 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_55 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_109 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_110 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[6, 'fam_1', 22497, 89978, 25022, 89978, 0.4734316799595951, 0.999866666666

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[6, 'fam_7', 15000, 117505, 4995, 117505, 0.7501875468867217, 1.0, 0.9592244897959183, 0.9796122448979592]
Evaluating family fam_8
Test for autoencoder on fam fam_8
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_62 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_123 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_124 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test fo

Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_65 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_129 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_130 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20

Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_67 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_133 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_134 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
E

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_69 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_137 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_138 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_71 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_141 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_142 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_64 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_127 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_128 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test 

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[7, 'fam_5', 12500, 125000, 0, 125000, 1.0, 1.0, 1.0, 1.0]
Evaluating family fam_6
Test for autoencoder on fam fam_6
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_69 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_137 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_138 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_

Proteins for family fam_8
../dataset/families/fam_8/1AF7.lf_str.out
../dataset/families/fam_8/1Y8C.lf_str.out
../dataset/families/fam_8/1DUS.lf_str.out
../dataset/families/fam_8/1F3L.lf_str.out
../dataset/families/fam_8/1YUB.lf_str.out
Counter({271: 10000, 243: 10000, 191: 10000, 318: 10000, 242: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Proteins for family fam_9
../dataset/families/fam_9/1EE6.lf_str.out
../dataset/families/fam_9/1VBL.lf_str.out
../dataset/families/fam_9/1BHE.lf_str.out
../dataset/families/fam_9/1RU4.lf_str.out
../dataset/families/fam_9/1QCX.lf_str.out
Counter({194: 10000, 413: 10000, 373: 10000, 397: 10000, 356: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Training for family fam_1
train: (54000, 2004)
test(13500, 2004)
_____________________________

Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_75 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_149 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_150 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_77 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_153 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_154 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17

Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_7
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_79 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_157 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_158 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15

Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_9
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_81 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_161 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_162 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[8, 'fam_2', 20000, 44906, 72594, 44906, 0.21599671684990387, 1.0, 0.3821787234042553, 0.6910893617021276]
Evaluating family fam_3
Test for autoencoder on fam fam_3
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_75 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_149 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_150 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test fo

(54000, 668, 3)
(54000, 2004)
train: (54000, 2004)
(13500, 668, 3)
(13500, 2004)
val: (13500, 2004)
(22500, 668, 3)
(22500, 2004)
test: (22500, 2004)
Proteins for family fam_2
../dataset/families/fam_2/1HLB.lf_str.out
../dataset/families/fam_2/2LHB.lf_str.out
../dataset/families/fam_2/1DLW.lf_str.out
../dataset/families/fam_2/1ITH.lf_str.out
../dataset/families/fam_2/1ECA.lf_str.out
../dataset/families/fam_2/1ASH.lf_str.out
../dataset/families/fam_2/1MBA.lf_str.out
../dataset/families/fam_2/2HBG.lf_str.out
Counter({144: 20000, 154: 10000, 146: 10000, 113: 10000, 279: 10000, 133: 10000, 143: 10000})
(48000, 668, 3)
(48000, 2004)
train: (48000, 2004)
(12000, 668, 3)
(12000, 2004)
val: (12000, 2004)
(20000, 668, 3)
(20000, 2004)
test: (20000, 2004)
Proteins for family fam_3
../dataset/families/fam_3/2SAS.lf_str.out
../dataset/families/fam_3/1OMR.lf_str.out
../dataset/families/fam_3/1SRA.lf_str.out
../dataset/families/fam_3/1CB1.lf_str.out
../dataset/families/fam_3/1IQ3.lf_str.out
../datas

Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_83 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_165 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_166 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(90

Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_85 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_169 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_170 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train:

Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_87 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_173 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_174 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training

Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_89 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_177 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_178 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_82 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_163 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_164 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[9, 'fam_1', 22500, 89899, 25101, 89899, 0.4726791453961051, 1.0, 0.7817304

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[9, 'fam_7', 15000, 117545, 4955, 117545, 0.7516913054372337, 1.0, 0.9595510204081633, 0.9797755102040817]
Evaluating family fam_8
Test for autoencoder on fam fam_8
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_89 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_177 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_178 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test fo

Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_92 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_183 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_184 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20

Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_94 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_187 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_188 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
E

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_96 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_191 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_192 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_98 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_195 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_196 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_91 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_181 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_182 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test 

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[10, 'fam_5', 12498, 125000, 0, 125000, 1.0, 0.99984, 1.0, 0.9999199999999999]
Evaluating family fam_6
Test for autoencoder on fam fam_6
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_96 (InputLayer)        (None, 2004)              0         
_________________________________________________________________
dense_191 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_192 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam

(15000, 668, 3)
(15000, 2004)
test: (15000, 2004)
Proteins for family fam_8
../dataset/families/fam_8/1AF7.lf_str.out
../dataset/families/fam_8/1Y8C.lf_str.out
../dataset/families/fam_8/1DUS.lf_str.out
../dataset/families/fam_8/1F3L.lf_str.out
../dataset/families/fam_8/1YUB.lf_str.out
Counter({271: 10000, 243: 10000, 191: 10000, 318: 10000, 242: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Proteins for family fam_9
../dataset/families/fam_9/1EE6.lf_str.out
../dataset/families/fam_9/1VBL.lf_str.out
../dataset/families/fam_9/1BHE.lf_str.out
../dataset/families/fam_9/1RU4.lf_str.out
../dataset/families/fam_9/1QCX.lf_str.out
Counter({194: 10000, 413: 10000, 373: 10000, 397: 10000, 356: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Training for family fam_1
train: (54000, 200

Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_102 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_203 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_204 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18

Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_104 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_207 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_208 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16

Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_7
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_106 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_211 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_212 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14

Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_9
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_108 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_215 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_216 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/2

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[11, 'fam_2', 19999, 44799, 72701, 44799, 0.21573894282632147, 0.99995, 0.381268085106383, 0.6906090425531914]
Evaluating family fam_3
Test for autoencoder on fam fam_3
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_102 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_203 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_204 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Tes

(54000, 668, 3)
(54000, 2004)
train: (54000, 2004)
(13500, 668, 3)
(13500, 2004)
val: (13500, 2004)
(22500, 668, 3)
(22500, 2004)
test: (22500, 2004)
Proteins for family fam_2
../dataset/families/fam_2/1HLB.lf_str.out
../dataset/families/fam_2/2LHB.lf_str.out
../dataset/families/fam_2/1DLW.lf_str.out
../dataset/families/fam_2/1ITH.lf_str.out
../dataset/families/fam_2/1ECA.lf_str.out
../dataset/families/fam_2/1ASH.lf_str.out
../dataset/families/fam_2/1MBA.lf_str.out
../dataset/families/fam_2/2HBG.lf_str.out
Counter({144: 20000, 154: 10000, 146: 10000, 113: 10000, 279: 10000, 133: 10000, 143: 10000})
(48000, 668, 3)
(48000, 2004)
train: (48000, 2004)
(12000, 668, 3)
(12000, 2004)
val: (12000, 2004)
(20000, 668, 3)
(20000, 2004)
test: (20000, 2004)
Proteins for family fam_3
../dataset/families/fam_3/2SAS.lf_str.out
../dataset/families/fam_3/1OMR.lf_str.out
../dataset/families/fam_3/1SRA.lf_str.out
../dataset/families/fam_3/1CB1.lf_str.out
../dataset/families/fam_3/1IQ3.lf_str.out
../datas

Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_110 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_219 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_220 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(90

Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_112 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_223 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_224 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train:

Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_114 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_227 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_228 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training

Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_116 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_231 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_232 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_109 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_217 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_218 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[12, 'fam_1', 22500, 102696, 12304, 102696, 0.6464774163889209, 1.0, 0.8930

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[12, 'fam_7', 15000, 117439, 5061, 117439, 0.7477194556602362, 1.0, 0.9586857142857143, 0.9793428571428571]
Evaluating family fam_8
Test for autoencoder on fam fam_8
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_116 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_231 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_232 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test f

Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_119 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_237 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_238 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20

Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_121 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_241 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_242 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
E

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_123 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_245 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_246 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_125 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_249 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_250 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_118 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_235 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_236 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test 

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[13, 'fam_5', 12499, 125000, 0, 125000, 1.0, 0.99992, 1.0, 0.99996]
Evaluating family fam_6
Test for autoencoder on fam fam_6
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_123 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_245 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_246 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for

Proteins for family fam_8
../dataset/families/fam_8/1AF7.lf_str.out
../dataset/families/fam_8/1Y8C.lf_str.out
../dataset/families/fam_8/1DUS.lf_str.out
../dataset/families/fam_8/1F3L.lf_str.out
../dataset/families/fam_8/1YUB.lf_str.out
Counter({271: 10000, 243: 10000, 191: 10000, 318: 10000, 242: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Proteins for family fam_9
../dataset/families/fam_9/1EE6.lf_str.out
../dataset/families/fam_9/1VBL.lf_str.out
../dataset/families/fam_9/1BHE.lf_str.out
../dataset/families/fam_9/1RU4.lf_str.out
../dataset/families/fam_9/1QCX.lf_str.out
Counter({194: 10000, 413: 10000, 373: 10000, 397: 10000, 356: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Training for family fam_1
train: (54000, 2004)
test(13500, 2004)
_____________________________

Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_129 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_257 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_258 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_131 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_261 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_262 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17

Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_7
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_133 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_265 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_266 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15

Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_9
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_135 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_269 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_270 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[14, 'fam_2', 19999, 45027, 72473, 45027, 0.21627087118262825, 0.99995, 0.38320851063829786, 0.6915792553191489]
Evaluating family fam_3
Test for autoencoder on fam fam_3
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_129 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_257 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_258 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
T

(54000, 668, 3)
(54000, 2004)
train: (54000, 2004)
(13500, 668, 3)
(13500, 2004)
val: (13500, 2004)
(22500, 668, 3)
(22500, 2004)
test: (22500, 2004)
Proteins for family fam_2
../dataset/families/fam_2/1HLB.lf_str.out
../dataset/families/fam_2/2LHB.lf_str.out
../dataset/families/fam_2/1DLW.lf_str.out
../dataset/families/fam_2/1ITH.lf_str.out
../dataset/families/fam_2/1ECA.lf_str.out
../dataset/families/fam_2/1ASH.lf_str.out
../dataset/families/fam_2/1MBA.lf_str.out
../dataset/families/fam_2/2HBG.lf_str.out
Counter({144: 20000, 154: 10000, 146: 10000, 113: 10000, 279: 10000, 133: 10000, 143: 10000})
(48000, 668, 3)
(48000, 2004)
train: (48000, 2004)
(12000, 668, 3)
(12000, 2004)
val: (12000, 2004)
(20000, 668, 3)
(20000, 2004)
test: (20000, 2004)
Proteins for family fam_3
../dataset/families/fam_3/2SAS.lf_str.out
../dataset/families/fam_3/1OMR.lf_str.out
../dataset/families/fam_3/1SRA.lf_str.out
../dataset/families/fam_3/1CB1.lf_str.out
../dataset/families/fam_3/1IQ3.lf_str.out
../datas

Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_137 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_273 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_274 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(90

Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_139 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_277 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_278 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train:

Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_141 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_281 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_282 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training

Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_143 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_285 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_286 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_136 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_271 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_272 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[15, 'fam_1', 22500, 88786, 26214, 88786, 0.4618795418154945, 1.0, 0.772052

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[15, 'fam_7', 15000, 117513, 4987, 117513, 0.7504878170811027, 1.0, 0.9592897959183674, 0.9796448979591836]
Evaluating family fam_8
Test for autoencoder on fam fam_8
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_143 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_285 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_286 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test f

Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_146 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_291 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_292 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20

Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_148 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_295 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_296 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
E

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_150 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_299 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_300 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_152 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_303 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_304 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_145 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_289 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_290 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test 

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[16, 'fam_5', 12499, 125000, 0, 125000, 1.0, 0.99992, 1.0, 0.99996]
Evaluating family fam_6
Test for autoencoder on fam fam_6
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_150 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_299 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_300 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for

(15000, 668, 3)
(15000, 2004)
test: (15000, 2004)
Proteins for family fam_8
../dataset/families/fam_8/1AF7.lf_str.out
../dataset/families/fam_8/1Y8C.lf_str.out
../dataset/families/fam_8/1DUS.lf_str.out
../dataset/families/fam_8/1F3L.lf_str.out
../dataset/families/fam_8/1YUB.lf_str.out
Counter({271: 10000, 243: 10000, 191: 10000, 318: 10000, 242: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Proteins for family fam_9
../dataset/families/fam_9/1EE6.lf_str.out
../dataset/families/fam_9/1VBL.lf_str.out
../dataset/families/fam_9/1BHE.lf_str.out
../dataset/families/fam_9/1RU4.lf_str.out
../dataset/families/fam_9/1QCX.lf_str.out
Counter({194: 10000, 413: 10000, 373: 10000, 397: 10000, 356: 10000})
(30000, 668, 3)
(30000, 2004)
train: (30000, 2004)
(7500, 668, 3)
(7500, 2004)
val: (7500, 2004)
(12500, 668, 3)
(12500, 2004)
test: (12500, 2004)
Training for family fam_1
train: (54000, 200

Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_156 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_311 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_312 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18

Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_158 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_315 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_316 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16

Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_7
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_160 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_319 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_320 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14

Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_9
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_162 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_323 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_324 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/2

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[17, 'fam_2', 19999, 115003, 2497, 115003, 0.8890024893314367, 0.99995, 0.9787489361702127, 0.9893494680851064]
Evaluating family fam_3
Test for autoencoder on fam fam_3
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_156 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_311 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_312 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Te

(54000, 668, 3)
(54000, 2004)
train: (54000, 2004)
(13500, 668, 3)
(13500, 2004)
val: (13500, 2004)
(22500, 668, 3)
(22500, 2004)
test: (22500, 2004)
Proteins for family fam_2
../dataset/families/fam_2/1HLB.lf_str.out
../dataset/families/fam_2/2LHB.lf_str.out
../dataset/families/fam_2/1DLW.lf_str.out
../dataset/families/fam_2/1ITH.lf_str.out
../dataset/families/fam_2/1ECA.lf_str.out
../dataset/families/fam_2/1ASH.lf_str.out
../dataset/families/fam_2/1MBA.lf_str.out
../dataset/families/fam_2/2HBG.lf_str.out
Counter({144: 20000, 154: 10000, 146: 10000, 113: 10000, 279: 10000, 133: 10000, 143: 10000})
(48000, 668, 3)
(48000, 2004)
train: (48000, 2004)
(12000, 668, 3)
(12000, 2004)
val: (12000, 2004)
(20000, 668, 3)
(20000, 2004)
test: (20000, 2004)
Proteins for family fam_3
../dataset/families/fam_3/2SAS.lf_str.out
../dataset/families/fam_3/1OMR.lf_str.out
../dataset/families/fam_3/1SRA.lf_str.out
../dataset/families/fam_3/1CB1.lf_str.out
../dataset/families/fam_3/1IQ3.lf_str.out
../datas

Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_164 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_327 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_328 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_3
train: (36000, 2004)
test(90

Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_166 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_331 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_332 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_5
train:

Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_168 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_335 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_336 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training

Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_170 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_339 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_340 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19

Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_163 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_325 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_326 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[18, 'fam_1', 22500, 99009, 15991, 99009, 0.5845522329895301, 1.0, 0.860947

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[18, 'fam_7', 15000, 117535, 4965, 117535, 0.7513148009015778, 1.0, 0.959469387755102, 0.9797346938775511]
Evaluating family fam_8
Test for autoencoder on fam fam_8
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_170 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_339 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_340 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test fo

Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_2
train: (48000, 2004)
test(12000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_173 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_345 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_346 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_4
train: (36000, 2004)
test(9000, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_175 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_349 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_350 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 36000 samples, validate on 9000 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_6
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_177 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_353 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_354 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 36000 samples, validate on 9000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Training for family fam_8
train: (30000, 2004)
test(7500, 2004)
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_179 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_357 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_358 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Train on 30000 samples, validate on 7500 samples
Epoch 1

Train on 30000 samples, validate on 7500 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Evaluating family fam_1
Test for autoencoder on fam fam_1
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_172 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_343 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_344 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test 

Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam_6
Test for fam fam_7
Test for fam fam_8
Test for fam fam_9
[19, 'fam_5', 12500, 125000, 0, 125000, 1.0, 1.0, 1.0, 1.0]
Evaluating family fam_6
Test for autoencoder on fam fam_6
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_177 (InputLayer)       (None, 2004)              0         
_________________________________________________________________
dense_353 (Dense)            (None, 25)                50125     
_________________________________________________________________
dense_354 (Dense)            (None, 2004)              52104     
Total params: 102,229
Trainable params: 102,229
Non-trainable params: 0
_________________________________________________________________
Test for fam fam_1
Test for fam fam_2
Test for fam fam_3
Test for fam fam_4
Test for fam fam_5
Test for fam fam