In [1]:
# Export the Guild run comparison table to results_quality.csv; the cells
# below load that file with pandas.
!guild compare --csv results_quality.csv

Wrote 52 row(s) to results_quality.csv


In [2]:
import pandas as pd

In [3]:
# Load the exported run comparison table (one row per run).
df = pd.read_csv(filepath_or_buffer='results_quality.csv')

In [4]:
# List every column in the exported table before trimming it down.
df.columns

Index(['run', 'operation', 'started', 'time', 'status', 'label', 'base_loss',
       'batch_size', 'csv_train', 'decay_f', 'exp', 'lambd', 'load_checkpoint',
       'lr', 'metric', 'model_name', 'n_classes', 'n_epochs', 'optimizer',
       'oversample', 'patience', 'pretrained', 'save_model', 'step', 'acc',
       'auc', 'kappa'],
      dtype='object')

In [5]:
# Keep only the columns used in the analysis below: the training CSV (used to
# split the runs per task), the loss / learning rate / model settings, and the
# acc / auc / kappa metrics.
# Selecting the columns to keep (instead of dropping the unwanted ones from the
# reassigned `df`) makes this cell safe to re-run: a second execution no longer
# raises KeyError for columns that were already removed.
df = df[['base_loss', 'csv_train', 'lr', 'model_name', 'acc', 'auc', 'kappa']]

In [6]:
# Check which columns remain after trimming the table.
df.columns

Index(['base_loss', 'csv_train', 'lr', 'model_name', 'acc', 'auc', 'kappa'], dtype='object')

In [7]:
# Runs trained on train_clarity.csv; csv_train is constant after the filter,
# so it is removed from the result.
df_clarity = (
    df.loc[df['csv_train'] == 'train_clarity.csv']
    .drop(columns=['csv_train'])
)

In [8]:
# Runs trained on train_quality.csv; csv_train is constant after the filter,
# so it is removed, and the kappa column is removed for this task as well.
df_quality = (
    df.loc[df['csv_train'] == 'train_quality.csv']
    .drop(columns=['csv_train', 'kappa'])
)

In [9]:
# Runs trained on train_field_def.csv; csv_train is constant after the filter,
# so it is removed from the result.
df_field_def = (
    df.loc[df['csv_train'] == 'train_field_def.csv']
    .drop(columns=['csv_train'])
)

In [10]:
# Runs trained on train_artifact.csv; csv_train is constant after the filter,
# so it is removed from the result.
df_field_artifact = (
    df.loc[df['csv_train'] == 'train_artifact.csv']
    .drop(columns=['csv_train'])
)

# Analyzing Quality Results

In [11]:
# Five best quality runs, ranked by AUC (highest first).
(
    df_quality
    .sort_values('auc', ascending=False)
    .head(5)
)

Unnamed: 0,base_loss,lr,model_name,acc,auc
42,ce,0.0001,resnext50_sws,0.76,0.838402
44,ce,0.0001,resnet50_sws,0.775,0.835022
43,ce,0.0001,resnext50,0.745,0.833455
45,ce,0.0001,resnet50,0.735,0.830949
34,focal_loss,0.0001,resnext50_sws,0.7475,0.828232


In [12]:
# Five best quality runs, ranked by accuracy (highest first).
(
    df_quality
    .sort_values('acc', ascending=False)
    .head(5)
)

Unnamed: 0,base_loss,lr,model_name,acc,auc
44,ce,0.0001,resnet50_sws,0.775,0.835022
49,ce,0.001,resnet50,0.7675,0.824613
42,ce,0.0001,resnext50_sws,0.76,0.838402
34,focal_loss,0.0001,resnext50_sws,0.7475,0.828232
36,focal_loss,0.0001,resnet50_sws,0.7475,0.820847


### Conclusions
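* Training with lr=0.0001 works best: all of the top-5 runs by AUC and four of the top-5 runs by accuracy use it.
* Training with ce (cross-entropy) also seems better than focal loss: the top four runs by AUC and the top three runs by accuracy all use ce.
* resnext50_sws looks like the best model (1st in AUC, 3rd in accuracy).
* resnet50_sws is also very good (2nd in AUC, 1st in accuracy), but we trust AUC more at this point.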

# Analyzing Clarity Results

In [13]:
# Ten best clarity runs, ranked by AUC (highest first).
(
    df_clarity
    .sort_values('auc', ascending=False)
    .head(10)
)

Unnamed: 0,base_loss,lr,model_name,acc,auc,kappa
5,focal_loss,0.001,resnext50,0.58,0.871427,0.738754
8,ce,0.0001,resnext50_sws,0.53,0.866204,0.74666
9,ce,0.0001,resnext50,0.5325,0.864844,0.746635
0,focal_loss,0.0001,resnext50_sws,0.545,0.862738,0.771517
1,focal_loss,0.0001,resnext50,0.5275,0.860815,0.74515
3,focal_loss,0.0001,resnet50,0.5625,0.860022,0.74467
12,ce,0.001,resnext50_sws,0.56,0.859043,0.716096
13,ce,0.001,resnext50,0.5775,0.857485,0.724669
4,focal_loss,0.001,resnext50_sws,0.53,0.856989,0.720102
6,focal_loss,0.001,resnet50_sws,0.54,0.85667,0.729781


In [14]:
# Ten best clarity runs, ranked by accuracy (highest first).
(
    df_clarity
    .sort_values('acc', ascending=False)
    .head(10)
)

Unnamed: 0,base_loss,lr,model_name,acc,auc,kappa
5,focal_loss,0.001,resnext50,0.58,0.871427,0.738754
13,ce,0.001,resnext50,0.5775,0.857485,0.724669
3,focal_loss,0.0001,resnet50,0.5625,0.860022,0.74467
7,focal_loss,0.001,resnet50,0.56,0.856247,0.723526
12,ce,0.001,resnext50_sws,0.56,0.859043,0.716096
10,ce,0.0001,resnet50_sws,0.5575,0.851869,0.728541
2,focal_loss,0.0001,resnet50_sws,0.5525,0.855901,0.75722
0,focal_loss,0.0001,resnext50_sws,0.545,0.862738,0.771517
15,ce,0.001,resnet50,0.5425,0.851844,0.709565
6,focal_loss,0.001,resnet50_sws,0.54,0.85667,0.729781
