# load data

In [1]:
from glob import glob
import os
# Collect every .jpg path under ../dataset/wrist_xray, using the name of the
# containing sub-folder as the label of each image.
images = []
labels = []
# os.listdir and glob both return entries in arbitrary, platform-dependent
# order; sorting makes the collected lists identical from run to run.
for folder in sorted(os.listdir('../dataset/wrist_xray')):
    for pic in sorted(glob('../dataset/wrist_xray/{}/*.jpg'.format(folder))):
        images.append(pic)
        labels.append(folder)
        

In [2]:
import pandas as pd
# Pair each image path with its folder label in a two-column frame.
data = pd.DataFrame(zip(images, labels), columns=['img', 'label'])
# Encode the folder names as integer classes; any folder name other than
# these two maps to NaN.
data['label'] = data['label'].map({'Fracture': 0, 'Normal': 1})
# Shuffle the rows with a fixed seed so that Restart & Run All reproduces the
# same row order (an unseeded sample() gives a different order on every run).
data = data.sample(frac=1, random_state=42).reset_index(drop=True)
data.head()

Unnamed: 0,img,label
0,../dataset/wrist_xray/Normal\17.jpg,1
1,../dataset/wrist_xray/Normal\39.jpg,1
2,../dataset/wrist_xray/Normal\78.jpg,1
3,../dataset/wrist_xray/Normal\12.jpg,1
4,../dataset/wrist_xray/Normal\72.jpg,1


# Top 5 lightest models in torchvision (by parameter count)
1	squeezenet1_1	1235496  
2	shufflenet_v2_x0_5	1366792  
3	mnasnet0_5	2218512  
4	mobilenet_v2	3504872  
5	densenet121	7978856

In [3]:
import sys
# Make ../src importable (presumably where the `models` package and
# `cross_vals` module imported in the next cell live). The membership check
# keeps sys.path free of duplicate entries when this cell is re-run.
if "../src" not in sys.path:
    sys.path.append("../src")

In [4]:
from models.squeezenet import squeezenet1_1
from models.mymodels import mymodel1,mymodel2,mymodel3,mymodel4
from models.shufflenet import shufflenet_v2_x0_5
from models.mnastnet import mnasnet0_5
from models.densenet import densenet121
from models.mobilenet import mobilenet
from cross_vals import kfoldcv

In [5]:
def count_parameters(model):
    """Return the number of trainable parameters of ``model``, in millions.

    Only parameters whose ``requires_grad`` flag is truthy are counted; the
    total element count is divided by 1e6 before being returned.
    """
    trainable = 0
    for param in model.parameters():
        if param.requires_grad:
            trainable += param.numel()
    return trainable / 1e6

  and should_run_async(code)


In [6]:
# Report the trainable-parameter count (in millions) of each custom network.
for tag, build in (('MyNet1', mymodel1), ('MyNet2', mymodel2),
                   ('MyNet3', mymodel3), ('MyNet4', mymodel4)):
    print(tag + ' parameters :', count_parameters(build()))



MyNet1 parameters : 1.158232
MyNet2 parameters : 1.158232
MyNet3 parameters : 1.157848
MyNet4 parameters : 1.157848


In [7]:
# Training settings passed to every kfoldcv call below:
# number of epochs, mini-batch size, learning rate.
epoch, batchsize, lr = 32, 8, 0.001

Arguments of `kfoldcv` used below:

- `dim='3D'` or `dim='2D'`: for 3D images and 2D images, respectively
- `skip_tuning=False`: no grid search applied for hyper-parameter tuning
- `aug=1` -> PyTorch augmentation
- `aug=0` -> no augmentation
- `aug=2` -> albumentation augmentation
- `aug=3` -> rand augmentation

# MyNet

In [8]:
%%time
train_cv,clf_report=kfoldcv(model=mymodel1(),epochs=epoch,batchsize=batchsize,data=data,\
                            lr=lr,skip_tuning=False,aug=1,dim='2D',pca=False)
for clf in ['Decision Tree','SVM',"logistic regression",'K Nearest neighbors','autoML']:
    print('------------------',clf,'----------------')
    print(clf_report[0][clf][0])
    
print('--------------------------Accuracy Table-----------------------------------')
clf_report[1]

------------------ Decision Tree ----------------
          precision  recall  f1-score
Class 0       0.786   0.788     0.780
Class 1       0.700   0.696     0.684
macro         0.742   0.742     0.732
weighted      0.756   0.740     0.738
------------------ SVM ----------------
          precision  recall  f1-score
Class 0       0.762   0.828     0.790
Class 1       0.756   0.648     0.686
macro         0.760   0.738     0.736
weighted      0.766   0.750     0.748
------------------ logistic regression ----------------
          precision  recall  f1-score
Class 0       0.790   0.830     0.806
Class 1       0.778   0.702     0.720
macro         0.786   0.764     0.760
weighted      0.792   0.772     0.768
------------------ K Nearest neighbors ----------------
          precision  recall  f1-score
Class 0       0.800   0.796     0.792
Class 1       0.720   0.714     0.704
macro         0.760   0.756     0.748
weighted      0.772   0.758     0.754
------------------ autoML ------------

Unnamed: 0,DT,SVM,LR,KNN,ML
0,0.69,0.67,0.72,0.69,0.74
1,0.64,0.79,0.77,0.69,0.9
2,0.82,0.79,0.79,0.85,0.87
3,0.79,0.74,0.79,0.82,0.87
4,0.76,0.76,0.79,0.74,0.82
mean,0.74,0.75,0.772,0.758,0.84


In [9]:
%%time
train_cv,clf_report=kfoldcv(model=mymodel2(),epochs=epoch,batchsize=batchsize,data=data,\
                            lr=lr,skip_tuning=False,aug=1,dim='2D',pca=False)
for clf in ['Decision Tree','SVM',"logistic regression",'K Nearest neighbors','autoML']:
    print('------------------',clf,'----------------')
    print(clf_report[0][clf][0])
    
print('--------------------------Accuracy Table-----------------------------------')
clf_report[1]

------------------ Decision Tree ----------------
          precision  recall  f1-score
Class 0       0.748   0.758     0.740
Class 1       0.678   0.644     0.642
macro         0.712   0.700     0.692
weighted      0.722   0.706     0.700
------------------ SVM ----------------
          precision  recall  f1-score
Class 0       0.748   0.712     0.726
Class 1       0.636   0.670     0.646
macro         0.690   0.690     0.686
weighted      0.704   0.696     0.694
------------------ logistic regression ----------------
          precision  recall  f1-score
Class 0       0.698   0.764     0.730
Class 1       0.638   0.548     0.582
macro         0.668   0.660     0.654
weighted      0.676   0.676     0.668
------------------ K Nearest neighbors ----------------
          precision  recall  f1-score
Class 0       0.726   0.748     0.730
Class 1       0.638   0.614     0.614
macro         0.682   0.682     0.674
weighted      0.698   0.688     0.682
------------------ autoML ------------

Unnamed: 0,DT,SVM,LR,KNN,ML
0,0.64,0.72,0.62,0.67,0.72
1,0.67,0.67,0.62,0.62,0.69
2,0.69,0.67,0.67,0.59,0.77
3,0.71,0.68,0.71,0.74,0.76
4,0.82,0.74,0.76,0.82,0.82
mean,0.706,0.696,0.676,0.688,0.752


In [10]:
%%time
train_cv,clf_report=kfoldcv(model=mymodel3(),epochs=epoch,batchsize=batchsize,data=data,\
                            lr=lr,skip_tuning=False,aug=1,dim='2D',pca=False)
for clf in ['Decision Tree','SVM',"logistic regression",'K Nearest neighbors','autoML']:
    print('------------------',clf,'----------------')
    print(clf_report[0][clf][0])
    
print('--------------------------Accuracy Table-----------------------------------')
clf_report[1]

------------------ Decision Tree ----------------
          precision  recall  f1-score
Class 0       0.852   0.858     0.854
Class 1       0.802   0.798     0.794
macro         0.826   0.828     0.822
weighted      0.836   0.830     0.828
------------------ SVM ----------------
          precision  recall  f1-score
Class 0       0.944   0.864     0.898
Class 1       0.834   0.928     0.876
macro         0.888   0.894     0.888
weighted      0.900   0.890     0.892
------------------ logistic regression ----------------
          precision  recall  f1-score
Class 0       0.918   0.856     0.882
Class 1       0.816   0.890     0.848
macro         0.866   0.874     0.866
weighted      0.878   0.870     0.870
------------------ K Nearest neighbors ----------------
          precision  recall  f1-score
Class 0       0.916   0.894     0.904
Class 1       0.856   0.894     0.874
macro         0.888   0.896     0.888
weighted      0.896   0.890     0.892
------------------ autoML ------------

Unnamed: 0,DT,SVM,LR,KNN,ML
0,0.72,0.9,0.87,0.85,0.92
1,0.9,0.9,0.85,0.92,0.9
2,0.92,0.92,0.92,0.92,0.95
3,0.82,0.89,0.89,0.89,0.89
4,0.79,0.84,0.82,0.87,0.89
mean,0.83,0.89,0.87,0.89,0.91


In [11]:
%%time
train_cv,clf_report=kfoldcv(model=mymodel4(),epochs=epoch,batchsize=batchsize,data=data,\
                            lr=lr,skip_tuning=False,aug=1,dim='2D',pca=False)
for clf in ['Decision Tree','SVM',"logistic regression",'K Nearest neighbors','autoML']:
    print('------------------',clf,'----------------')
    print(clf_report[0][clf][0])
    
print('--------------------------Accuracy Table-----------------------------------')
clf_report[1]

------------------ Decision Tree ----------------
          precision  recall  f1-score
Class 0       0.860   0.790     0.820
Class 1       0.770   0.830     0.790
macro         0.818   0.812     0.806
weighted      0.828   0.808     0.808
------------------ SVM ----------------
          precision  recall  f1-score
Class 0       0.832   0.792     0.806
Class 1       0.758   0.786     0.760
macro         0.796   0.790     0.784
weighted      0.808   0.788     0.790
------------------ logistic regression ----------------
          precision  recall  f1-score
Class 0       0.848   0.828     0.832
Class 1       0.794   0.796     0.782
macro         0.820   0.812     0.808
weighted      0.830   0.814     0.812
------------------ K Nearest neighbors ----------------
          precision  recall  f1-score
Class 0       0.854   0.812     0.826
Class 1       0.784   0.804     0.778
macro         0.820   0.808     0.804
weighted      0.832   0.808     0.808
------------------ autoML ------------

Unnamed: 0,DT,SVM,LR,KNN,ML
0,0.77,0.77,0.77,0.77,0.79
1,0.9,0.87,0.87,0.85,0.92
2,0.77,0.72,0.82,0.87,0.9
3,0.76,0.76,0.79,0.76,0.87
4,0.84,0.82,0.82,0.79,0.89
mean,0.808,0.788,0.814,0.808,0.874
