In [1]:
from torchvision.models import *
import wandb
from sklearn.model_selection import train_test_split
import os,cv2
import numpy as np
import matplotlib.pyplot as plt
from torch.nn import *
import torch,torchvision
from tqdm import tqdm
device = 'cuda'
PROJECT_NAME = 'Hutton-Rock-Dataset'

In [10]:
def load_data():
    data = []
    labels = {}
    labels_r = {}
    idx = 0
    for folder in os.listdir('./data/'):
        idx += 1
        labels[folder] = idx
        labels_r[idx] = folder
    print(labels)
    print(idx)
    for folder in tqdm(os.listdir('./data/')):
        print(folder)
        for file in tqdm(os.listdir(f'./data/{folder}')):
            try:
                img = cv2.imread(f'./data/{folder}/{file}')
                img = cv2.resize(img,(112,112))
                img = img / 255.0
                data.append([img,np.eye(labels[folder],idx)[labels[folder]-1]])
            except:
                pass
    X = []
    y = []
    for d in data:
        X.append(d[0])
        y.append(d[1])
    X_train,X_test,y_train,y_test = train_test_split(X,y,test_size=0.25,shuffle=False,random_state=2008)
    X_train = torch.from_numpy(np.array(X_train)).view(-1,3,112,112).to(device).float()
    X_test = torch.from_numpy(np.array(X_test)).view(-1,3,112,112).to(device).float()
    y_train = torch.from_numpy(np.array(y_train)).to(device).float()
    y_test = torch.from_numpy(np.array(y_test)).to(device).float()
    return X_train,X_test,y_train,y_test,X,y,labels,labels_r,idx,data

In [11]:
X_train,X_test,y_train,y_test,X,y,labels,labels_r,idx,data = load_data()

{'basalt': 1, 'granite': 2, 'andesite': 3}
3


  0%|                                                     | 0/3 [00:00<?, ?it/s]

basalt



  0%|                                                   | 0/122 [00:00<?, ?it/s][A
100%|████████████████████████████████████████| 122/122 [00:00<00:00, 430.78it/s][A
 33%|███████████████                              | 1/3 [00:00<00:00,  3.50it/s]

granite



  0%|                                                   | 0/187 [00:00<?, ?it/s][A
 24%|█████████▋                               | 44/187 [00:00<00:00, 414.77it/s][A
 48%|███████████████████▋                     | 90/187 [00:00<00:00, 437.89it/s][A
 72%|████████████████████████████▋           | 134/187 [00:00<00:00, 382.53it/s][A
100%|████████████████████████████████████████| 187/187 [00:00<00:00, 364.13it/s][A
 67%|██████████████████████████████               | 2/3 [00:00<00:00,  2.37it/s]

andesite



  0%|                                                    | 0/99 [00:00<?, ?it/s][A
 25%|██████████▌                               | 25/99 [00:00<00:00, 237.13it/s][A
 65%|███████████████████████████▏              | 64/99 [00:00<00:00, 319.08it/s][A
100%|██████████████████████████████████████████| 99/99 [00:00<00:00, 273.16it/s][A
100%|█████████████████████████████████████████████| 3/3 [00:01<00:00,  2.57it/s]


In [12]:
def get_loss(model,X,y,criterion):
    preds = model(X)
    loss = criterion(preds,y)
    return loss.item()

In [13]:
def get_accuracy(model,X,y):
    correct = 0
    total = 0
    preds = model(X)
    for pred,y_batch in zip(preds,y):
        pred = int(torch.argmax(pred))
        y_batch = int(torch.argmax(y_batch))
        if pred == y_batch:
            correct += 1
        total += 1
    acc = round(correct/total,3)*100
    return acc

In [21]:
model = resnet18().to(device)

In [22]:
model.fc

Linear(in_features=512, out_features=1000, bias=True)

In [23]:
model.fc = Linear(512,2)

In [24]:
model.fc

Linear(in_features=512, out_features=2, bias=True)

In [25]:
criterion = MSELoss()

In [27]:
optimizer = torch.optim.Adam(model.parameters(),lr=0.001)

In [28]:
batch_size = 32
epochs = 100

In [None]:
torch.cuda.empty_cache()
wandb.init(project=PROJECT_NAME,name='baseline')
torch.cuda.empty_cache()
for _ in tqdm(range(epochs)):
    torch.cuda.empty_cache()
    for i in range(0,len(X_train),batch_size):
        torch.cuda.empty_cache()
        X_batch = X_train[i:i+batch_size].to(device)
        y_batch = y_train[i:i+batch_size].to(device)
        preds = model(X_batch)
        loss = criterion(preds,y_batch)
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()
        torch.cuda.empty_cache()
    torch.cuda.empty_cache()
    wandb.log({'Loss':(get_loss(model,X_train,y_train,criterion)+get_loss(model,X_batch,y_batch,criterion))/2})
    torch.cuda.empty_cache()
    wandb.log({'Val Loss':get_loss(model,X_test,y_test,criterion)})
    torch.cuda.empty_cache()
    wandb.log({'Acc':(get_accuracy(model,X_train,y_train)+get_accuracy(model,X_batch,y_batch))/2})
    torch.cuda.empty_cache()
    wandb.log({'Val ACC':get_accuracy(model,X_test,y_test)})
    torch.cuda.empty_cache()
torch.cuda.empty_cache()
wandb.finish()
torch.cuda.empty_cache()

[34m[1mwandb[0m: Currently logged in as: [33mranuga-d[0m (use `wandb login --relogin` to force relogin)
