In [37]:
import torch
import torchvision
from torchvision import datasets
from torchvision import transforms
import ignite
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import cv2
import numpy as np
from tqdm import tqdm
from torch.utils.data import Dataset
import os, shutil
from natsort import natsorted
from PIL import Image

In [39]:
REBUILD_DATA = True # set to true to one once, then back to false unless you want to change something in your training data.
class VibroData():
    IMG_SIZE = 800
    DOWNS = "Train/downs"
    PEAKS = "Train/peaks"
    
    TESTING = "Test"
    LABELS = {DOWNS: 0, PEAKS: 1}
    training_data = []
    dcount = 0
    pcount = 0
    def make_training_data(self):
        for label in self.LABELS:
            print(label)
            for f in tqdm(os.listdir(label)):
                if "jpg" in f:
                    try:
                        path = os.path.join(label, f)
                        img = cv2.imread(path, cv2.IMREAD_GRAYSCALE)
                        img = cv2.resize(img, (self.IMG_SIZE, self.IMG_SIZE))
                        self.training_data.append([np.array(img), np.eye(2)[self.LABELS[label]]])  # do something like print(np.eye(2)[1]), just makes one_hot 
                        #print(np.eye(2)[self.LABELS[label]])
                        if label == self.DOWNS:
                            self.dcount += 1
                        elif label == self.PEAKS:
                            self.pcount += 1   
                    except Exception as e:
                        pass
                        #print(label, f, str(e))
        np.random.shuffle(self.training_data)
        np.save("training_data.npy", self.training_data)
        print('Downs:',VibroData.dcount)
        print('Peaks:',VibroData.pcount)
if REBUILD_DATA:
    Vibdata = VibroData()
    Vibdata.make_training_data() 


 45%|████▍     | 134/300 [00:00<00:00, 661.29it/s]

Train/downs


100%|██████████| 300/300 [00:00<00:00, 628.63it/s]
 44%|████▎     | 131/300 [00:00<00:00, 651.36it/s]

Train/peaks


100%|██████████| 300/300 [00:00<00:00, 610.91it/s]


Downs: 0
Peaks: 0


In [40]:
class Net(nn.Module):
    def __init__(self):
        super().__init__() # just run the init of parent class (nn.Module)
        self.conv1 = nn.Conv2d(1, 32, 5) # вход 1 изображение, выход 32 канала, ядро свертки размером 5x5
        self.conv2 = nn.Conv2d(32, 64, 5) # вход 32, так как выход первого слоя 32. Выход будет 64 канала, ядро свертки размером 5x5
        self.conv3 = nn.Conv2d(64, 128, 5)
        x = torch.randn(50,50).view(-1,1,50,50)
        self._to_linear = None
        self.convs(x)
        self.fc1 = nn.Linear(self._to_linear, 512) #выпрямление.
        self.fc2 = nn.Linear(512, 2) # 512 вход, 2 выход так как у нас два класса (собаки и кошки).
    def convs(self, x):
        # max pooling over 2x2
        x = F.max_pool2d(F.relu(self.conv1(x)), (2, 2))
        x = F.max_pool2d(F.relu(self.conv2(x)), (2, 2))
        x = F.max_pool2d(F.relu(self.conv3(x)), (2, 2))
        if self._to_linear is None:
            self._to_linear = x[0].shape[0]*x[0].shape[1]*x[0].shape[2]
        return x
    def forward(self, x):
        x = self.convs(x)
        x = x.view(-1, self._to_linear)  # .view is reshape ... this flattens X before 
        x = F.relu(self.fc1(x))
        x = self.fc2(x) # Это наш выходной слой. Функции активации тут нет.
        return F.softmax(x, dim=1)
net = Net()
print(net) 

Net(
  (conv1): Conv2d(1, 32, kernel_size=(5, 5), stride=(1, 1))
  (conv2): Conv2d(32, 64, kernel_size=(5, 5), stride=(1, 1))
  (conv3): Conv2d(64, 128, kernel_size=(5, 5), stride=(1, 1))
  (fc1): Linear(in_features=512, out_features=512, bias=True)
  (fc2): Linear(in_features=512, out_features=3, bias=True)
)


In [41]:
training_data = np.load("training_data.npy", allow_pickle=True)
print(len(training_data))

600


In [42]:
optimizer = optim.Adam(net.parameters(), lr=0.001)
loss_function = nn.MSELoss() 

In [43]:
X = torch.Tensor([i[0] for i in training_data]).view(-1,50,50)
X = X/255.0
y = torch.Tensor([i[1] for i in training_data])
VAL_PCT = 0.1  # lets reserve 10% of our data for validation
val_size = int(len(X)*VAL_PCT)
train_X = X[:-val_size]
train_y = y[:-val_size]
test_X = X[-val_size:]
test_y = y[-val_size:]

In [44]:
BATCH_SIZE = 100
EPOCHS = 1
for epoch in range(EPOCHS):
    for i in tqdm(range(0, len(train_X), BATCH_SIZE)): # from 0, to the len of x, stepping BATCH_SIZE at a time. [:50] ..for now just to dev
        #print(f"{i}:{i+BATCH_SIZE}")
        batch_X = train_X[i:i+BATCH_SIZE].view(-1, 1, 50, 50)
        batch_y = train_y[i:i+BATCH_SIZE]
        net.zero_grad()
        outputs = net(batch_X)
        loss = loss_function(outputs, batch_y)
        loss.backward()
        optimizer.step()    # Does the update
    print(f"Epoch: {epoch}. Loss: {loss}") 

  0%|          | 0/1383 [00:00<?, ?it/s]


RuntimeError: The size of tensor a (3) must match the size of tensor b (2) at non-singleton dimension 1

In [None]:
correct = 0
total = 0
with torch.no_grad():
    for i in tqdm(range(len(test_X))):
        real_class = torch.argmax(test_y[i])
        net_out = net(test_X[i].view(-1, 1, 50, 50))[0]  # returns a list, 
        predicted_class = torch.argmax(net_out)
        if predicted_class == real_class:
            correct += 1
        total += 1
print("Accuracy: ", round(correct/total, 3)) 