In [1]:
import torch
import torchvision

# Start from an AlexNet with no pretrained weights; the trained weights are
# loaded from a checkpoint afterwards.
model = torchvision.models.alexnet(pretrained=False)

# Swap the last classifier layer for a 2-output head, keeping the input width
# of the layer it replaces.
model.classifier[6] = torch.nn.Linear(
    in_features=model.classifier[6].in_features,
    out_features=2,
)

In [2]:
# Restore the trained weights. `map_location='cpu'` deserializes the tensors
# onto the CPU no matter which device they were saved from, so loading does not
# depend on (or temporarily allocate) GPU memory; the model is moved to its
# target device in a separate step.
# NOTE: torch.load unpickles the file -- only load checkpoints from a trusted source.
model.load_state_dict(torch.load('best_model.pth', map_location='cpu'))

<All keys matched successfully>

In [3]:
device = torch.device('cuda')

# Move the weights to the GPU and switch to evaluation mode. Without `.eval()`
# the Dropout layers in AlexNet's classifier stay active, so the same frame
# could yield different probabilities from one call to the next.
model = model.to(device).eval()

In [4]:
import cv2
import numpy as np

# Per-channel mean / standard deviation (the values commonly used for
# ImageNet-trained torchvision models), scaled by 255 so they can be applied
# directly to pixel values in the 0-255 range.
mean = np.array([0.485, 0.456, 0.406]) * 255.0
stdev = np.array([0.229, 0.224, 0.225]) * 255.0

# Transform that subtracts `mean` and divides by `stdev`, channel by channel.
normalize = torchvision.transforms.Normalize(mean=mean, std=stdev)

def preprocess(camera_value):
    """Turn a raw camera frame into a normalized, batched tensor on `device`.

    Steps: BGR -> RGB colour conversion, move the channel axis first
    (axis order (2, 0, 1)), convert to a float tensor, apply the module-level
    `normalize` transform, transfer to the module-level `device`, and prepend
    a batch dimension of size 1.

    Args:
        camera_value: 3-axis image array with channels on the last axis in
            BGR order (presumably HxWx3 uint8 as delivered by the camera --
            TODO confirm).

    Returns:
        A float tensor with a leading batch axis, located on `device`.
    """
    rgb_frame = cv2.cvtColor(camera_value, cv2.COLOR_BGR2RGB)
    channels_first = rgb_frame.transpose((2, 0, 1))
    # .float() produces a new float tensor rather than reusing the frame's buffer.
    tensor = torch.from_numpy(channels_first).float()
    tensor = normalize(tensor)
    return tensor.to(device).unsqueeze(0)

In [11]:
import traitlets
from IPython.display import display
import ipywidgets.widgets as widgets
from jetbot import Camera, bgr8_to_jpeg

# Camera handle requesting 224x224 frames (presumably chosen to match the
# classifier's input size -- TODO confirm).
camera = Camera.instance(width=224, height=224)

# Widgets: a JPEG preview of the camera feed and a vertical 0..1 slider that
# shows the model's 'no stop sign' probability.
image = widgets.Image(format='jpeg', width=224, height=224)
blocked_slider = widgets.FloatSlider(
    description='no stop sign',
    min=0.0,
    max=1.0,
    orientation='vertical',
)

# One-way link: every new camera frame is converted with bgr8_to_jpeg and
# pushed into the preview widget.
camera_link = traitlets.dlink(
    (camera, 'value'),
    (image, 'value'),
    transform=bgr8_to_jpeg,
)

display(widgets.HBox([image, blocked_slider]))

HBox(children=(Image(value=b'\xff\xd8\xff\xe0\x00\x10JFIF\x00\x01\x01\x00\x00\x01\x00\x01\x00\x00\xff\xdb\x00C…

In [12]:
import torch.nn.functional as F
import datetime
import time

def update(change):
    """Classify one camera frame and report the result.

    Written to be used as an observer callback on the camera's 'value'
    trait, but it can also be called directly with a dict of the same shape.

    Side effects: sets `blocked_slider.value` to the class-0 probability and
    prints a timestamped message when that probability drops below 0.5.

    Args:
        change: mapping whose 'new' entry holds the latest camera frame, in
            the format accepted by `preprocess`.
    """
    frame = change['new']
    batch = preprocess(frame)

    # Inference only: disable autograd so no computation graph is recorded
    # (and kept alive) for every incoming frame.
    with torch.no_grad():
        logits = model(batch)
        # we apply the `softmax` function to normalize the output vector so it
        # sums to 1 (which makes it a probability distribution)
        probs = F.softmax(logits, dim=1)

    # Class 0 is the 'no stop sign' class: the slider is labelled that way and
    # a low value is what triggers the detection message below.
    prob_no_stop_sign = float(probs.flatten()[0])

    blocked_slider.value = prob_no_stop_sign

    if prob_no_stop_sign < 0.5:
        print('Stop sign detected', datetime.datetime.now().time())

    # Brief pause kept from the original callback before returning.
    time.sleep(0.001)
        
# Run the callback once by hand, wrapping the current frame in the same
# {'new': ...} shape an observer notification carries.
update({'new': camera.value})  # we call the function once to initialize

In [13]:
# From here on, every change of camera.value invokes update(), so the
# detection messages below are printed as frames arrive.
camera.observe(update, names='value')  # this attaches the 'update' function to the 'value' traitlet of our camera

Stop sign detected 09:18:10.960712
Stop sign detected 09:18:11.357047
Stop sign detected 09:18:11.458355
Stop sign detected 09:18:11.561954
Stop sign detected 09:18:11.616127
Stop sign detected 09:18:12.080340
Stop sign detected 09:18:12.281796
Stop sign detected 09:18:12.331587
Stop sign detected 09:18:12.830153
Stop sign detected 09:18:12.946812
Stop sign detected 09:18:12.996973
Stop sign detected 09:18:13.665040
Stop sign detected 09:18:13.765056
Stop sign detected 09:18:13.916042
Stop sign detected 09:18:13.969808
Stop sign detected 09:18:14.026470
Stop sign detected 09:18:14.086385
Stop sign detected 09:18:14.142465
Stop sign detected 09:18:14.193093
Stop sign detected 09:18:14.243530
Stop sign detected 09:18:14.339590
Stop sign detected 09:18:14.391536
Stop sign detected 09:18:14.443418
Stop sign detected 09:18:14.492210
Stop sign detected 09:18:14.589492
Stop sign detected 09:18:14.787437
Stop sign detected 09:18:14.837631
Stop sign detected 09:18:14.887338
Stop sign detected 0

In [14]:
# Detach the callback so new camera frames no longer trigger update().
camera.unobserve(update, names='value')

time.sleep(0.1)  # add a small sleep to make sure frames have finished processing

Stop sign detected 09:18:56.413520
Stop sign detected 09:18:56.479174


In [15]:
# Stop the camera once the demo is finished (presumably halts frame capture
# and frees the device for other notebooks -- TODO confirm against jetbot.Camera).
camera.stop()