In [16]:
import torch
import torchvision

# Build an AlexNet without pretrained weights; the trained weights are loaded
# from disk in a later cell.
model = torchvision.models.alexnet(pretrained=False)

# Swap the last classifier layer for a 2-output linear layer that keeps the
# same number of input features.
model.classifier[6] = torch.nn.Linear(
    in_features=model.classifier[6].in_features,
    out_features=2,
)

In [17]:
# Load the weights stored in 'best_model.pth' into the model. The call is left
# as the cell's last expression so its result (the key-matching report) is shown.
# NOTE(review): torch.load unpickles the file - only load checkpoints you trust.
model.load_state_dict(torch.load('best_model.pth'))

<All keys matched successfully>

In [18]:
# Run inference on the GPU.
device = torch.device('cuda')

# Move the weights to the GPU and switch to evaluation mode. AlexNet's
# classifier contains Dropout layers; a freshly built module is in training
# mode, where Dropout randomly zeroes activations, so the same frame would give
# different (and degraded) predictions on every call. `.to()` and `.eval()`
# both return the module itself, so the chained assignment keeps `model` bound
# to the same object.
model = model.to(device).eval()

In [19]:
import cv2
import numpy as np

# Per-channel mean and standard deviation, scaled by 255 so they can be applied
# directly to pixel values that have not been divided by 255.
mean = np.array([0.485, 0.456, 0.406]) * 255.0
stdev = np.array([0.229, 0.224, 0.225]) * 255.0

# Transform that subtracts `mean` and divides by `stdev` channel-wise.
normalize = torchvision.transforms.Normalize(mean=mean, std=stdev)

def preprocess(camera_value):
    """Convert one camera frame into a model-ready tensor.

    The frame is converted from BGR to RGB, its last axis (channels) is moved
    to the front, and it is cast to float32. It is then normalized with the
    module-level ``normalize`` transform, moved to the module-level ``device``,
    and given a leading batch axis of size 1.

    Args:
        camera_value: image array as delivered by the camera (BGR channel
            order, channels on the last axis).

    Returns:
        A float tensor on ``device`` with one extra leading dimension.
    """
    rgb = cv2.cvtColor(camera_value, cv2.COLOR_BGR2RGB)
    # Channels-last -> channels-first, then numpy -> float32 tensor.
    channels_first = torch.from_numpy(rgb.transpose((2, 0, 1))).float()
    # Normalize on the CPU, transfer to the device, then add the batch axis.
    return normalize(channels_first).to(device)[None, ...]

In [20]:
import traitlets
from IPython.display import display
import ipywidgets.widgets as widgets
from jetbot import Camera, bgr8_to_jpeg

# Camera singleton delivering 224x224 frames.
camera = Camera.instance(width=224, height=224)

# Preview widget (same 224x224 size as the camera frames) and a vertical
# 0..1 gauge that is filled in by the `update` callback.
image = widgets.Image(format='jpeg', width=224, height=224)
blocked_slider = widgets.FloatSlider(
    description='no stop sign',
    min=0.0,
    max=1.0,
    orientation='vertical',
)

# One-way link: every new camera frame is JPEG-encoded and pushed to the
# preview widget.
camera_link = traitlets.dlink(
    (camera, 'value'),
    (image, 'value'),
    transform=bgr8_to_jpeg,
)

# Show the preview and the gauge side by side.
display(widgets.HBox([image, blocked_slider]))

HBox(children=(Image(value=b'\xff\xd8\xff\xe0\x00\x10JFIF\x00\x01\x01\x00\x00\x01\x00\x01\x00\x00\xff\xdb\x00C…

In [21]:
import torch.nn.functional as F
import datetime
import time

def update(change):
    """Classify one camera frame and report the result.

    Intended as a traitlets observer for the camera's ``value`` trait, but it
    can also be called directly with ``{'new': frame}``.

    Args:
        change: mapping whose ``'new'`` entry is the frame to classify.

    Side effects:
        Sets ``blocked_slider.value`` to the probability of class index 0 (the
        slider is labelled 'no stop sign') and prints a timestamped message
        when that probability is below 0.5.
    """
    frame = change['new']

    # Pure inference: disable autograd so no graph is built and no intermediate
    # activations are retained for every frame.
    with torch.no_grad():
        logits = model(preprocess(frame))
        # softmax normalizes the output vector so it sums to 1 (a probability
        # distribution over the two classes)
        probs = F.softmax(logits, dim=1)

    prob_no_stop_sign = float(probs.flatten()[0])

    blocked_slider.value = prob_no_stop_sign

    if prob_no_stop_sign < 0.5:
        print('Stop sign detected', datetime.datetime.now().time())

    # Brief pause before returning control to the camera callback machinery.
    time.sleep(0.001)
        
update({'new': camera.value})  # we call the function once to initialize

Stop sign detected 09:37:11.696549


In [22]:
# Attach 'update' as an observer of the camera's 'value' traitlet, so it is
# called with a change dict each time that trait changes.
camera.observe(update, names='value')

Stop sign detected 09:37:14.094133
Stop sign detected 09:37:14.165754
Stop sign detected 09:37:14.222126
Stop sign detected 09:37:14.275694
Stop sign detected 09:37:14.326501
Stop sign detected 09:37:14.378157
Stop sign detected 09:37:14.426949
Stop sign detected 09:37:14.475773
Stop sign detected 09:37:14.522794
Stop sign detected 09:37:14.572893
Stop sign detected 09:37:14.624861
Stop sign detected 09:37:14.673532
Stop sign detected 09:37:14.720717
Stop sign detected 09:37:14.770731
Stop sign detected 09:37:14.821144
Stop sign detected 09:37:14.868712
Stop sign detected 09:37:14.917705
Stop sign detected 09:37:14.966097
Stop sign detected 09:37:15.016389
Stop sign detected 09:37:15.067868
Stop sign detected 09:37:15.116299
Stop sign detected 09:37:15.170731
Stop sign detected 09:37:15.219082
Stop sign detected 09:37:15.265552
Stop sign detected 09:37:15.314086
Stop sign detected 09:37:15.363154
Stop sign detected 09:37:15.412187
Stop sign detected 09:37:15.459847
Stop sign detected 0

In [23]:
# Detach the 'update' observer from the camera's 'value' traitlet so no further
# frames are classified.
camera.unobserve(update, names='value')

# Short pause so callbacks that are already running can finish (the recorded
# output shows detections still being printed after this cell was run).
time.sleep(0.1)

Stop sign detected 09:38:42.046249
Stop sign detected 09:38:42.105981


In [24]:
# Stop the camera once the demo is finished.
# NOTE(review): presumably this releases the capture device for other
# notebooks - confirm against the jetbot Camera implementation.
camera.stop()