In [1]:
import torch
import torchvision

model = torchvision.models.alexnet(pretrained=False)
model.classifier[6] = torch.nn.Linear(model.classifier[6].in_features, 2)

In [2]:
model.load_state_dict(torch.load('best_model.pth'))

<All keys matched successfully>

In [3]:
device = torch.device('cuda')
model = model.to(device)

In [4]:
import cv2
import numpy as np

mean = 255.0 * np.array([0.485, 0.456, 0.406])
stdev = 255.0 * np.array([0.229, 0.224, 0.225])

normalize = torchvision.transforms.Normalize(mean, stdev)

def preprocess(camera_value):
    global device, normalize
    x = camera_value
    x = cv2.cvtColor(x, cv2.COLOR_BGR2RGB)
    x = x.transpose((2, 0, 1))
    x = torch.from_numpy(x).float()
    x = normalize(x)
    x = x.to(device)
    x = x[None, ...]
    return x

In [5]:
import traitlets
from IPython.display import display
import ipywidgets.widgets as widgets
from jetbot import Camera, bgr8_to_jpeg

camera = Camera.instance(width=224, height=224)
image = widgets.Image(format='jpeg', width=224, height=224)
blocked_slider = widgets.FloatSlider(description='no stop sign', min=0.0, max=1.0, orientation='vertical')

camera_link = traitlets.dlink((camera, 'value'), (image, 'value'), transform=bgr8_to_jpeg)

display(widgets.HBox([image, blocked_slider]))

HBox(children=(Image(value=b'\xff\xd8\xff\xe0\x00\x10JFIF\x00\x01\x01\x00\x00\x01\x00\x01\x00\x00\xff\xdb\x00Câ€¦

In [7]:
from jetbot import Robot

robot = Robot()

In [8]:
import torch.nn.functional as F
import datetime
import time

def update(change):
    global blocked_slider, robot
    x = change['new'] 
    x = preprocess(x)
    y = model(x)
    
    # we apply the `softmax` function to normalize the output vector so it sums to 1 (which makes it a probability distribution)
    y = F.softmax(y, dim=1)
    
    prob_blocked = float(y.flatten()[0])
    
    blocked_slider.value = prob_blocked
    
    if prob_blocked < 0.6:
        time.sleep(1)
        print('Stop sign detected', datetime.datetime.now().time())
        robot.stop()
        time.sleep(1)
        robot.forward(0.4)
    else:
        robot.forward(0.4)
    
    time.sleep(0.001)
        
update({'new': camera.value})  # we call the function once to intialize

In [9]:
camera.observe(update, names='value')  # this attaches the 'update' function to the 'value' traitlet of our camera

Stop sign detected 10:17:06.548156
Stop sign detected 10:17:08.700891
Stop sign detected 10:17:10.948844
Stop sign detected 10:17:13.155193
Stop sign detected 10:17:15.315805
Stop sign detected 10:17:17.605084
Stop sign detected 10:17:19.839466
Stop sign detected 10:17:22.031245
Stop sign detected 10:17:31.860919
Stop sign detected 10:17:35.634359
Stop sign detected 10:17:37.787503
Stop sign detected 10:17:40.058435
Stop sign detected 10:17:42.266535
Stop sign detected 10:17:44.828468
Stop sign detected 10:17:46.991645
Stop sign detected 10:17:49.089066
Stop sign detected 10:17:51.190256
Stop sign detected 10:17:53.292688
Stop sign detected 10:17:55.402427
Stop sign detected 10:17:57.499349
Stop sign detected 10:17:59.592697
Stop sign detected 10:18:01.706254
Stop sign detected 10:18:03.797072
Stop sign detected 10:18:05.894165
Stop sign detected 10:18:08.090757
Stop sign detected 10:18:10.258324
Stop sign detected 10:18:12.556181
Stop sign detected 10:18:14.664003
Stop sign detected 1

In [12]:
camera.unobserve(update, names='value')

time.sleep(0.1)  # add a small sleep to make sure frames have finished processing



ValueError: list.remove(x): x not in list

In [11]:
camera.stop()

In [13]:
robot.stop()