In [99]:
import cv2
# import matplotlib
# import matplotlib.pyplot as plt
import numpy as np
import glob
import torch
import torch.nn as nn 
import time
import math
# import torch.nn.functional as F
import onnx

In [100]:
# --------------------------------------------------------
# DaSiamRPN
# Licensed under The MIT License
# Written by Qiang Wang (wangqiang2015 at ia.ac.cn)
# --------------------------------------------------------
import torch.nn as nn
import torch.nn.functional as F

size = 1
configs = [3, 96, 256, 384, 384, 256]
configs = list(map(lambda x: 3 if x==3 else x*size, configs))
feat_in = configs[-1]
feature_out = 256
anchor=5
class SiamRPN(nn.Module):
    def __init__(self):
#     def __init__(self, size=2, feature_out=512, anchor=5):
        
        super(SiamRPN, self).__init__()
        self.featureExtract = nn.Sequential(
            nn.Conv2d(configs[0], configs[1] , kernel_size=11, stride=2),
            nn.BatchNorm2d(configs[1]),
            nn.MaxPool2d(kernel_size=3, stride=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[1], configs[2], kernel_size=5),
            nn.BatchNorm2d(configs[2]),
            nn.MaxPool2d(kernel_size=3, stride=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[2], configs[3], kernel_size=3),
            nn.BatchNorm2d(configs[3]),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[3], configs[4], kernel_size=3),
            nn.BatchNorm2d(configs[4]),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[4], configs[5], kernel_size=3),
            nn.BatchNorm2d(configs[5]),
        )

        self.anchor = anchor
        self.feature_out = feature_out

        self.conv_r1 = nn.Conv2d(feat_in, feature_out*4*anchor, 3)
        self.conv_r2 = nn.Conv2d(feat_in, feature_out, 3)
        self.conv_cls1 = nn.Conv2d(feat_in, feature_out*2*anchor, 3)
        self.conv_cls2 = nn.Conv2d(feat_in, feature_out, 3)
        self.regress_adjust = nn.Conv2d(4*anchor, 4*anchor, 1)

#         self.r1_kernel = []
#         self.cls1_kernel = []

        self.cfg = {}

    def forward(self, x):
        x_f = self.featureExtract(x)
        return self.regress_adjust(F.conv2d(self.conv_r2(x_f), self.r1_kernel)), \
               F.conv2d(self.conv_cls2(x_f), self.cls1_kernel)

    def temple(self, z):
        z_f = self.featureExtract(z)
        r1_kernel_raw = self.conv_r1(z_f)
        cls1_kernel_raw = self.conv_cls1(z_f)
        kernel_size = r1_kernel_raw.data.size()[-1]
        self.r1_kernel = r1_kernel_raw.view(self.anchor*4, self.feature_out, kernel_size, kernel_size)
        self.cls1_kernel = cls1_kernel_raw.view(self.anchor*2, self.feature_out, kernel_size, kernel_size)


class SiamRPNBIG(SiamRPN):
    def __init__(self):
        super(SiamRPNBIG, self).__init__(size=2) 
        # self.cfg = {'lr':0.295, 'window_influence': 0.42, 'penalty_k': 0.055, 'instance_size': 271, 'adaptive': True} # 0.383
        self.cfg = {'lr':0.295, 'window_influence': 0.42, 'penalty_k': 0.055, 'instance_size': 271, 'adaptive': True} # 0.383


class SiamRPNvot(SiamRPN):
    def __init__(self):
        super(SiamRPNvot, self).__init__(size=1, feature_out=256)
        self.cfg = {'lr':0.45, 'window_influence': 0.44, 'penalty_k': 0.04, 'instance_size': 271, 'adaptive': True} # 0.355


class SiamRPNotb(SiamRPN):
    def __init__(self):
        super(SiamRPNotb, self).__init__()#size=1, feature_out=256)
        self.cfg = {'lr': 0.30, 'window_influence': 0.40, 'penalty_k': 0.22, 'instance_size': 271, 'adaptive': True} # 0.655


In [101]:
net = SiamRPNotb()
net.eval()
net.cuda()
z = torch.randn(1,3,127,127).cuda()
net.temple(z)
x = torch.randn(1,3,271,271).cuda()
delta, score = net(x)

    

In [103]:
delta = delta.permute(1, 2, 3, 0).contiguous().view(4, -1)

In [112]:
score.shape

torch.Size([1, 10, 19, 19])

In [None]:
delta = delta.permute(1, 2, 3, 0).contiguous().view(4, -1).data.cpu().numpy()

In [5]:
# --------------------------------------------------------
# DaSiamRPN
# Licensed under The MIT License
# Written by Qiang Wang (wangqiang2015 at ia.ac.cn)
# --------------------------------------------------------
import torch.nn as nn
import torch.nn.functional as F

size = 1
configs = [3, 96, 256, 384, 384, 256]
configs = list(map(lambda x: 3 if x==3 else x*size, configs))
feat_in = configs[-1]
feature_out = 256
anchor=5
class Temple(nn.Module):
    def __init__(self):        
        super(Temple, self).__init__()
        self.cfg = {'lr': 0.30, 'window_influence': 0.40, 'penalty_k': 0.22, 'instance_size': 271, 'adaptive': True} # 0.655

        self.featureExtract = nn.Sequential(
            nn.Conv2d(configs[0], configs[1] , kernel_size=11, stride=2),
            nn.BatchNorm2d(configs[1]),
            nn.MaxPool2d(kernel_size=3, stride=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[1], configs[2], kernel_size=5),
            nn.BatchNorm2d(configs[2]),
            nn.MaxPool2d(kernel_size=3, stride=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[2], configs[3], kernel_size=3),
            nn.BatchNorm2d(configs[3]),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[3], configs[4], kernel_size=3),
            nn.BatchNorm2d(configs[4]),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[4], configs[5], kernel_size=3),
            nn.BatchNorm2d(configs[5]),
        )

        self.anchor = anchor
        self.feature_out = feature_out

        self.conv_r1 = nn.Conv2d(feat_in, feature_out*4*anchor, 3)
        self.conv_r2 = nn.Conv2d(feat_in, feature_out, 3)
        self.conv_cls1 = nn.Conv2d(feat_in, feature_out*2*anchor, 3)
        self.conv_cls2 = nn.Conv2d(feat_in, feature_out, 3)
        self.regress_adjust = nn.Conv2d(4*anchor, 4*anchor, 1)

        

    def forward(self, z):
        with torch.no_grad():
            z_f = self.featureExtract(z)
            r1_kernel_raw = self.conv_r1(z_f)
            cls1_kernel_raw = self.conv_cls1(z_f)
            kernel_size = r1_kernel_raw.data.size()[-1]
            r1_kernel = r1_kernel_raw.view(self.anchor*4, self.feature_out, kernel_size, kernel_size)
            cls1_kernel = cls1_kernel_raw.view(self.anchor*2, self.feature_out, kernel_size, kernel_size)
        return r1_kernel,cls1_kernel


In [7]:
model = Temple()
model.load_state_dict(torch.load('SiamRPNOTB.model'))
z = torch.randn(1,3,127,127).cuda()
model.eval()
model.cuda()
ONNX_FILE_PATH = "temple.onnx"

# torch.onnx.export(model, z, ONNX_FILE_PATH, input_names=["z"], output_names=["zf"], export_params=True)

torch.onnx.export(model, z, ONNX_FILE_PATH, input_names=["z"], output_names=["r1_kernel","cls1_kernel"], export_params=True)


In [8]:
r1_kernel,cls1_kernel = model(z)

In [6]:

size = 1
configs = [3, 96, 256, 384, 384, 256]
configs = list(map(lambda x: 3 if x==3 else x*size, configs))
feat_in = configs[-1]
feature_out = 256
anchor=5
class SiamRPN(nn.Module):
    def __init__(self):
#     def __init__(self, size=2, feature_out=512, anchor=5):
        
        super(SiamRPN, self).__init__()
        self.featureExtract = nn.Sequential(
            nn.Conv2d(configs[0], configs[1] , kernel_size=11, stride=2),
            nn.BatchNorm2d(configs[1]),
            nn.MaxPool2d(kernel_size=3, stride=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[1], configs[2], kernel_size=5),
            nn.BatchNorm2d(configs[2]),
            nn.MaxPool2d(kernel_size=3, stride=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[2], configs[3], kernel_size=3),
            nn.BatchNorm2d(configs[3]),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[3], configs[4], kernel_size=3),
            nn.BatchNorm2d(configs[4]),
            nn.ReLU(inplace=True),
            nn.Conv2d(configs[4], configs[5], kernel_size=3),
            nn.BatchNorm2d(configs[5]),
        )

        self.anchor = anchor
        self.feature_out = feature_out

        self.conv_r1 = nn.Conv2d(feat_in, feature_out*4*anchor, 3)
        self.conv_r2 = nn.Conv2d(feat_in, feature_out, 3)
        self.conv_cls1 = nn.Conv2d(feat_in, feature_out*2*anchor, 3)
        self.conv_cls2 = nn.Conv2d(feat_in, feature_out, 3)
        self.regress_adjust = nn.Conv2d(4*anchor, 4*anchor, 1)

#         self.r1_kernel = []
#         self.cls1_kernel = []

        self.cfg = {}

    def forward(self, x):
        x_f = self.featureExtract(x)
        return self.conv_r2(x_f),self.conv_cls2(x_f)
#         return self.regress_adjust(F.conv2d(self.conv_r2(x_f), self.r1_kernel)), \
#                F.conv2d(self.conv_cls2(x_f), self.cls1_kernel)
    
        
#     def temple(self, z):
#         z_f = self.featureExtract(z)
#         r1_kernel_raw = self.conv_r1(z_f)
#         cls1_kernel_raw = self.conv_cls1(z_f)
#         kernel_size = r1_kernel_raw.data.size()[-1]
#         self.r1_kernel = r1_kernel_raw.view(self.anchor*4, self.feature_out, kernel_size, kernel_size)
#         self.cls1_kernel = cls1_kernel_raw.view(self.anchor*2, self.feature_out, kernel_size, kernel_size)


In [10]:
model = SiamRPN()
model.load_state_dict(torch.load('SiamRPNOTB.model'))
x = torch.randn(1,3,271,271).cuda()
model.eval()
model.cuda()
ONNX_FILE_PATH = "SiamRPNOTB.onnx"

# torch.onnx.export(model, z, ONNX_FILE_PATH, input_names=["z"], output_names=["zf"], export_params=True)

torch.onnx.export(model,x, ONNX_FILE_PATH, input_names=["x"], 
                  output_names=["delta", "score" ], export_params=True)


In [7]:
temple = Temple()
temple = Temple()
temple.load_state_dict(torch.load('SiamRPNOTB.model'))
z = torch.randn(1,3,127,127).cuda()
temple.eval()
temple.cuda()
r1_kernel,cls1_kernel = temple(z)

In [8]:
siam = SiamRPN()
siam.load_state_dict(torch.load('SiamRPNOTB.model'))
x = torch.randn(1,3,271,271).cuda()
siam.eval()
siam.cuda()
delta,score = siam(x)

In [9]:
delta2 = F.conv2d(delta, r1_kernel)

In [10]:
score2 = F.conv2d(score, cls1_kernel)
score2.shape

torch.Size([1, 10, 19, 19])

In [11]:
delta2.shape

torch.Size([1, 20, 19, 19])

In [12]:
r1_kernel.shape

torch.Size([20, 256, 4, 4])

In [13]:
cls1_kernel.shape

torch.Size([10, 256, 4, 4])

In [108]:
class RegressAdjust(nn.Module):
    def __init__(self):
        super(RegressAdjust, self).__init__()
        self.conv = siam.regress_adjust
    def forward(self,delta2):
        delta = self.conv(delta2)
        delta = delta.permute(1, 2, 3, 0).contiguous().view(4, -1)
        return delta

In [109]:
model = RegressAdjust()
# model.load_state_dict(torch.load('SiamRPNOTB.model'))
x = torch.randn(1,20,19,19).cuda()
model.eval()
model.cuda()
ONNX_FILE_PATH = "RegressAdjust.onnx"

# torch.onnx.export(model, z, ONNX_FILE_PATH, input_names=["z"], output_names=["zf"], export_params=True)

torch.onnx.export(model,x, ONNX_FILE_PATH, input_names=["delta2"], 
                  output_names=["final_delta" ], export_params=True)

In [110]:
y = model(x)
y.shape

torch.Size([4, 1805])

In [111]:
y

tensor([[ 0.0012, -0.1298, -0.0033,  ...,  0.0602, -0.0365,  0.1280],
        [-0.1015, -0.0980, -0.0731,  ..., -0.0420,  0.1005, -0.1431],
        [-0.2207, -0.3327, -0.1688,  ...,  0.1557,  0.1316,  0.1862],
        [ 0.3933,  0.0751,  0.1954,  ..., -0.3612,  0.0348, -0.1545]],
       device='cuda:0', grad_fn=<ViewBackward0>)

In [96]:


def generate_anchor(total_stride, scales, ratios, score_size):
    anchor_num = len(ratios) * len(scales)
    anchor = np.zeros((anchor_num, 4),  dtype=np.float32)
    size = total_stride * total_stride
    count = 0
    for ratio in ratios:
        # ws = int(np.sqrt(size * 1.0 / ratio))
        ws = int(np.sqrt(size / ratio))
        hs = int(ws * ratio)
        for scale in scales:
            wws = ws * scale
            hhs = hs * scale
            anchor[count, 0] = 0
            anchor[count, 1] = 0
            anchor[count, 2] = wws
            anchor[count, 3] = hhs
            count += 1

    anchor = np.tile(anchor, score_size * score_size).reshape((-1, 4))
    ori = - (score_size / 2) * total_stride
    xx, yy = np.meshgrid([ori + total_stride * dx for dx in range(score_size)],
                         [ori + total_stride * dy for dy in range(score_size)])
    xx, yy = np.tile(xx.flatten(), (anchor_num, 1)).flatten(), \
             np.tile(yy.flatten(), (anchor_num, 1)).flatten()
    anchor[:, 0], anchor[:, 1] = xx.astype(np.float32), yy.astype(np.float32)
    return anchor

In [97]:
score_size = (271-127) / 8 + 1
anchor1= generate_anchor(total_stride=8, scales= [8, ], 
                         ratios = [0.33, 0.5, 1, 2, 3], score_size =int(score_size))

In [66]:
total_stride=8 
scales= [8, ]
ratios = [0.33, 0.5, 1, 2, 3]
score_size =int(score_size)

anchor_num = len(ratios) * len(scales)
anchor = np.zeros((anchor_num, 4),  dtype=np.float32)
size = total_stride * total_stride
count = 0
for ratio in ratios:
    # ws = int(np.sqrt(size * 1.0 / ratio))
    ws = int(np.sqrt(size / ratio))
    hs = int(ws * ratio)
    for scale in scales:
        wws = ws * scale
        hhs = hs * scale
        anchor[count, 0] = 0
        anchor[count, 1] = 0
        anchor[count, 2] = wws
        anchor[count, 3] = hhs
        count += 1

anchor = np.tile(anchor, score_size * score_size).reshape((-1, 4))

ori = - (score_size / 2) * total_stride

xx, yy = np.meshgrid([ori + total_stride * dx for dx in range(score_size)],
                    [ori + total_stride * dy for dy in range(score_size)])

xx, yy = np.tile(xx.flatten(), (anchor_num, 1)).flatten(), \
         np.tile(yy.flatten(), (anchor_num, 1)).flatten()

In [98]:
anchor1

array([[-76., -76., 104.,  32.],
       [-68., -76., 104.,  32.],
       [-60., -76., 104.,  32.],
       ...,
       [ 52.,  68.,  32.,  96.],
       [ 60.,  68.,  32.,  96.],
       [ 68.,  68.,  32.,  96.]], dtype=float32)

In [95]:
(yy[:19*19]+76)/8

array([ 0.,  0.,  0.,  0.,  0.,  0.,  0.,  0.,  0.,  0.,  0.,  0.,  0.,
        0.,  0.,  0.,  0.,  0.,  0.,  1.,  1.,  1.,  1.,  1.,  1.,  1.,
        1.,  1.,  1.,  1.,  1.,  1.,  1.,  1.,  1.,  1.,  1.,  1.,  2.,
        2.,  2.,  2.,  2.,  2.,  2.,  2.,  2.,  2.,  2.,  2.,  2.,  2.,
        2.,  2.,  2.,  2.,  2.,  3.,  3.,  3.,  3.,  3.,  3.,  3.,  3.,
        3.,  3.,  3.,  3.,  3.,  3.,  3.,  3.,  3.,  3.,  3.,  4.,  4.,
        4.,  4.,  4.,  4.,  4.,  4.,  4.,  4.,  4.,  4.,  4.,  4.,  4.,
        4.,  4.,  4.,  4.,  5.,  5.,  5.,  5.,  5.,  5.,  5.,  5.,  5.,
        5.,  5.,  5.,  5.,  5.,  5.,  5.,  5.,  5.,  5.,  6.,  6.,  6.,
        6.,  6.,  6.,  6.,  6.,  6.,  6.,  6.,  6.,  6.,  6.,  6.,  6.,
        6.,  6.,  6.,  7.,  7.,  7.,  7.,  7.,  7.,  7.,  7.,  7.,  7.,
        7.,  7.,  7.,  7.,  7.,  7.,  7.,  7.,  7.,  8.,  8.,  8.,  8.,
        8.,  8.,  8.,  8.,  8.,  8.,  8.,  8.,  8.,  8.,  8.,  8.,  8.,
        8.,  8.,  9.,  9.,  9.,  9.,  9.,  9.,  9.,  9.,  9.,  9