support input transformations

huanzhang12 · Aug 7, 2018 · 6955b49 · 6955b49
1 parent 1fe1bd7
commit 6955b49
Show file tree

Hide file tree

Showing 5 changed files with 362 additions and 7 deletions.
diff --git a/README.md b/README.md
@@ -18,6 +18,13 @@ by Tsui-Wei Weng\*, Huan Zhang\*, Pin-Yu Chen, Dong Su, Yupeng Gao, Jinfeng Yi,
 
 \* Equal contribution
 
+News
+-------------------------------------
+
+- Aug 6, 2018: CLEVER evaluation with input transformations (e.g., staircase
+  function or JPEG compression) is implemented via BPDA (Backward Pass
+  Differentiable Approximation)
+
 Discussion with Ian Goodfellow and Our Clarifications 
 -------------------------------------
 
@@ -103,6 +110,20 @@ a few `.mat` files.
 
 Run `python3 collect_gradients.py -h` for additional help information.
 
+**Updated:** For model with input transformation, use an additional parameter
+`--transform`.  Currently three input transformations are supported (bit-depth
+reduction, JPEG compression and PNG compression, corresponding to
+`defend_reduce`, `defend_jpeg`, `defend_png` options).  For example:
+
+```
+python3 collect_gradients.py --dataset cifar --numimg 10 --transform defend_jpeg
+```
+
+You should expect roughly the same CLEVER score with input transformations,
+as input transformations do not increase model's intrinsic robustness and can
+be broken by BPDA.
+See `defense.py` for the implementations of input transformations.
+
 ### Step 2: Compute the CLEVER score
 
 To compute CLEVER score using the collected gradients, 

diff --git a/collect_gradients.py b/collect_gradients.py
@@ -40,6 +40,7 @@
     parser.add_argument("--ids", default = "", help = "use a filelist of image IDs in CSV file for attack (UNSUPPORTED)")
     parser.add_argument("--target_type", type=int, default=0b01111, help = "Binary mask for selecting targeted attack classes. bit0: top-2, bit1: random, bit2: least likely, bit3: use --ids override (UNSUPPORTED), bit4: use all labels (for untargeted)")
     parser.add_argument("-f", "--firstimg", type=int, default=0, help = "start from which image in dataset")
+    parser.add_argument("--transform", default="", help = "input transformation function (defend_reduce, defend_jpeg, defend_png)")
     parser.add_argument("--compute_slope", action='store_true', help = "collect slope estimate")
     parser.add_argument("--sample_norm", type=str, choices=["l2", "li", "l1"], help = "norm of sampling ball (l2, l1 or li)", default="l2")
     parser.add_argument("--fix_dirty_bug", action='store_true', help = "do not use (UNSUPPORTED)")
@@ -141,7 +142,7 @@
             print('Target class: ', target_label)
             sys.stdout.flush()
 
-            [L2_max,L1_max,Li_max,G2_max,G1_max,Gi_max,g_x0,pred] = clever_estimator.estimate(input_img, true_label, target_label, Nsamp, Niters, args['sample_norm'])
+            [L2_max,L1_max,Li_max,G2_max,G1_max,Gi_max,g_x0,pred] = clever_estimator.estimate(input_img, true_label, target_label, Nsamp, Niters, args['sample_norm'], args['transform'])
             print("[STATS][L1] total = {}, seq = {}, id = {}, time = {:.3f}, true_class = {}, target_class = {}, info = {}".format(total, i, true_ids[i], time.time() - timestart, true_label, target_label, img_info[i]))
             # save to sampling results to matlab ;)
             mat_path = "{}/{}_{}/{}_{}_{}_{}_{}_{}".format(save_path, dataset, model_name, Nsamp, Niters, true_ids[i], true_label, target_label, img_info[i])

diff --git a/defense.py b/defense.py
@@ -0,0 +1,323 @@
+import PIL
+import PIL.Image
+from io import BytesIO
+import numpy as np
+import tensorflow as tf
+from numba import njit
+
+def defend_reduce(arr, depth=3):
+    arr = (arr * 255.0).astype(np.uint8)
+    shift = 8 - depth
+    arr = (arr >> shift) << shift
+    arr = arr.astype(np.float32)/255.0
+    return arr
+
+def defend_jpeg(input_array):
+    pil_image = PIL.Image.fromarray((input_array*255.0).astype(np.uint8))
+    f = BytesIO()
+    pil_image.save(f, format='jpeg', quality=75) # quality level specified in paper
+    jpeg_image = np.asarray(PIL.Image.open(f)).astype(np.float32)/255.0
+    return jpeg_image
+
+def defend_png(input_array):
+    pil_image = PIL.Image.fromarray((np.around(input_array*255.0)).astype(np.uint8))
+    f = BytesIO()
+    pil_image.save(f, format='png')
+    png_image = np.asarray(PIL.Image.open(f)).astype(np.float32)/255.0
+    return png_image
+
+# for testing implementation
+def defend_none(input_array):
+    # this convertion should be lossless
+    pil_image = PIL.Image.fromarray(input_array)
+    ret_image = np.asarray(pil_image)
+    return ret_image
+
+# based on https://github.com/scikit-image/scikit-image/blob/master/skimage/restoration/_denoise_cy.pyx
+
+# super slow since this is implemented in pure python :'(
+
+@njit
+def bregman(image, mask, weight, eps=1e-3, max_iter=100):
+    rows, cols, dims = image.shape
+    rows2 = rows + 2
+    cols2 = cols + 2
+    total = rows * cols * dims
+    shape_ext = (rows2, cols2, dims)
+
+    u = np.zeros(shape_ext)
+    dx = np.zeros(shape_ext)
+    dy = np.zeros(shape_ext)
+    bx = np.zeros(shape_ext)
+    by = np.zeros(shape_ext)
+
+    u[1:-1, 1:-1] = image
+    # reflect image
+    u[0, 1:-1] = image[1, :]
+    u[1:-1, 0] = image[:, 1]
+    u[-1, 1:-1] = image[-2, :]
+    u[1:-1, -1] = image[:, -2]
+
+    i = 0
+    rmse = np.inf
+    lam = 2 * weight
+    norm = (weight + 4 * lam)
+
+    while i < max_iter and rmse > eps:
+        rmse = 0
+
+        for k in range(dims):
+            for r in range(1, rows+1):
+                for c in range(1, cols+1):
+                    uprev = u[r, c, k]
+
+                    # forward derivatives
+                    ux = u[r, c+1, k] - uprev
+                    uy = u[r+1, c, k] - uprev
+
+                    # Gauss-Seidel method
+                    if mask[r-1, c-1]:
+                        unew = (lam * (u[r+1, c, k] +
+                                      u[r-1, c, k] +
+                                      u[r, c+1, k] +
+                                      u[r, c-1, k] +
+                                      dx[r, c-1, k] -
+                                      dx[r, c, k] +
+                                      dy[r-1, c, k] -
+                                      dy[r, c, k] -
+                                      bx[r, c-1, k] +
+                                      bx[r, c, k] -
+                                      by[r-1, c, k] +
+                                      by[r, c, k]
+                                     ) + weight * image[r-1, c-1, k]
+                               ) / norm
+                    else:
+                        # similar to the update step above, except we take
+                        # lim_{weight->0} of the update step, effectively
+                        # ignoring the l2 loss
+                        unew = (u[r+1, c, k] +
+                                  u[r-1, c, k] +
+                                  u[r, c+1, k] +
+                                  u[r, c-1, k] +
+                                  dx[r, c-1, k] -
+                                  dx[r, c, k] +
+                                  dy[r-1, c, k] -
+                                  dy[r, c, k] -
+                                  bx[r, c-1, k] +
+                                  bx[r, c, k] -
+                                  by[r-1, c, k] +
+                                  by[r, c, k]
+                                 ) / 4.0
+                    u[r, c, k] = unew
+
+                    # update rms error
+                    rmse += (unew - uprev)**2
+
+                    bxx = bx[r, c, k]
+                    byy = by[r, c, k]
+
+                    # d_subproblem
+                    s = ux + bxx
+                    if s > 1/lam:
+                        dxx = s - 1/lam
+                    elif s < -1/lam:
+                        dxx = s + 1/lam
+                    else:
+                        dxx = 0
+                    s = uy + byy
+                    if s > 1/lam:
+                        dyy = s - 1/lam
+                    elif s < -1/lam:
+                        dyy = s + 1/lam
+                    else:
+                        dyy = 0
+
+                    dx[r, c, k] = dxx
+                    dy[r, c, k] = dyy
+
+                    bx[r, c, k] += ux - dxx
+                    by[r, c, k] += uy - dyy
+
+        rmse = np.sqrt(rmse / total)
+        i += 1
+
+    # return np.squeeze(np.asarray(u[1:-1, 1:-1]))
+    return u[1:-1, 1:-1]
+
+@njit
+def defend_tv(input_array, keep_prob=0.5, lambda_tv=0.03):
+    mask = np.random.uniform(0.0, 1.0, size=input_array.shape[:2])
+    mask = mask < keep_prob
+    return bregman(input_array, mask, weight=2.0/lambda_tv)
+
+def make_defend_quilt(sess):
+    # setup for quilting
+    quilt_db = np.load('data/quilt_db.npy')
+    quilt_db_reshaped = quilt_db.reshape(1000000, -1)
+    TILE_SIZE = 5
+    TILE_OVERLAP = 2
+    tile_skip = TILE_SIZE - TILE_OVERLAP
+    K = 10
+    db_tensor = tf.placeholder(tf.float32, quilt_db_reshaped.shape)
+    query_imgs = tf.placeholder(tf.float32, (TILE_SIZE * TILE_SIZE * 3, None))
+    norms = tf.reduce_sum(tf.square(db_tensor), axis=1)[:, tf.newaxis] \
+                    - 2*tf.matmul(db_tensor, query_imgs)
+    _, topk_indices = tf.nn.top_k(-tf.transpose(norms), k=K, sorted=False)
+    def min_error_table(arr, direction):
+        assert direction in ('horizontal', 'vertical')
+        y, x = arr.shape
+        cum = np.zeros_like(arr)
+        if direction == 'horizontal':
+            cum[:, -1] = arr[:, -1]
+            for ix in range(x-2, -1, -1):
+                for iy in range(y):
+                    m = arr[iy, ix+1]
+                    if iy > 0:
+                        m = min(m, arr[iy-1, ix+1])
+                    if iy < y - 1:
+                        m = min(m, arr[iy+1, ix+1])
+                    cum[iy, ix] = arr[iy, ix] + m
+        elif direction == 'vertical':
+            cum[-1, :] = arr[-1, :]
+            for iy in range(y-2, -1, -1):
+                for ix in range(x):
+                    m = arr[iy+1, ix]
+                    if ix > 0:
+                        m = min(m, arr[iy+1, ix-1])
+                    if ix < x - 1:
+                        m = min(m, arr[iy+1, ix+1])
+                    cum[iy, ix] = arr[iy, ix] + m
+        return cum
+    def index_exists(arr, index):
+        if arr.ndim != len(index):
+            return False
+        return all(i > 0 for i in index) and all(index[i] < arr.shape[i] for i in range(arr.ndim))
+    def assign_block(ix, iy, tile, synth):
+        posx = tile_skip * ix
+        posy = tile_skip * iy
+
+        if ix == 0 and iy == 0:
+            synth[posy:posy+TILE_SIZE, posx:posx+TILE_SIZE, :] = tile
+        elif iy == 0:
+            # first row, only have horizontal overlap of the block
+            tile_left = tile[:, :TILE_OVERLAP, :]
+            synth_right = synth[:TILE_SIZE, posx:posx+TILE_OVERLAP, :]
+            errors = np.sum(np.square(tile_left - synth_right), axis=2)
+            table = min_error_table(errors, direction='vertical')
+            # copy row by row into synth
+            xoff = np.argmin(table[0, :])
+            synth[posy, posx+xoff:posx+TILE_SIZE] = tile[0, xoff:]
+            for yoff in range(1, TILE_SIZE):
+                # explore nearby xoffs
+                candidates = [(yoff, xoff), (yoff, xoff-1), (yoff, xoff+1)]
+                index = min((i for i in candidates if index_exists(table, i)), key=lambda i: table[i])
+                xoff = index[1]
+                synth[posy+yoff, posx+xoff:posx+TILE_SIZE] = tile[yoff, xoff:]
+        elif ix == 0:
+            # first column, only have vertical overlap of the block
+            tile_up = tile[:TILE_OVERLAP, :, :]
+            synth_bottom = synth[posy:posy+TILE_OVERLAP, :TILE_SIZE, :]
+            errors = np.sum(np.square(tile_up - synth_bottom), axis=2)
+            table = min_error_table(errors, direction='horizontal')
+            # copy column by column into synth
+            yoff = np.argmin(table[:, 0])
+            synth[posy+yoff:posy+TILE_SIZE, posx] = tile[yoff:, 0]
+            for xoff in range(1, TILE_SIZE):
+                # explore nearby yoffs
+                candidates = [(yoff, xoff), (yoff-1, xoff), (yoff+1, xoff)]
+                index = min((i for i in candidates if index_exists(table, i)), key=lambda i: table[i])
+                yoff = index[0]
+                synth[posy+yoff:posy+TILE_SIZE, posx+xoff] = tile[yoff:, xoff]
+        else:
+            # glue cuts along diagonal
+            tile_up = tile[:TILE_OVERLAP, :, :]
+            synth_bottom = synth[posy:posy+TILE_OVERLAP, :TILE_SIZE, :]
+            errors_up = np.sum(np.square(tile_up - synth_bottom), axis=2)
+            table_up = min_error_table(errors_up, direction='horizontal')
+            tile_left = tile[:, :TILE_OVERLAP, :]
+            synth_right = synth[:TILE_SIZE, posx:posx+TILE_OVERLAP, :]
+            errors_left = np.sum(np.square(tile_left - synth_right), axis=2)
+            table_left = min_error_table(errors_left, direction='vertical')
+            glue_index = -1
+            glue_value = np.inf
+            for i in range(TILE_OVERLAP):
+                e = table_up[i, i] + table_left[i, i]
+                if e < glue_value:
+                    glue_value = e
+                    glue_index = i
+            # copy left part first, up to the overlap column
+            xoff = glue_index
+            synth[posy+glue_index, posx+xoff:posx+TILE_OVERLAP] = tile[glue_index, xoff:TILE_OVERLAP]
+            for yoff in range(glue_index+1, TILE_SIZE):
+                # explore nearby xoffs
+                candidates = [(yoff, xoff), (yoff, xoff-1), (yoff, xoff+1)]
+                index = min((i for i in candidates if index_exists(table_left, i)), key=lambda i: table_left[i])
+                xoff = index[1]
+                synth[posy+yoff, posx+xoff:posx+TILE_OVERLAP] = tile[yoff, xoff:TILE_OVERLAP]
+            # copy right part, down to overlap row
+            yoff = glue_index
+            synth[posy+yoff:posy+TILE_OVERLAP, posx+glue_index] = tile[yoff:TILE_OVERLAP, glue_index]
+            for xoff in range(glue_index+1, TILE_SIZE):
+                # explore nearby yoffs
+                candidates = [(yoff, xoff), (yoff-1, xoff), (yoff+1, xoff)]
+                index = min((i for i in candidates if index_exists(table_up, i)), key=lambda i: table_up[i])
+                yoff = index[0]
+                synth[posy+yoff:posy+TILE_OVERLAP, posx+xoff] = tile[yoff:TILE_OVERLAP, xoff]
+            # copy rest of image
+            synth[posy+TILE_OVERLAP:posy+TILE_SIZE, posx+TILE_OVERLAP:posx+TILE_SIZE] = tile[TILE_OVERLAP:, TILE_OVERLAP:]
+    KNN_MAX_BATCH = 1000
+    def quilt(arr, graphcut=True):
+        h, w, c = arr.shape
+        assert (h - TILE_SIZE) % tile_skip == 0
+        assert (w - TILE_SIZE) % tile_skip == 0
+        horiz_blocks = (w - TILE_SIZE) // tile_skip + 1
+        vert_blocks = (h - TILE_SIZE) // tile_skip + 1
+        num_patches = horiz_blocks * vert_blocks
+        patches = np.zeros((TILE_SIZE * TILE_SIZE * 3, num_patches))
+        idx = 0
+        for iy in range(vert_blocks):
+            for ix in range(horiz_blocks):
+                posx = tile_skip*ix
+                posy = tile_skip*iy
+                patches[:, idx] = arr[posy:posy+TILE_SIZE, posx:posx+TILE_SIZE, :].ravel()
+                idx += 1
+
+        ind = []
+        for chunk in range(num_patches // KNN_MAX_BATCH + (1 if num_patches % KNN_MAX_BATCH != 0 else 0)):
+            start = KNN_MAX_BATCH * chunk
+            end = start + KNN_MAX_BATCH
+            # for some reason, the code below is 10x slower when run in a Jupyter notebook
+            # not sure why...
+            indices_ = sess.run(topk_indices, {db_tensor: quilt_db_reshaped, query_imgs: patches[:, start:end]})
+            for i in indices_:
+                ind.append(np.random.choice(i))
+
+        synth = np.zeros((299, 299, 3))
+
+        idx = 0
+        for iy in range(vert_blocks):
+            for ix in range(horiz_blocks):
+                posx = tile_skip*ix
+                posy = tile_skip*iy
+                tile = quilt_db[ind[idx]]
+                if not graphcut:
+                    synth[posy:posy+TILE_SIZE, posx:posx+TILE_SIZE, :] = tile
+                else:
+                    assign_block(ix, iy, tile, synth)
+                idx += 1
+        return synth
+
+    return quilt
+
+# x is a square image (3-tensor)
+def defend_crop(x, crop_size=90, ensemble_size=30):
+    x_size = tf.to_float(x.shape[1])
+    frac = crop_size/x_size
+    start_fraction_max = (x_size - crop_size)/x_size
+    def randomizing_crop(x):
+        start_x = tf.random_uniform((), 0, start_fraction_max)
+        start_y = tf.random_uniform((), 0, start_fraction_max)
+        return tf.image.crop_and_resize([x], boxes=[[start_y, start_x, start_y+frac, start_x+frac]],
+                                 box_ind=[0], crop_size=[crop_size, crop_size])
+
+    return tf.concat([randomizing_crop(x) for _ in range(ensemble_size)], axis=0)