biostat93
diff --git a/‎MLiP-week06-07/06-07 Linear Classification.ipynb
Lines changed: 1975 additions & 0 deletions b/‎MLiP-week06-07/06-07 Linear Classification.ipynb
Lines changed: 1975 additions & 0 deletions
diff --git a/‎MLiP-week06-07/data_utils.py
Lines changed: 79 additions & 0 deletions b/‎MLiP-week06-07/data_utils.py
Lines changed: 79 additions & 0 deletions
diff --git a/‎MLiP-week06-07/imgs/Linear2.png
134 KB b/‎MLiP-week06-07/imgs/Linear2.png
134 KB
diff --git a/‎MLiP-week06-07/imgs/Linear3.png
137 KB b/‎MLiP-week06-07/imgs/Linear3.png
137 KB
diff --git a/‎MLiP-week06-07/imgs/LinearClassification_prototypes.png
218 KB b/‎MLiP-week06-07/imgs/LinearClassification_prototypes.png
218 KB
diff --git a/‎MLiP-week06-07/imgs/Linear_4.png
424 KB b/‎MLiP-week06-07/imgs/Linear_4.png
424 KB
diff --git a/‎MLiP-week06-07/imgs/backward_gradient.jpg
112 KB b/‎MLiP-week06-07/imgs/backward_gradient.jpg
112 KB
diff --git a/‎MLiP-week06-07/imgs/classifydemo.jpeg
72.8 KB b/‎MLiP-week06-07/imgs/classifydemo.jpeg
72.8 KB
diff --git a/‎MLiP-week06-07/imgs/cross_entropy_formula.jpg
105 KB b/‎MLiP-week06-07/imgs/cross_entropy_formula.jpg
105 KB
diff --git a/‎MLiP-week06-07/imgs/cross_entropy_loss.jpg
108 KB b/‎MLiP-week06-07/imgs/cross_entropy_loss.jpg
108 KB
diff --git a/‎MLiP-week06-07/imgs/gradient_descent_fig.jpg
88.7 KB b/‎MLiP-week06-07/imgs/gradient_descent_fig.jpg
88.7 KB
diff --git a/‎MLiP-week06-07/imgs/gradient_descent_line_graph.gif
1.58 MB b/‎MLiP-week06-07/imgs/gradient_descent_line_graph.gif
1.58 MB
diff --git a/‎MLiP-week06-07/imgs/linear1.png
125 KB b/‎MLiP-week06-07/imgs/linear1.png
125 KB
diff --git a/‎MLiP-week06-07/imgs/loss.png
166 KB b/‎MLiP-week06-07/imgs/loss.png
166 KB
diff --git a/‎MLiP-week06-07/imgs/margin.jpg
13 KB b/‎MLiP-week06-07/imgs/margin.jpg
13 KB
diff --git a/‎MLiP-week06-07/imgs/regularization_loss.jpg
128 KB b/‎MLiP-week06-07/imgs/regularization_loss.jpg
128 KB
diff --git a/‎MLiP-week06-07/imgs/svm-loss.jpg
143 KB b/‎MLiP-week06-07/imgs/svm-loss.jpg
143 KB
diff --git a/‎MLiP-week06-07/imgs/svm_half_vectorized.jpg
146 KB b/‎MLiP-week06-07/imgs/svm_half_vectorized.jpg
146 KB
diff --git a/‎MLiP-week06-07/imgs/wb.jpeg
82.4 KB b/‎MLiP-week06-07/imgs/wb.jpeg
82.4 KB
diff --git a/‎MLiP-week06-07/layers.py
Lines changed: 235 additions & 0 deletions b/‎MLiP-week06-07/layers.py
Lines changed: 235 additions & 0 deletions
@@ -0,0 +1,79 @@
+from six.moves import cPickle as pickle
+import numpy as np
+import os
+from scipy.misc import imread
+import platform
+
+def load_pickle(f):
+    version = platform.python_version_tuple()
+    if version[0] == '2':
+        return  pickle.load(f)
+    elif version[0] == '3':
+        return  pickle.load(f, encoding='latin1')
+    raise ValueError("invalid python version: {}".format(version))
+
+def load_CIFAR_batch(filename):
+  """ load single batch of cifar """
+  with open(filename, 'rb') as f:
+    datadict = load_pickle(f)
+    X = datadict['data']
+    Y = datadict['labels']
+    X = X.reshape(10000, 3, 32, 32).transpose(0,2,3,1).astype("float")
+    Y = np.array(Y)
+    return X, Y
+
+def load_CIFAR10(ROOT):
+  """ load all of cifar """
+  xs = []
+  ys = []
+  for b in range(1,6):
+    f = os.path.join(ROOT, 'data_batch_%d' % (b, ))
+    X, Y = load_CIFAR_batch(f)
+    xs.append(X)
+    ys.append(Y)    
+  Xtr = np.concatenate(xs)
+  Ytr = np.concatenate(ys)
+  del X, Y
+  Xte, Yte = load_CIFAR_batch(os.path.join(ROOT, 'test_batch'))
+  return Xtr, Ytr, Xte, Yte
+
+
+def get_CIFAR10_data(cifar10_dir, num_training=49000, num_validation=1000, num_test=1000,
+                     subtract_mean=True):
+    """
+    Load the CIFAR-10 dataset from disk and perform preprocessing to prepare
+    it for classifiers. These are the same steps as we used for the SVM, but
+    condensed to a single function.
+    """
+    # Load the raw CIFAR-10 data
+    X_train, y_train, X_test, y_test = load_CIFAR10(cifar10_dir)
+        
+    # Subsample the data
+    mask = list(range(num_training, num_training + num_validation))
+    X_val = X_train[mask]
+    y_val = y_train[mask]
+    mask = list(range(num_training))
+    X_train = X_train[mask]
+    y_train = y_train[mask]
+    mask = list(range(num_test))
+    X_test = X_test[mask]
+    y_test = y_test[mask]
+
+    # Normalize the data: subtract the mean image
+    if subtract_mean:
+      mean_image = np.mean(X_train, axis=0)
+      X_train -= mean_image
+      X_val -= mean_image
+      X_test -= mean_image
+    
+    # Transpose so that channels come first
+    X_train = X_train.transpose(0, 3, 1, 2).copy()
+    X_val = X_val.transpose(0, 3, 1, 2).copy()
+    X_test = X_test.transpose(0, 3, 1, 2).copy()
+
+    # Package data into a dictionary
+    return {
+      'X_train': X_train, 'y_train': y_train,
+      'X_val': X_val, 'y_val': y_val,
+      'X_test': X_test, 'y_test': y_test,
+    }
@@ -0,0 +1,235 @@
+import numpy as np
+
+
+def affine_forward(x, W, b):
+    """
+    A linear mapping from inputs to scores.
+    
+    Inputs:
+        - x: input matrix (N, d_1, ..., d_k)
+        - W: weigh matrix (D, C)
+        - b: bias vector  (C, )
+    
+    Outputs:
+        - out: output of linear layer (N, C)
+    """
+    x2d = np.reshape(x, (x.shape[0], -1))  # convert 4D input matrix to 2D    
+    out = np.dot(x2d, W) + b               # linear transformation
+    cache = (x, W, b)                      # keep for backward step (stay with us)
+    return out, cache
+
+
+def affine_backward(dout, cache):
+    """
+    Computes the backward pass for an affine layer.
+
+    Inputs:
+        - dout: Upstream derivative, of shape (N, C)
+        - cache: Tuple of:
+            - x: Input data, of shape (N, d_1, ... d_k)
+            - w: Weights, of shape (D, C)
+            - b: biases, of shape (C,)
+
+    Outputs:
+        - dx: Gradient with respect to x, of shape (N, d1, ..., d_k)
+        - dw: Gradient with respect to w, of shape (D, C)
+        - db: Gradient with respect to b, of shape (C,)
+    """
+    x, w, b = cache
+    x2d = np.reshape(x, (x.shape[0], -1))
+
+    # compute gradients
+    db = np.sum(dout, axis=0)
+    dw = np.dot(x2d.T, dout)
+    dx = np.dot(dout, w.T)
+
+    # reshape dx to match the size of x
+    dx = dx.reshape(x.shape)
+    
+    return dx, dw, db
+
+def svm_loss_naive(scores, y, W, reg=1e-3):
+    """
+    Naive implementation of SVM loss function.
+
+    Inputs:
+        - scores: scores for all training data (N, C)
+        - y: correct labels for the training data
+        - reg: regularization strength (lambd)
+
+    Outputs:
+       - loss: data loss plus L2 regularization loss
+       - grads: graidents of loss wrt scores
+    """
+
+    N, C = scores.shape
+
+    # Compute svm data loss
+    loss = 0.0
+    for i in range(N):
+        s = scores[i]  # scores for the ith data
+        correct_class = y[i]  # correct class score
+
+        for j in range(C):
+            if j == y[i]:
+                continue
+            else:
+                # loss += max(0, s[j] - s[correct_class] + 1.0)
+                margin = s[j] - s[correct_class] + 1.0
+                if margin > 0:
+                    loss += margin
+    loss /= N
+
+    # Adding L2-regularization loss
+    loss += 0.5 * reg * np.sum(W * W)
+
+    # Compute gradient off loss function w.r.t. scores
+    # We will write this part later
+    grads = {} 
+
+    return loss, grads
+
+def svm_loss_half_vectorized(scores, y, W, reg=1e-3):
+    """
+    Half-vectorized implementation of SVM loss function.
+
+    Inputs:
+        - scores: scores for all training data (N, C)
+        - y: correct labels for the training data
+        - reg: regularization strength (lambd)
+
+    Outputs:
+       - loss: data loss plus L2 regularization loss
+       - grads: graidents of loss wrt scores
+    """
+
+    N, C = scores.shape
+
+    # Compute svm data loss
+    loss = 0.0
+    for i in range(N):
+        s = scores[i]  # scores for the ith data
+        correct_class = y[i]  # correct class score
+
+        margins = np.maximum(0.0, s - s[correct_class] + 1.0)
+        margins[correct_class] = 0.0
+        loss += np.sum(margins)
+
+    loss /= N
+
+    # Adding L2-regularization loss
+    loss += 0.5 * reg * np.sum(W * W)
+
+    # Compute gradient off loss function w.r.t. scores
+    # We will write this part later
+    grads = {} 
+
+    return loss, grads
+
+
+def svm_loss(scores, y, W, reg=1e-3):
+    """
+    Fully-vectorized implementation of SVM loss function.
+
+    Inputs:
+        - scores: scores for all training data (N, C)
+        - y: correct labels for the training data
+        - reg: regularization strength (lambd)
+
+    Outputs:
+       - loss: data loss plus L2 regularization loss
+       - grads: graidents of loss wrt scores
+    """
+
+    N = scores.shape[0]
+
+    # Compute svm data loss
+    correct_class_scores = scores[range(N), y]
+    margins = np.maximum(0.0, scores - correct_class_scores[:, None] + 1.0)
+    margins[range(N), y] = 0.0
+    loss = np.sum(margins) / N
+
+    # Adding L2-regularization loss
+    loss += 0.5 * reg * np.sum(W * W)
+
+    # Compute gradient off loss function w.r.t. scores
+    # We will write this part later
+    grads = {} 
+
+    return loss, grads
+
+
+def softmax_loss_naive(scores, y, W, reg=1e-3):
+    """
+    Softmax loss function, naive implementation (with loops)
+
+    Inputs have dimension D, there are C classes, and we operate on minibatches
+    of N examples.
+
+    Inputs:
+        - scores: A numpy array of shape (N, C).
+        - y: A numpy array of shape (N,) containing training labels;
+        - W: A numpy array of shape (D, C) containing weights.
+        - reg: (float) regularization strength
+
+    Outputs:
+        - loss as single float
+        - gradient with respect to weights W; an array of same shape as W
+    """
+    N, C = scores.shape
+
+    # compute data loss
+    loss = 0.0
+    for i in range(N):
+        correct_class = y[i]
+        score = scores[i]
+        score -= np.max(scores)
+        exp_score = np.exp(score)
+        probs = exp_score / np.sum(exp_score)
+        loss += -np.log(probs[correct_class])
+
+    loss /= N
+
+    # compute regularization loss
+    loss += 0.5 * reg * np.sum(W * W)
+
+    # Compute gradient off loss function w.r.t. scores
+    # We will write this part later
+    grads = {}  
+
+    return loss, grads
+
+
+def softmax_loss(scores, y, W, reg=1e-3):
+    """
+    Softmax loss function, naive implementation (with loops)
+
+    Inputs have dimension D, there are C classes, and we operate on minibatches
+    of N examples.
+
+    Inputs:
+        - scores: A numpy array of shape (N, C).
+        - y: A numpy array of shape (N,) containing training labels;
+        - W: A numpy array of shape (D, C) containing weights.
+        - reg: (float) regularization strength
+
+    Outputs:
+        - loss as single float
+        - gradient with respect to weights W; an array of same shape as W
+    """
+    N = scores.shape[0]  # number of input data
+
+    # compute data loss
+    scores -= np.max(scores, axis=1, keepdims=True)
+    exp_scores = np.exp(scores)
+    probs = exp_scores / np.sum(exp_scores, axis=1, keepdims=True)
+    loss = -np.sum(np.log(probs[range(N), y])) / N
+
+    # compute regularization loss
+    loss += 0.5 * reg * np.sum(W * W)
+
+    # Compute gradient off loss function w.r.t. scores
+    # We will write this part later
+    grads = {}  
+
+    return loss, grads