Skip to content


add regularization to linear models
Browse files Browse the repository at this point in the history
  • Loading branch information
FlorianMuellerklein committed Mar 4, 2015
1 parent 3d6b15b commit f0416ed
Show file tree
Hide file tree
Showing 3 changed files with 79 additions and 90 deletions.
1 change: 1 addition & 0 deletions Data/ionosphere.csv

Large diffs are not rendered by default.

19 changes: 15 additions & 4 deletions
Expand Up @@ -5,10 +5,12 @@ class LinReg(object):
multivariate linear regression using gradient descent!!
takes three arguments: alpha (learning rate), number of iterations for SGD, and verbose if you want to see output
def __init__(self, alpha = 0.01, iterations = 50, verbose = 0):
def __init__(self, alpha = 0.01, iterations = 50, verbose = 0, l2 = 0, intercept = True):
self.alpha = alpha
self.iterations = iterations
self.intercept = intercept
self.verbose = verbose
self.l2 = l2
self.theta = None
self.mean = []
self.std = []
Expand All @@ -19,16 +21,20 @@ def fit(self, X, y):
take steps in direction of steepest decrease of J.
:return: value of theta that minimizes J(theta) and J_history
if self.intercept:
intercept = np.ones((np.shape(X)[0],1))
X = np.concatenate((intercept, X), 1)

num_examples, num_features = np.shape(X)

# initialize theta to 1
self.theta = np.ones(num_features)

for i in range(self.iterations):
# make prediction
predicted = np.dot(X, self.theta)
predicted = np.dot(X, self.theta.T)
# update theta with gradient descent
self.theta = self.theta - self.alpha / num_examples * np.dot((predicted - y), X)
self.theta = (self.theta * (1 - (self.alpha * self.l2))) - self.alpha / num_examples * np.dot((predicted - y).T, X)
# sum of squares cost
error = predicted - y
cost = np.sum(error**2) / (2 * num_examples)
Expand All @@ -46,6 +52,10 @@ def predict(self, X):
:param X: new data to make predictions on
:return: return prediction
if self.intercept:
intercept = np.ones((np.shape(X)[0],1))
X = np.concatenate((intercept, X), 1)

num_examples, num_features = np.shape(X)
prediction = []
for sample in range(num_examples):
Expand All @@ -60,8 +70,9 @@ def demo():
# initialize linear regression parameters
iterations = 2000
alpha = 0.1
l2 = 0.0001

linearReg = LinReg(alpha = alpha, iterations = iterations, verbose = 1)
linearReg = LinReg(alpha = alpha, iterations = iterations, verbose = 1, l2 = l2)

data = np.genfromtxt('Data/blood_pressure.csv', delimiter = ',', skip_header = 1)
X = data[:, 1:]
Expand Down
149 changes: 63 additions & 86 deletions
Expand Up @@ -7,11 +7,13 @@ class Logit(object):
logistic regression using gradient descent!!
takes three arguments: alpha (learning rate), number of iterations for SGD, and verbose if you want to see output
def __init__(self, alpha, iterations, verbose, tolerance):
def __init__(self, alpha, iterations, verbose, tolerance, l2, intercept = True):
self.alpha = alpha
self.iterations = iterations
self.tolerance = tolerance
self.intercept = intercept
self.verbose = verbose
self.l2 = l2
self.theta = None
self.mean = []
self.std = []
Expand All @@ -26,7 +28,7 @@ def sigmoid(self, x):
# typical sigmoid py line, seems to get errors with arrays
return 1 / (1 + np.exp(-x))

def gradient_descent(self, X, y):
def fit(self, X, y):
Search algorithm - loops over theta and updates to
take steps in direction of steepest decrease of J.
Expand All @@ -35,21 +37,26 @@ def gradient_descent(self, X, y):
:input y: must be numpy vector of 0 and 1
:return: value of theta that minimizes J(theta) and J_history
if self.intercept:
intercept = np.ones((np.shape(X)[0],1))
X = np.concatenate((intercept, X), 1)

num_examples, num_features = np.shape(X)

# initialize theta to 1
self.theta = np.ones(num_features)

for i in range(self.iterations):
# make predictions
predicted = self.sigmoid(np.dot(X, self.theta))
predicted = self.sigmoid(np.dot(X, self.theta.T))
# update theta with gradient descent
self.theta = self.theta - self.alpha / num_examples * np.dot((predicted - y), X)
#self.theta -= self.alpha / num_examples * (np.dot((predicted - y).T, X) + (self.l2 * self.theta))
self.theta = (self.theta * (1 - (self.alpha * self.l2))) - self.alpha * np.dot((predicted - y).T, X)
# sum of squares cost
error = predicted - y
cost = np.sum(error**2) / (2 * num_examples)

if i % 5000 == 0 and self.verbose == True:
if i % (self.iterations/10) == 0 and self.verbose == True:
print 'iteration:', i
print 'theta:', self.theta
print 'cost:', cost
Expand All @@ -60,30 +67,6 @@ def gradient_descent(self, X, y):

return self.theta

def transform(self, data):
Calculate mean and standard deviation of data
Transform data by subtracting by mean and
dividing by std
:param data: data file
:return: transformed data

# transform
X_norm = data
for i in range(data.shape[1]):
mean = np.mean(data[:,i])
std = np.std(data[:,i])
X_norm[:,i] = (X_norm[:,i] - mean) / std

X_int = np.ones(shape =(X_norm.shape[0],1))
X_norm = np.hstack((X_int, X_norm))

return X_norm

def predict(self, X, labels):
Make linear prediction based on cost and gradient descent
Expand All @@ -92,73 +75,67 @@ def predict(self, X, labels):
:param labels: boolean
:return: return prediction
num_examples = X.size
prediction = 0
for value in range(num_examples):
prediction = prediction + X[value] * self.theta[value]

prediction = self.sigmoid(prediction)

if labels:
if prediction > 0.5:
prediction = int(1)
if self.intercept:
intercept = np.ones((np.shape(X)[0],1))
X = np.concatenate((intercept, X), 1)

num_examples, num_features = np.shape(X)
prediction = []
for sample in range(num_examples):
yhat = 0
for value in range(num_features):
yhat += X[sample, value] * self.theta[value]

pred = self.sigmoid(yhat)

if labels:
if pred > 0.5:
prediction = int(0)

return prediction

def demo():
########## Test file for Logistic Classifier #############

from sklearn.cross_validation import train_test_split
from sklearn.metrics import confusion_matrix, classification_report
# initialize linear regression parameters
iterations = 100000
alpha = 0.01
max_iterations = 50000
alpha = 0.0001
l2 = 1.0

# plot the data with seaborn (add this later)

lgit = Logit(alpha = alpha, iterations = iterations, verbose = True, tolerance = 0.02)
lgit = Logit(alpha = alpha, iterations = max_iterations,
verbose = True, tolerance = 0.001, l2 = l2)

# load the example data stolen from ''
data = np.loadtxt('Data/heart.txt', delimiter = ',')
data = np.loadtxt('Data/ionosphere.csv', delimiter = ',')
X = data[:, 1:]
y = data[:, 0]

################### DEBUG BABY! ##########################

#import pdb
# creates breakpoint for manually interaction dawg

# transform data
#X = lgit.transform(X)
#print X[1,:]

# fit the linear reg
lgit.gradient_descent(X = X, y = y)

# load testing dataset
test = np.loadtxt('Data/heart_test.txt', delimiter = ',')
X_test = test[:, 1:]
y_test = test[:, 0]

# transform testing data
#X_test = lgit.transform(X_test)
#print X_test[1,:]

# make a predictions
prediction = np.zeros(shape = (y_test.size, 2))
correct = 0
for i in range(y_test.size):
prediction[i,0] = lgit.predict(X_test[i, :], labels = True)
prediction[i, 1] = y_test[i]
if prediction[i, 0] == prediction[i, 1]:
correct += 1

print 'correct: ', correct
#np.savetxt('logitpreds.csv', prediction, delimiter = ',')

# scale data
max = np.amax(X)
X /= max

prediction = []
correct = []
for i in range(0,10):

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size = 0.1)

# fit the reg
lgit.fit(X = X_train, y = y_train)

# make a predictions
prediction.append(lgit.predict(X_test, labels = True))

print prediction
print correct
print classification_report(np.array(correct), np.array(prediction))

if __name__ == '__main__':

0 comments on commit f0416ed

Please sign in to comment.