-
Notifications
You must be signed in to change notification settings - Fork 0
/
SVRG_adapRestart_pflug_sc.m
74 lines (59 loc) · 2.61 KB
/
SVRG_adapRestart_pflug_sc.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
function [all_S_pflug, all_eta, time_passes, obj_value, w] = SVRG_adapRestart_pflug_sc(X_train, Y_train, x_tilde, omega, L, m, b, S, eta, lambda1, lambda2, innerPt_no)
%SVRG_ADAPRESTART_PFLUG_SC  Mini-batch proximal SVRG with per-epoch step-size adaptation.
%
%   Runs S outer epochs of m variance-reduced proximal steps each. During
%   every epoch the cosine of the angle between consecutive iterate
%   displacements is accumulated; its per-epoch average drives a
%   multiplicative update of the step size eta for the next epoch.
%
%   Inputs
%     X_train     data matrix; its columns are sampled as data points
%                 (mini-batch indices are drawn from 1..size(X_train, 2)).
%     Y_train     labels, passed through unchanged to the gradient and
%                 objective helpers.
%     x_tilde     initial point (also the first snapshot).
%     omega, L    not used by this routine; kept so existing calls still work.
%     m           number of inner iterations per epoch.
%     b           mini-batch size (indices are drawn with replacement).
%     S           number of outer epochs.
%     eta         initial step size.
%     lambda1,    regularisation weights, forwarded to obj_logreg_r1r2 and,
%     lambda2     scaled by eta, to prox_map.
%     innerPt_no  requested number of objective checkpoints inside an epoch;
%                 clamped to at most floor(sqrt(m)).
%
%   Outputs
%     all_S_pflug S-by-1, average consecutive-step cosine of each epoch.
%     all_eta     S-by-1, step size that was used during each epoch.
%     time_passes elapsed time (toc) at every recorded checkpoint.
%     obj_value   objective at every recorded checkpoint; entry 1 is the
%                 objective at the initial point.
%     w           final iterate.
%
%   time_passes and obj_value are preallocated with S*(1 + innerPt_no) + 1
%   entries. An epoch can produce fewer than innerPt_no inner checkpoints
%   (e.g. m = 16, innerPt_no = 4 yields 3), in which case the unused
%   trailing entries remain zero.

% Step-size adaptation rule (applied once per epoch).
COS_LOWER   = -0.00;   % average cosine below this -> shrink eta
COS_UPPER   = 0.90;    % average cosine above this -> grow eta
ETA_SHRINK  = 0.70;
ETA_GROW    = 1.40;

data_size = size(X_train, 2);

innerPt_no = min(floor(sqrt(m)), innerPt_no);
n_records = S * (1 + innerPt_no) + 1;

obj_value = zeros(n_records, 1);
time_passes = zeros(n_records, 1);
all_S_pflug = zeros(S, 1);
all_eta = zeros(S, 1);

% Inner checkpoints are taken every checkpoint_every iterations.
checkpoint_every = ceil(m / (innerPt_no + 1));

% Column of ones used to sum the selected per-sample gradient columns.
batch_ones = ones(1, b)';

count = 1;
obj_value(count) = obj_logreg_r1r2(lambda1, lambda2, x_tilde, X_train, Y_train);

tic
for s = 1:S
    % The snapshot-gradient pass is logged as one record that carries the
    % previously recorded objective forward.
    count = count + 1;
    obj_value(count) = obj_value(count - 1);
    time_passes(count) = toc;

    % NOTE(review): the leading 0 is presumably the helpers' own
    % regularisation weight, disabled because regularisation is applied via
    % prox_map -- confirm against FullLogR2Gradient_eachComponent/LogR2Gradient.
    [full_gradient, eachComponent] = FullLogR2Gradient_eachComponent(0, x_tilde, X_train, Y_train);

    x = x_tilde;
    step_prev = zeros(size(x));   % displacement of the previous inner step
    cos_sum = 0;

    for k = 1:m
        rand_idx = randi([1, data_size], [1, b]);

        gradient = LogR2Gradient(0, rand_idx, x, X_train, Y_train);
        % Mini-batch average of the stored snapshot gradients.
        %sum_each_component = sum(eachComponent(:,rand_idx),2) * 1.0/b;
        sum_each_component = eachComponent(:, rand_idx) * batch_ones * 1.0 / b;

        % Variance-reduced direction followed by the proximal step.
        g = gradient - sum_each_component + full_gradient;
        x_new = prox_map(x - eta * g, eta * lambda1, eta * lambda2);

        step_cur = x_new - x;
        x = x_new;

        if k > 1
            denom = norm(step_cur) * norm(step_prev);
            % A zero-length step has no direction: count it as a neutral
            % contribution instead of letting 0/0 = NaN poison the epoch
            % average (NaN would make both adaptation tests below false).
            % A NaN denominator (diverged iterates) still propagates.
            if denom ~= 0
                cos_sum = cos_sum + 1.0 * ((step_prev' * step_cur) / denom);
            end
        end
        step_prev = step_cur;

        % The last inner iterate (k == m) is not logged here.
        if rem(k, checkpoint_every) == 0 && k ~= m
            count = count + 1;
            time_passes(count) = toc;
            obj_value(count) = obj_logreg_r1r2(lambda1, lambda2, x, X_train, Y_train);
        end
    end

    % m - 1 cosine terms are accumulated per epoch; with m <= 1 there are
    % none, so report a neutral 0 rather than dividing by zero.
    if m > 1
        S_pflug = cos_sum / (m - 1);
    else
        S_pflug = 0;
    end

    all_S_pflug(s) = S_pflug;
    all_eta(s) = eta;

    if S_pflug < COS_LOWER
        eta = eta * ETA_SHRINK;
    elseif S_pflug > COS_UPPER
        eta = eta * ETA_GROW;
    end

    % The last inner iterate becomes the next snapshot.
    x_tilde = x;
end

w = x_tilde;
end