[WIP] BCG enhancements #121

Merged · 20 commits · Mar 12, 2021
Changes from 4 commits
101 changes: 81 additions & 20 deletions examples/blended_cg.jl
@@ -2,9 +2,11 @@ import FrankWolfe
 using LinearAlgebra
 using Random
 using DoubleFloats
+using FrankWolfe

 n = Int(1e4)
-k = 3000
+#n = Int(1e3)
+k = 1000

 s = rand(1:100)
 @info "Seed $s"
@@ -17,10 +19,24 @@ xpi = rand(n);
 total = sum(xpi);
 const xp = xpi # ./ total;

+#matrix = rand(n, n)
+#hessian = matrix * transpose(matrix)
+#linear_term = rand(n)
+#constant_term = rand()
+#f(x) = constant_term + dot(linear_term, x) + 0.5 * transpose(x) * hessian * x
+#function grad!(storage, x)
+#    storage .= linear_term + hessian * x
+#end
+#gradient = zeros(n)

 f(x) = norm(x - xp)^2
 function grad!(storage, x)
     @. storage = 2 * (x - xp)
 end
+hessian = Matrix(1.0I, n, n)
Review comment (Member), on hessian = Matrix(1.0I, n, n):

    The Hessian should probably be 2I here

Suggested change:
-hessian = Matrix(1.0I, n, n)
+hessian = Matrix(2I, n, n)
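A quick sanity check in support of that suggestion (a sketch, not part of the PR): since f(x) = norm(x - xp)^2, the gradient is 2 * (x - xp), so the Hessian is the constant matrix 2I. A finite-difference probe of that gradient on a small instance agrees; the dimension m, step h, and all names below are illustrative only.

using LinearAlgebra

m, h = 5, 1e-6                 # small illustrative dimension and FD step
xps = rand(m)
g(x) = 2 .* (x .- xps)         # same gradient as grad! above, in functional form
base = rand(m)
H = zeros(m, m)
for j in 1:m
    e = zeros(m); e[j] = h
    H[:, j] = (g(base .+ e) .- g(base)) ./ h   # j-th Hessian column
end
@assert isapprox(H, Matrix(2.0I, m, m); atol=1e-6)   # the Hessian is 2I, not I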
# better for memory consumption as we do coordinate-wise ops

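The bodies of cf and cgrad! are collapsed in this diff; the following is a hypothetical reconstruction of such copy-free, coordinate-wise versions of f and grad!, consistent with the comment above and with the benchmark call below, but not taken from the PR.

# hypothetical sketch: allocation-free objective and gradient over coordinates
function cf(x, xp)
    s = zero(eltype(x))
    @inbounds for i in eachindex(x, xp)
        s += (x[i] - xp[i])^2      # accumulate ||x - xp||^2 without temporaries
    end
    return s
end

function cgrad!(storage, x, xp)
    @inbounds for i in eachindex(storage, x, xp)
        storage[i] = 2 * (x[i] - xp[i])   # write gradient in place
    end
    return nothing
end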
@@ -33,63 +49,73 @@ function cgrad!(storage, x, xp)
 end

 # this LMO might produce numerical instabilities to demonstrate the recovery feature
-const lmo = FrankWolfe.KSparseLMO(100, 1.0)
+#const lmo = FrankWolfe.KSparseLMO(100, 1.0)

 # full upgrade of the LMO (and hence the optimization) to Double64.
 # the same LMO with Double64 is much more numerically robust and costs relatively little in speed.
-# const lmo = FrankWolfe.KSparseLMO(100, Double64(1.0))
+#const lmo = FrankWolfe.KSparseLMO(100, Double64(1.0))

 # as above, but now with BigFloat:
 # the same LMO with BigFloat is even more robust, but much slower
 # const lmo = FrankWolfe.KSparseLMO(100, big"1.0")

 # other oracles to test / experiment with
 # const lmo = FrankWolfe.LpNormLMO{Float64,1}(1.0)
-# const lmo = FrankWolfe.ProbabilitySimplexOracle(Double64(1.0));
+#const lmo = FrankWolfe.ProbabilitySimplexOracle(Double64(1.0));
+const lmo = FrankWolfe.ProbabilitySimplexOracle(1.0);
 # const lmo = FrankWolfe.UnitSimplexOracle(1.0);

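A minimal sketch of the precision upgrade those comments describe (assuming, as the Double64 and BigFloat variants above suggest, that KSparseLMO is generic over the radius type; this is not part of the diff): passing a wider numeric type as the radius makes the oracle return atoms of that type, which then carries through the iterates.

using DoubleFloats
import FrankWolfe

lmo_f64 = FrankWolfe.KSparseLMO(100, 1.0)            # Float64 radius
lmo_dd = FrankWolfe.KSparseLMO(100, Double64(1.0))   # same polytope, wider arithmetic

direction = randn(1000)
v64 = FrankWolfe.compute_extreme_point(lmo_f64, direction)
vdd = FrankWolfe.compute_extreme_point(lmo_dd, direction)
# both calls select the same vertex; vdd carries Double64 entries, so downstream
# iterate updates accumulate roundoff near 2^-106 instead of Float64's 2^-53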
 const x00 = FrankWolfe.compute_extreme_point(lmo, zeros(n))

+#active_set = FrankWolfe.ActiveSet([(1.0, x00)])
+#vect = FrankWolfe.compute_extreme_point(lmo, rand(n))
+#FrankWolfe.active_set_update!(active_set, 0.2, vect)
+#vect = FrankWolfe.compute_extreme_point(lmo, rand(n))
+#FrankWolfe.active_set_update!(active_set, 0.2, vect)

 FrankWolfe.benchmark_oracles(x -> cf(x, xp), (str, x) -> cgrad!(str, x, xp), () -> randn(n), lmo; k=100)

 # copying x00 here and below, as the algorithms write back into the variables to save memory;
 # since we do multiple runs from the same initial point, we do not want that here.
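A minimal, self-contained illustration of the writeback issue this comment refers to (plain Julia aliasing, nothing FrankWolfe-specific):

a = zeros(3)
b = a              # alias: no copy is made
b .= 1.0           # in-place write through the alias also changes a
@assert a == [1.0, 1.0, 1.0]

c = deepcopy(a)    # independent copy, like x0 = deepcopy(x00) below
c .= 2.0
@assert a == [1.0, 1.0, 1.0]   # a is untouched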

 x0 = deepcopy(x00)

-@time x, v, primal, dual_gap, trajectorySs = FrankWolfe.fw(
+x, v, primal, dual_gap, trajectoryBCG = FrankWolfe.bcg(
     f,
     grad!,
     lmo,
     x0,
     max_iteration=k,
-    line_search=FrankWolfe.shortstep,
-    L=2,
+    line_search=FrankWolfe.adaptive,
     print_iter=k / 10,
+    hessian=hessian,
     emphasis=FrankWolfe.memory,
+    L=2,
     verbose=true,
     trajectory=true,
-);
+    Ktolerance=1.00,
+    goodstep_tolerance=0.95,
+    weight_purge_threshold=1e-10,
+)

 x0 = deepcopy(x00)

-@time x, v, primal, dual_gap, trajectoryAda = FrankWolfe.afw(
+x, v, primal, dual_gap, trajectoryBCG2 = FrankWolfe.bcg(
     f,
     grad!,
     lmo,
     x0,
     max_iteration=k,
     line_search=FrankWolfe.adaptive,
-    L=100,
     print_iter=k / 10,
     emphasis=FrankWolfe.memory,
+    L=2,
     verbose=true,
     trajectory=true,
-);
-
-x0 = deepcopy(x00)
+    Ktolerance=1.00,
+    goodstep_tolerance=0.95,
+    weight_purge_threshold=1e-10,
+)

-x, v, primal, dual_gap, trajectoryBCG = FrankWolfe.bcg(
+x, v, primal, dual_gap, trajectoryBCG_backup = FrankWolfe.bcg_backup(
     f,
     grad!,
     lmo,
@@ -106,7 +132,42 @@ x, v, primal, dual_gap, trajectoryBCG = FrankWolfe.bcg(
     weight_purge_threshold=1e-10,
 )

-data = [trajectorySs, trajectoryAda, trajectoryBCG]
-label = ["short step", "AFW", "BCG"]
-
-FrankWolfe.plot_trajectories(data, label)
+data = [trajectoryBCG, trajectoryBCG2, trajectoryBCG_backup]
+label = ["BCG", "BCG old", "BCG backup"]
+
+FrankWolfe.plot_trajectories(data, label, filename="output_results.png")

+#x0 = deepcopy(x00)
+#@time x, v, primal, dual_gap, trajectoryAda = FrankWolfe.afw(
+#    f,
+#    grad!,
+#    lmo,
+#    x0,
+#    max_iteration=k,
+#    line_search=FrankWolfe.adaptive,
+#    L=100,
+#    print_iter=k / 10,
+#    emphasis=FrankWolfe.memory,
+#    verbose=true,
+#    trajectory=true,
+#);
+
+#x0 = deepcopy(x00)
+#@time x, v, primal, dual_gap, trajectorySs = FrankWolfe.fw(
+#    f,
+#    grad!,
+#    lmo,
+#    x0,
+#    max_iteration=k,
+#    line_search=FrankWolfe.shortstep,
+#    L=2,
+#    print_iter=k / 10,
+#    emphasis=FrankWolfe.memory,
+#    verbose=true,
+#    trajectory=true,
+#);
+
+#data = [trajectorySs, trajectoryAda, trajectoryBCG]
+#label = ["short step", "AFW", "BCG"]
+#
+#FrankWolfe.plot_trajectories(data, label)