# In this notebook we look into the performance of semi-dual damped Newton in the numpy framework.

In [None]:
from __future__ import division
import os
import numpy as np
import time
import matplotlib.pyplot as plt
import warnings
# Silence every warning for the rest of the session; note that this also hides
# NumPy floating-point warnings (overflow, divide-by-zero) raised by later cells.
warnings.filterwarnings( 'ignore' )
# Seed the legacy global NumPy RNG so that the np.random.rand draws below are reproducible.
np.random.seed(1234)
# Default font size for the figures.
plt.rcParams.update( { 'font.size' : 10 } )
import computational_OT
%matplotlib inline
%load_ext autoreload
%autoreload 2   

In [None]:
# Folders that receive the figures saved by the plotting cells below.
relative_path_to_new_folder = "../Images"
os.makedirs( relative_path_to_new_folder, exist_ok = True )
# exist_ok makes the cell safe to re-run without a separate isdir() check.
os.makedirs( "../Images/DampedNewton_SemiDual_images_numpy", exist_ok = True )

In [None]:
def distmat( x, y ):
    """
    Pairwise squared Euclidean distances between the columns of x and the columns of y.

    Entry (i, j) of the result is |x[:, i]|^2 + |y[:, j]|^2 - 2 <x[:, i], y[:, j]>.
    """
    sq_norms_x = np.square( x ).sum( axis = 0 )
    sq_norms_y = np.square( y ).sum( axis = 0 )
    cross_terms = x.T @ y
    return sq_norms_x[:, None] + sq_norms_y[None, :] - 2 * cross_terms

def normalize( a ):
    """Rescale `a` so that its entries sum to one (divides by np.sum( a ))."""
    return a/np.sum( a )

def GetP( u, K, v ):
    """
    Compute P = diag(u) K diag(v) by broadcasting.

    Row i of K is scaled by u[i] and column j by v[j].
    """
    row_scaling = np.expand_dims( u, 1 )
    col_scaling = np.expand_dims( v, 0 )
    return row_scaling * K * col_scaling

def plotp( x, col, plt, scale = 200, edgecolors = "k" ):
    """
    Scatter-plot the 2D points stored column-wise in x.

    x[0,:] holds the abscissas and x[1,:] the ordinates; `col` is forwarded as the
    colour argument and `plt` is the object whose `scatter` method is called.
    Returns whatever `plt.scatter` returns.
    """
    abscissas, ordinates = x[0,:], x[1,:]
    scatter_options = dict( s = scale, edgecolors = edgecolors, c = col, cmap = 'plasma', linewidths = 2 )
    return plt.scatter( abscissas, ordinates, **scatter_options )

In [None]:
def generate_data( N ):
    """
    Draw two random 2D point clouds.

    N is a list of the size of the data on x and y: N[0] points for x, N[1] points for y.
    x is uniform on the square [-0.5, 0.5)^2; y lies on an annulus with radius in
    [0.8, 1.0) and a uniformly drawn angle. Both are returned with shape (2, size).
    """
    n_x, n_y = N[0], N[1]
    x = np.random.rand( 2, n_x ) - 0.5
    # Polar coordinates of the second cloud (angle first, then radius).
    angles = 2 * np.pi * np.random.rand( 1, n_y )
    radii = 0.8 + 0.2 * np.random.rand( 1, n_y )
    y = np.concatenate( [ radii * np.cos( angles ), radii * np.sin( angles ) ], axis = 0 )
    return x, y

In [None]:
# Sizes of the two point clouds: N[0] points for x and N[1] points for y.
N = [ 500,  600 ]
x, y = generate_data( N )

## Entropy regularized dual-formulation
The dual formulation of the entropy regularized OT is given by:
$$
OT_{\varepsilon}(\alpha,\beta) = \max_{f\in \mathbb{R}^{n}, g\in\mathbb{R}^{m}} \langle f, \alpha \rangle + \langle g, \beta \rangle - \varepsilon\left(\langle\alpha \otimes \beta, e^{\frac{f}{\varepsilon}}\odot K \odot e^{\frac{g}{\varepsilon}}  \rangle-1\right)\ ,
$$
where
$$
\alpha \in \mathcal{M}_{1}(\mathcal{X}),\ \beta \in \mathcal{M}_{1}(\mathcal{Y}),\ \varepsilon>0,\ f\in\mathbb{R}^{n},\ g\in \mathbb{R}^{m}\ .
$$

## The semi-dual formulation of OT is given by:
Using the Schrödinger-bridge equations between the potentials, that is, $g_{j} = -\varepsilon\log\left(\sum_{i}\exp\left(\frac{f_{i}-C_{ij}}{\varepsilon}\right)\alpha_{i}\right)\ , \ \forall j = 1,\dots,m$, we obtain the semi-dual formulation of the objective function, that is,
$$
Q_{\varepsilon}^{semi}(f) = \langle f, \alpha \rangle + \langle g(f,C,\varepsilon), \beta \rangle\ , 
$$
where
$g(f,C,\varepsilon)_{j} = -\varepsilon\log\left(\sum_{i}\exp\left(\frac{f_{i}-C_{ij}}{\varepsilon}\right)\alpha_{i}\right)$.

In this setup, the gradient and the Hessian are as follows:
$$
\nabla_{f}Q_{\varepsilon}^{semi}(f)_{i} = \alpha_{i}\left(1-\sum_{s=1}^{m}\frac{e^{\frac{f_{i}-C_{is}}{\varepsilon}}\beta_{s}}{\left(\sum_{t=1}^{n}\alpha_{t}e^{\frac{f_{t}-C_{ts}}{\varepsilon}}\right)}\right)\ ,\ \forall i = 1,\dots,n 
$$
and
$$
\nabla^{2}_{f}Q_{\varepsilon}^{semi}(f)_{ii} = \frac{-1}{\varepsilon}\sum_{s=1}^{m}\left(\alpha_{i}\exp\left(\frac{f_{i}+g(f,C,\varepsilon)_{s}-C_{is}}{\varepsilon}\right)\right)\left(1 - \alpha_{i}\left(\exp\left(\frac{f_{i}+g(f,C,\varepsilon)_{s}-C_{is}}{\varepsilon}\right)\right)\right)\beta_{s}\ ,\ \forall i =1,\dots,n,
$$
and
$$
\nabla^{2}_{f}Q_{\varepsilon}^{semi}(f)_{ij} = \frac{1}{\varepsilon}\sum_{s=1}^{m}\alpha_{i}\alpha_{j}\left(\exp\left(\frac{f_{i}+g(f,C,\varepsilon)_{s}-C_{is}}{\varepsilon}\right)\right)\left(\exp\left(\frac{f_{j}+g(f,C,\varepsilon)_{s}-C_{js}}{\varepsilon}\right)\right)\beta_{s}\ ,\ \forall i \neq j = 1,\dots,n\ .
$$
Now we plug-in these gradients and Hessian in damped Newton algorithm as we did before.

Here we also use the exp-log stabilization to stabilize $g$, the gradients as well as the Hessian as below
$$
f^{C}_{j} \leftarrow \min_{i}(C_{ij}-f_{i})\ ,  \ \forall j = 1,\dots,m,\ \text{the C-transform of f} \\
g_{j} = -\varepsilon\log\left(\sum_{i}\exp\left(\frac{f_{i}-C_{ij}+f^{C}_{j}}{\varepsilon}\right)\alpha_{i}\right)+f^{C}_{j}\ ,  \ \forall j = 1,\dots,m\ ,\\
\nabla_{f}Q_{\varepsilon}^{semi}(f)_{i} = \alpha_{i}\left(1-\sum_{s=1}^{m}\frac{e^{\frac{f_{i}-C_{is}+f^{C}_{s}}{\varepsilon}}\beta_{s}}{\left(\sum_{t=1}^{n}\alpha_{t}e^{\frac{f_{t}-C_{ts}+f^{C}_{s}}{\varepsilon}}\right)}\right)\ ,\ \forall i = 1,\dots,n\ , \\
\nabla^{2}_{f}Q_{\varepsilon}^{semi}(f)_{ii} = \frac{-1}{\varepsilon}\sum_{s=1}^{m}\left(\alpha_{i}\exp\left(\frac{f_{i}+g(f,C,\varepsilon)_{s}-C_{is}}{\varepsilon}\right)\right)\left(1 - \alpha_{i}\left(\exp\left(\frac{f_{i}+g(f,C,\varepsilon)_{s}-C_{is}}{\varepsilon}\right)\right)\right)\beta_{s}\ ,\ \forall i =1,\dots,n\ , \\
\nabla^{2}_{f}Q_{\varepsilon}^{semi}(f)_{ij} = \frac{1}{\varepsilon}\sum_{s=1}^{m}\alpha_{i}\alpha_{j}\left(\exp\left(\frac{f_{i}+g(f,C,\varepsilon)_{s}-C_{is}}{\varepsilon}\right)\right)\left(\exp\left(\frac{f_{j}+g(f,C,\varepsilon)_{s}-C_{js}}{\varepsilon}\right)\right)\beta_{s}\ ,\ \forall i \neq j = 1,\dots,n\ .
$$

## I. Semidual damped Newton (Direct inversion / No preconditioning)

#### Experiment

In [None]:
withoutprecond_epsilons = [ 1.0, 0.5, 0.05, 0.03, 0.02 ]


# Line-search parameters forwarded to the optimizer
# (presumably the backtracking factor and the Armijo constant -- confirm in computational_OT).
rho = 0.95
c = 0.5
# One entry per epsilon: transport plan, optimizer output, wall time (ms), rescaled Hessian.
Semi_dual_dampedNewtonP = []
results_DampedNewtonsemidual = []
times_DampedNewtonsemidual = []
Hessians_DampedNewtonsemidual= []

#Cost matrix
C = distmat( x, y )
# a and b
a = normalize( np.ones( N[0] ) )
b = normalize( np.ones( N[1] ) )
for eps in withoutprecond_epsilons:
    K = np.exp( - C/eps )
    # Line Search
    print( " Semi-dual damped Newton for epsilon = " + str(eps) + ":" )   
    # Start from the values of a, but on a private copy so the marginal can never be
    # modified through the potential.
    f = a.copy()
    print( " Doing for (",N[0], N[1],"). ")
    print( " |-  Iterating" )  
    start = time.time()
    Optimizer = computational_OT.DampedNewton_SemiDual_np( C, a, b, f, eps, rho, c ) 
    out = Optimizer._update( maxiter = 50 )
    results_DampedNewtonsemidual.append( out )
    end = time.time()
    times_DampedNewtonsemidual.append( 1e3 * ( end - start ) )
    print( " |- Computing P " )
    Semi_dual_dampedNewtonP.append( GetP( np.exp( out['potential_f']/eps ), K, np.exp( out['potential_g']/eps ) ) )
    print( " |- Recording (unstabilized) Hessian \n " )
    mat  = - eps * Optimizer.Hessian
    diag = 1/np.sqrt( a )
    # Symmetric rescaling diag(d) @ mat @ diag(d): rows AND columns are scaled.
    # A plain `diag * mat * diag` broadcasts both factors along the columns, which
    # is only equivalent when a is uniform.
    mat = diag[:,None] * mat * diag[None,:]
    Hessians_DampedNewtonsemidual.append( mat )

#### Error plot

In [None]:
# Marginal-constraint violation per iteration, one curve per epsilon.
plt.figure( figsize = ( 12, 5 ) )
plt.title( "$||P1 -a||_1+||P^T 1 -b||_1$" )
for i, result in enumerate( results_DampedNewtonsemidual ):
  error = np.asarray( result['error'] )
  # Raw string: '\e' is not a valid Python escape sequence.
  plt.plot( error, label = r'Semi-dual damped Newton for $\epsilon = $' + str(withoutprecond_epsilons[i]), linewidth = 2 )
plt.xlabel( " Number of iterations " ) 
plt.ylabel( " Error in log-scale " )
plt.legend( loc = "upper right" )
plt.yscale( 'log' )
plt.tight_layout()
plt.savefig( "../Images/DampedNewton_SemiDual_images_numpy/ErrorLinesearchNewton.pdf", format = 'pdf' )
plt.show()
print( " \n Error plots can increase! The error is not the objective function! " )

#### Objective values plot

In [None]:
# Objective value per iteration, one curve per epsilon.
plt.figure( figsize = ( 12, 5 ) )
plt.title( " Objective Function " )
for i, result in enumerate( results_DampedNewtonsemidual ):
  value = np.asarray( result['objectives'] )
  # Raw string: '\e' is not a valid Python escape sequence.
  plt.plot( value,label = r'Semi-dual damped Newton for $\epsilon = $'+ str(withoutprecond_epsilons[i]), linewidth = 2 )

plt.xlabel( " Number of iterations " )
plt.ylabel( " Objective value " )
# NOTE(review): a log axis drops non-positive objective values -- confirm the objective stays positive.
plt.yscale( 'log' )
plt.legend()
plt.savefig( "../Images/DampedNewton_SemiDual_images_numpy/ObjectiveLineSearchNewton.pdf", format = 'pdf' )
plt.show()

#### Plot displaying the step lengths obtained from the Armijo's conditions at different iterations for different epsilons

In [None]:
# Line-search step length per iteration, one curve per epsilon.
plt.figure( figsize = ( 20, 7 ) )
plt.subplot( 2, 1, 1 )
plt.title( "Alpha" )
for i, result in enumerate( results_DampedNewtonsemidual ):
  # Raw string: '\e' is not a valid Python escape sequence.
  plt.plot( np.asarray( result["linesearch_steps"] ), label = r'Damped Newton for $\epsilon = $'+ str(withoutprecond_epsilons[i]), linewidth = 2 )
plt.xlabel( "Number of iterations" )
plt.ylabel( "Alpha in log-scale" ) 
# The axis label announces a log scale, so actually switch the axis to it.
plt.yscale( 'log' )
plt.legend()
plt.savefig( "../Images/DampedNewton_SemiDual_images_numpy/AlphaLineSearchNewton.pdf", format = 'pdf' )
plt.show()

#### Observing the spectrum of the eigenvalues of the Hessian at the optimal potentials obtained from the above algorithm

In [None]:
def print_spectral_statistics( mat, stabilize = False ):
    """
    Print and return the spectrum of a symmetric matrix.

    Prints the 10 smallest and 10 largest eigenvalues and the ratio
    largest/smallest eigenvalue (labelled "Condition number").

    Parameters
    ----------
    mat : square symmetric array, diagonalized with np.linalg.eigh.
    stabilize : if True, add and then subtract the rank-one projector onto the
        normalized all-ones vector before diagonalizing.

    Returns
    -------
    eig : eigenvalues in ascending order.
    v   : matrix whose columns are the matching eigenvectors.
    """
    if stabilize:
        # The size is read from the matrix itself rather than from the global N.
        n = mat.shape[0]
        ones_direction = ( np.ones( n )/np.sqrt( n ) ).reshape( ( n, 1 ) )
        # NOTE(review): the same vector is added and then subtracted, so the two
        # rank-one updates cancel up to round-off -- confirm this is intended.
        mat = mat + np.dot( ones_direction, ones_direction.T )
        mat = mat - np.dot( ones_direction, ones_direction.T )
    # endif
    eig, v = np.linalg.eigh( mat )
    sorting_indices = np.argsort( eig )
    eig = eig[ sorting_indices ]
    v   = v[ :, sorting_indices ]

    print( "List of smallest eigenvalues: ", eig[ : 10 ] )
    print( "List of largest  eigenvalues: ", eig[ - 10 : ] )
    # eig is sorted, so the extreme eigenvalues sit at both ends.
    min_value = eig[ 0 ]
    max_value = eig[ -1 ]
    condition_number = max_value/min_value
    print( " Condition number: ", condition_number )
    return eig, v

In [None]:
# Diagonalize the recorded Hessian of every epsilon and keep spectra and eigenvectors.
eigs, eigvecs = [], []
for i, eps in enumerate( withoutprecond_epsilons ):
    print( " Spectral statistics of Hessian for epsilon = " + str(eps) )
    spectrum, basis = print_spectral_statistics( Hessians_DampedNewtonsemidual[i], stabilize = False )
    eigs.append( spectrum )
    eigvecs.append( basis )
    print("")


In [None]:
# One histogram of the Hessian eigenvalues per epsilon, stacked vertically.
fig, ax = plt.subplots( figsize = ( 5, 9 ), nrows = len(withoutprecond_epsilons), ncols = 1, sharey = True )
# plt.subplots returns a bare Axes when there is a single row; keep indexing uniform.
ax = np.atleast_1d( ax )
# Figure-level title: a plt.title here would land on the last axes and be
# overwritten by its set_title below.
fig.suptitle( " Histogram of eigenvalues. " )
for i in range( len( withoutprecond_epsilons ) ):
    ax[i].hist( eigs[i], 50 )
    # Raw string: '\e' is not a valid Python escape sequence.
    ax[i].set_title( r" $\epsilon$: " + str(withoutprecond_epsilons[i]) )
    ax[i].set_xlabel( " Eigenvalues " )
    ax[i].set_yscale( "log" )
    ax[i].set_xlim( 0, 2 )
# Leave a strip at the top for the figure title.
fig.tight_layout( rect = [ 0, 0, 1, 0.97 ] )
plt.savefig( "../Images/DampedNewton_SemiDual_images_numpy/eigenhistunstabilized.pdf", format = 'pdf' )
plt.show()

## II. Semidual damped Newton with preconditioning
Here we proceed similar to semi-dual damped Newton but with preconditioning. We consider $t$ eigenvalues of the Hessian and form the following preconditioning matrix:
$$
P = \left(I_{n}-\sum_{i=1}^{t}\left(1 - \frac{1}{\sqrt{\lambda_{i}}}\right)y_{i}y_{i}^{T}\right)\ .
$$
Now, at the $k^{th}$ iteration we solve the following equation:
$$
(P\nabla^{2}Q_{\varepsilon}^{semi}(f)P)(P^{-1}p_{k})=P\nabla Q_{\varepsilon}^{semi}(f)\ ,
$$
using iterative inversion methods such as "Conjugate gradient" and "GMRES" to get the update direction $p_{k}$, following which we use the Armijo condition to obtain the step size $\alpha_{k}$.

#### Preconditioning eigenvectors 
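The eigenvalues of the rescaled Hessian of damped Newton in the semi-dual formulation are expected to lie in the interval $[0,1]$. The following function returns a null vector together with the eigenvectors associated with the `num_eigs` smallest eigenvalues after the first one and with (at most `num_eigs` of) the eigenvalues greater than 1.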

In [None]:
def build_preconditioners( num_eigs, modified_Hessian, ansatz = True ):
    """
    Select the eigenvectors of a symmetric matrix used for preconditioning.

    Parameters
    ----------
    num_eigs : number of eigenvectors to take at each end of the spectrum.
    modified_Hessian : square symmetric array, diagonalized with np.linalg.eigh.
    ansatz : if True the null vector is the normalized all-ones vector,
        otherwise it is the eigenvector of the smallest eigenvalue.

    Returns
    -------
    null_vector : 1D array of length n.
    precond_vectors : list of 1D arrays, without repetition: the eigenvectors of
        the `num_eigs` smallest eigenvalues after the first one, followed by those
        of the (at most `num_eigs`) largest eigenvalues that exceed 1.
    """
    # Diagonalize
    eigenvalues, eigenvectors = np.linalg.eigh( modified_Hessian )
    sorting_indices = np.argsort( eigenvalues )
    eigenvalues  = eigenvalues[ sorting_indices ]
    eigenvectors = eigenvectors[ : , sorting_indices ]
    # The size is read from the matrix itself rather than from the global N.
    n = eigenvalues.shape[0]
    # Form null vector
    if not ansatz:
        null_vector = eigenvectors[:, 0]
    else:
        null_vector = np.ones( n )/np.sqrt( n )
    # Smallest eigenvalues after the first one; clamped so that a large num_eigs
    # cannot index past the last eigenvector.
    lower_indices = list( range( 1, min( num_eigs, n - 1 ) + 1 ) )
    # Eigenvalues greater than 1. The explicit guard matters because
    # some_list[-0:] is the whole list, not an empty one.
    above_one = np.where( eigenvalues > 1  )[0].tolist()
    upper_indices = above_one[ - num_eigs: ] if num_eigs > 0 else []
    # Drop indices already selected so that no eigenvector appears twice.
    already_selected = set( lower_indices )
    indices = lower_indices + [ index for index in upper_indices if index not in already_selected ]
    precond_vectors = [ eigenvectors[ :, index ] for index in indices ]
    return null_vector, precond_vectors

#### Experiment

In [None]:
# Number of eigenvectors requested at each end of the spectrum.
num_eigs = 30
# Preconditioning vectors are built from the last recorded Hessian, i.e. the one of the
# final epsilon of experiment I; with ansatz = False the null vector is the eigenvector
# of the smallest eigenvalue.
null_vector, precond_vectors = build_preconditioners( num_eigs,  Hessians_DampedNewtonsemidual[-1], ansatz = False )


In [None]:
withprecond_epsilons = [ 1.0, 0.5, 0.05, 0.03, 0.02, 0.01 ]
# Line-search parameters forwarded to the optimizer
# (presumably the backtracking factor and the Armijo constant -- confirm in computational_OT).
rho = 0.95
c = 0.5
# True: every epsilon starts from f = 0. False: warm start from the previous solution.
reset_starting_point = True  
# One entry per epsilon.
final_modified_Hessians = []
Semi_dual_dampedNewtonP = []
results_DampedNewton_with_preconditioner_SemiDual = []
times_DampedNewton_with_preconditioner_SemiDual = []
f = None
# Cost matrix
C = distmat( x, y )
# a and b   
a = normalize( np.ones( N[0] ) )
b = normalize( np.ones( N[1] ) )
for eps in withprecond_epsilons :
    # Line Search
    print( " Semi-dual damped Newton for epsilon = "+str(eps)+":" )    
    # Allocate a fresh zero potential whenever a reset is requested, so that a run can
    # never inherit the previous potential through a shared array object.
    if reset_starting_point or f is None:
        f = np.zeros_like( a )
    print( " Doing for (",N[0], N[1],"). " )
    print( " |- Iterating" )  

    start = time.time() 
    Optimizer = computational_OT.DampedNewton_with_precodonditioner_SemiDual_np( C, a, b, f, eps, rho, c, null_vector, precond_vectors[:] )
    out = Optimizer._update( maxiter = 50, iterative_inversion = 100, version = None, debug = False, optType = 'cg' )
    results_DampedNewton_with_preconditioner_SemiDual.append( out )
    end = time.time()
    times_DampedNewton_with_preconditioner_SemiDual.append( 1e3 * ( end - start ) )
    print( " |- Computing P" )
    if not reset_starting_point:
        # NOTE(review): assumes Optimizer.x stacks f (first a.shape[0] entries) and g -- confirm
        # against the semi-dual optimizer, whose unknown may be f alone.
        f = Optimizer.x[:a.shape[0]]
        g = Optimizer.x[a.shape[0]:]
    Semi_dual_dampedNewtonP.append( GetP( np.exp( out['potential_f']/eps ), np.exp( -C/eps ), np.exp( out['potential_g']/eps ) ) )
    final_modified_Hessians.append( Optimizer.modified_Hessian )

#### Error plot

In [None]:
# Marginal-constraint violation per iteration, one curve per epsilon.
plt.rcParams.update( { 'font.size' : 10 } )
plt.figure( figsize = ( 20, 7 ) )   
plt.title( " $||P1 -a||_1+||P^T1 -b||_1$ " ) 
for i, result in enumerate( results_DampedNewton_with_preconditioner_SemiDual ): 
  error = np.asarray( result['error'] ) 
  # Raw string: '\e' is not a valid Python escape sequence.
  plt.plot( error, label = r'Semi-dual damped Newton for $\epsilon = $'+ str(withprecond_epsilons[i]), linewidth = 2 ) 
plt.xlabel( " Number of iterations " )  
plt.ylabel( " Error in log-scale " )  
plt.legend() 
plt.yscale( 'log' ) 
# NOTE(review): the '+' in the file name looks like a typo for "Precond"; left unchanged
# so that existing references to the file keep working.
plt.savefig( "../Images/DampedNewton_SemiDual_images_numpy/ErrorDampedNewtonwithPrec+ond_final_cg.png" ) 
plt.show() 
print( "\n Error plots can increase! The error is not the objective function!" ) 

#### Objective function plot

In [None]:

# Objective value per iteration, one curve per epsilon.
plt.figure( figsize = ( 12, 5 ) )
plt.title( " Objective Function " )
for i, result in enumerate( results_DampedNewton_with_preconditioner_SemiDual ):
  value = np.asarray( result['objectives'] )
  # Raw string: '\e' is not a valid Python escape sequence.
  plt.plot( value, label = r'Damped Newton for $\epsilon = $' + str(withprecond_epsilons[i]), linewidth = 2 )
plt.xlabel( " Number of iterations " )
plt.ylabel( " Objective value " )
# NOTE(review): a log axis drops non-positive objective values -- confirm the objective stays positive.
plt.yscale( 'log' )
plt.legend()
plt.show()

#### Plot displaying the step lengths obtained from the Armijo's conditions at different iterations for different epsilons

In [None]:
# Line-search step length per iteration, one curve per epsilon.
plt.figure( figsize = ( 20, 7 ) )
plt.subplot( 2, 1, 1 )
plt.title( " Alpha " )
for i, result in enumerate( results_DampedNewton_with_preconditioner_SemiDual ):
  # Raw string: '\e' is not a valid Python escape sequence.
  plt.plot( np.asarray( result["linesearch_steps"] ), label = r'Damped Newton for $\epsilon = $'+ str(withprecond_epsilons[i]), linewidth = 2 )
plt.xlabel( "Number of iterations" )
plt.ylabel( "Alpha in log-scale" )
# The axis label announces a log scale, so actually switch the axis to it.
plt.yscale( 'log' )
plt.legend()
plt.show()

#### Plot of the time stamps recorded at different blocks of the iterative inversion method


In [None]:
# Labels of the time stamps, in the order they appear in each 'timings' record.
text = [
        "Preconditioning 1: Form E data",
        "Preconditioning 2: Form P data",
        "Form preconditioning functions",
        "Invert the linear system for p_k",
        "Unwinding",
        "Complete code block"
        ]

plt.figure( figsize = ( 20, 10 ) )  
any_curve_drawn = False
for j in range( len(results_DampedNewton_with_preconditioner_SemiDual[0]['timings'][0]) ):
  # Average of the j-th time stamp over the iterations, for every epsilon.
  values = []
  for result in results_DampedNewton_with_preconditioner_SemiDual:
    stamps = [ record[j] for record in result['timings'] ]
    # A run without any recorded iteration contributes NaN instead of dividing by zero.
    values.append( np.mean( stamps ) if len( stamps ) > 0 else np.nan )
  if len(withprecond_epsilons) == len(values):
    # Fall back to a generic label if the optimizer records more stamps than are named above.
    label = text[j] if j < len( text ) else "Time stamp " + str(j)
    plt.plot( withprecond_epsilons, np.asarray(values), label = label, linewidth = 2 )
    any_curve_drawn = True
# Build the legend once, after all curves exist.
if any_curve_drawn:
  plt.legend( loc = 'upper left' )
# Raw string: '\e' is not a valid Python escape sequence.
plt.xlabel( r"$\epsilon$" )
# NOTE(review): the unit depends on how the optimizer records its timings -- confirm it is ms.
plt.ylabel( "Time in ms" )
plt.show()

#### Looking into the preconditioning
Here we precondition the Hessians with different numbers of preconditioning vectors and plot the histograms of the eigenvalues of the preconditioned Hessians.

In [None]:
# Numbers of preconditioning eigenvectors to compare (0 = diagonal rescaling only).
num_eigs = [ 0, 30, 50, 100, 400, 499 ]
# preconditioned_Hessians[k][i]: Hessian of the i-th epsilon preconditioned with k eigenvectors.
preconditioned_Hessians = {}
for n_vectors in num_eigs:
    preconditioned_Hessians[ n_vectors ] = []
    for i in range(len(withoutprecond_epsilons)):
        # Symmetric rescaling by the inverse square root of the diagonal.
        diag   = 1/np.sqrt(np.diag( Hessians_DampedNewtonsemidual[i] ).flatten())
        result = diag[:,None] * Hessians_DampedNewtonsemidual[i] * diag[None,:]
        if n_vectors != 0:
            # Local names on purpose: the global null_vector / precond_vectors feed the
            # preconditioned experiment cell and must not be overwritten here.
            _, local_precond_vectors = build_preconditioners( n_vectors,  Hessians_DampedNewtonsemidual[i], ansatz = False )
            y_ = np.array( local_precond_vectors ).T # Matrix of size n by k
            # The vectors are eigenvectors of the matrix before the diagonal rescaling, so
            # the Rayleigh quotients y_j^T result y_j are used in place of eigenvalues.
            Ay = np.dot( result, y_ )
            eigenvalues = np.sum( y_ * Ay, axis = 0 )
            # Compute P_matrix = id + y*diag(values)*y.T
            values = ( 1/np.sqrt(eigenvalues) - 1 )    # Vector of size k
            z = y_ * values[None,:]
            # Expansion of P result P = result + B + B.T + C_ with P = id + z y.T
            B = np.dot( Ay, z.T )
            C_ = z @ np.dot( y_.T, Ay ) @ z.T
            result = result + B + B.T + C_
        preconditioned_Hessians[ n_vectors ].append( result )

In [None]:
def spectral_decomposition( mat ):
    """
    Diagonalize a symmetric matrix with np.linalg.eigh.

    Prints the 10 smallest and 10 largest eigenvalues and returns ( eig, v ):
    the eigenvalues in ascending order and the matching eigenvectors as columns.
    """
    raw_values, raw_vectors = np.linalg.eigh( mat )
    order = np.argsort( raw_values )
    eig, v = raw_values[ order ], raw_vectors[ :, order ]
    print( "List of smallest eigenvalues: ", eig[ : 10 ] )
    print( "List of largest  eigenvalues: ", eig[ - 10 : ] )
    return eig, v


# eigs[k][i]: sorted eigenvalues of the i-th Hessian preconditioned with k eigenvectors.
eigs = {}
for n_vectors in num_eigs:
    spectra = []
    eigs[ n_vectors ] = spectra
    print(" For number of preconditioning eigenvectors = ", n_vectors)
    for i, eps in enumerate( withoutprecond_epsilons ):
        print( "Spectral statistics of Hessian for epsilon = "+str(eps) )
        ev = spectral_decomposition( preconditioned_Hessians[ n_vectors ][i])
        spectra.append( ev[0] )
        print("")
    print("------------------------------------------------------------------------------------------")

The following plot shows the effect of different numbers of preconditioning vectors on the Hessian obtained from the semi-dual damped Newton without preconditioning.

In [None]:
# Grid of eigenvalue histograms: one row per number of preconditioning vectors,
# one column per epsilon. The large font is scoped to this figure only, so it does
# not leak into the global rcParams when earlier cells are re-run.
with plt.rc_context( { 'font.size' : 90 } ):
    fig, ax = plt.subplots( figsize = ( 120, 130 ), nrows = len(num_eigs), ncols = len(withoutprecond_epsilons), sharey = True, sharex = False )
    for row, n_vectors in enumerate( num_eigs ):
        for col, eps_value in enumerate( withoutprecond_epsilons ):
            panel = ax[ row ][ col ]
            panel.hist( eigs[ n_vectors ][ col ], 50, rwidth = 0.9 )
            # Raw string: '\e' is not a valid Python escape sequence.
            panel.set_title( " k = "+str(n_vectors)+r", $\epsilon$ = " +str(eps_value)+ "" )
            # Lower bound below one count so that bins holding a single eigenvalue stay visible.
            panel.set_ylim( ymin = 0.5 )
            panel.set_yscale( "log" )
    ax[ len(num_eigs) - 1 ][ len(withoutprecond_epsilons) - 1 ].set_xticks([ 0, 1, 2 ])
    plt.subplots_adjust( wspace = 0, hspace = 0.4 )
    # Rendered inside the context so the font size applies at draw time as well.
    plt.show()
