# Simple iteration for systems of linear equations

First, generate a random diagonally dominant matrix, for testing.

In [None]:
import numpy as np
rndm = np.random.RandomState(1234)

n = 10
A = rndm.uniform(size=(n, n)) + np.diagflat([15]*n)
b = rndm.uniform(size=n)

In [None]:
A

array([[1.51915195e+01, 6.22108771e-01, 4.37727739e-01, 7.85358584e-01,
        7.79975808e-01, 2.72592605e-01, 2.76464255e-01, 8.01872178e-01,
        9.58139354e-01, 8.75932635e-01],
       [3.57817270e-01, 1.55009951e+01, 6.83462935e-01, 7.12702027e-01,
        3.70250755e-01, 5.61196186e-01, 5.03083165e-01, 1.37684496e-02,
        7.72826622e-01, 8.82641191e-01],
       [3.64885984e-01, 6.15396178e-01, 1.50753812e+01, 3.68824006e-01,
        9.33140102e-01, 6.51378143e-01, 3.97202578e-01, 7.88730143e-01,
        3.16836122e-01, 5.68098653e-01],
       [8.69127390e-01, 4.36173424e-01, 8.02147642e-01, 1.51437668e+01,
        7.04260971e-01, 7.04581308e-01, 2.18792106e-01, 9.24867629e-01,
        4.42140755e-01, 9.09315959e-01],
       [5.98092228e-02, 1.84287084e-01, 4.73552788e-02, 6.74880944e-01,
        1.55946248e+01, 5.33310163e-01, 4.33240627e-02, 5.61433080e-01,
        3.29668446e-01, 5.02966833e-01],
       [1.11894318e-01, 6.07193706e-01, 5.65944643e-01, 6.76406199e-03,
   

# I.  Jacobi iteration

Given

$$
A x = b
$$

separate the diagonal part $D$,

$$ A = D + (A - D) $$

and write

$$
x = D^{-1} (D - A) x + D^{-1} b\;.
$$

Then iterate

$$
x_{n + 1} = B x_{n} + c\;,
$$

where 

$$
B = D^{-1} (A - D) \qquad \text{and} \qquad c = D^{-1} b
$$


Let's construct the matrix and the r.h.s. for the Jacobi iteration

In [None]:
diag_1d = np.diag(A)

B = -A.copy()
np.fill_diagonal(B, 0)

D = np.diag(diag_1d)
invD = np.diag(1./diag_1d)
BB = invD @ B 
c = invD @ b

In [None]:
# sanity checks
from numpy.testing import assert_allclose

assert_allclose(-B + D, A)


# xx is a "ground truth" solution, compute it using a direct method
xx = np.linalg.solve(A, b)

np.testing.assert_allclose(A@xx, b)
np.testing.assert_allclose(D@xx, B@xx + b)
np.testing.assert_allclose(xx, BB@xx + c)

Check that $\| B\| \leqslant 1$:

In [None]:
np.linalg.norm(BB)

0.36436161983015336

### Do the Jacobi iteration

In [None]:
n_iter = 50

x0 = np.ones(n)
x = x0
for _ in range(n_iter):
    x = BB @ x + c

In [None]:
# Check the result:

A @ x - b

array([ 1.11022302e-16,  0.00000000e+00, -2.22044605e-16, -1.11022302e-16,
        1.11022302e-16,  0.00000000e+00, -2.42861287e-17,  0.00000000e+00,
       -2.77555756e-17,  1.11022302e-16])

### Task I.1

Collect the proof-of-concept above into a single function implementing the Jacobi iteration. This function should receive the r.h.s. matrix $A$, the l.h.s. vector `b`, and the number of iterations to perform.


The matrix $A$ in the illustration above is strongly diagonally dominant, by construction. 
What happens if the diagonal matrix elements of $A$ are made smaller? Check the convergence of the Jacobi iteration, and check the value of the norm of $B$.

(20% of the total grade)


In [7]:
# ... ENTER YOUR CODE HERE ...
import numpy as np
from numpy.linalg import norm

def jacobi_iteration(A, b, num_iterations):
    n = len(A)
    x = np.zeros(n)
    x_new = np.zeros(n)
    
    for _ in range(num_iterations):
        for i in range(n):
            x_new[i] = (b[i] - np.dot(A[i, :i], x[:i]) - np.dot(A[i, i+1:], x[i+1:])) / A[i, i]
        x = x_new.copy()
        
        B = np.matmul(A, x) - b
        norm_B = norm(B)
        print(f"Iteration {_+1}: Norm of B = {norm_B}")
    
    return x

In [15]:
A = np.array([[9, 4, 1],
              [2, 5, 2],
              [1, 3, 9]])
b = np.array([6, -7, 5])
num_iterations = 4


result = jacobi_iteration(A, b, num_iterations)
print("Final result:", result)

Iteration 1: Norm of B = 6.626173317949521
Iteration 2: Norm of B = 2.6263086895343566
Iteration 3: Norm of B = 1.8084642560080106
Iteration 4: Norm of B = 0.6496155628553975
Final result: [ 1.55907331 -2.37986283  1.15661637]


# II. Seidel's iteration.

##### Task II.1

Implement the Seidel's iteration. 

Test it on a random matrix. Study the convergence of iterations, relate to the norm of the iteration matrix.

(30% of the total grade)

In [17]:
# ... ENTER YOUR CODE HERE ...
import numpy as np
from numpy.linalg import norm

def gauss_seidel_iteration(A, b, num_iterations):
    n = len(A)
    x = np.zeros(n)
    
    for _ in range(num_iterations):
        for i in range(n):
            x[i] = (b[i] - np.dot(A[i, :i], x[:i]) - np.dot(A[i, i+1:], x[i+1:])) / A[i, i]
    
        B = np.matmul(A, x) - b
        norm_B = norm(B)
        print(f"Iteration {_+1}: Norm of B = {norm_B}")
    
    return x

In [19]:
n = 4  # Size of the matrix
A = np.random.rand(n, n)
b = np.random.rand(n)
num_iterations = 10

result = gauss_seidel_iteration(A, b, num_iterations)
print("Final result:", result)

Iteration 1: Norm of B = 0.47115482880698306
Iteration 2: Norm of B = 0.4682065461401488
Iteration 3: Norm of B = 1.1522340723326459
Iteration 4: Norm of B = 3.1400496009127585
Iteration 5: Norm of B = 8.61689820683844
Iteration 6: Norm of B = 23.657183585657798
Iteration 7: Norm of B = 64.95132680978035
Iteration 8: Norm of B = 178.32566714938162
Iteration 9: Norm of B = 489.5981215427655
Iteration 10: Norm of B = 1344.2053880193603
Final result: [ -229.90788346  -157.40250978 -2614.86989    10427.19235299]


# III. Minimum residual scheme

### Task III.1

Implement the $\textit{minimum residual}$ scheme: an explicit non-stationary method, where at each step you select the iteration parameter $\tau_n$ to minimize the residual $\mathbf{r}_{n+1}$ given $\mathbf{r}_n$. Test it on a random matrix, study the convergence to the solution, in terms of the norm of the residual and the deviation from the ground truth solution (which you can obtain using a direct method). Study how the iteration parameter $\tau_n$ changes as iterations progress.

(50% of the grade)

In [21]:
# ... ENTER YOUR CODE HERE ...
import numpy as np
from numpy.linalg import norm, solve


def minres(A, b, num_iterations):
    n = len(A)
    x = np.zeros(n)
    r = b - np.dot(A, x)
    p = r.copy()
    norm_b = norm(b)
    
    for k in range(num_iterations):
        Ap = np.dot(A, p)
        alpha = np.dot(r, r) / np.dot(p, Ap)
        x += alpha * p
        r -= alpha * Ap
        
        residual_norm = norm(r)
        deviation = norm(x - solve(A, b))
        tau = np.dot(r, Ap) / np.dot(Ap, Ap)
        
        print(f"Iteration {k+1}: Residual Norm = {residual_norm}, Deviation = {deviation}, Tau = {tau}")
        
        if residual_norm / norm_b < 1e-6:
            break
        
        beta = np.dot(r, r) / np.dot(Ap, Ap)
        p = r + beta * p
    
    return x

In [22]:
n = 8  # Size of the matrix
A = np.random.rand(n, n)
b = np.random.rand(n)
num_iterations = 10

result = minres(A, b, num_iterations)
print("Final result:", result)

Iteration 1: Residual Norm = 0.47088471249107333, Deviation = 1.0931128183914578, Tau = -0.015205071305713058
Iteration 2: Residual Norm = 4.703617727164354, Deviation = 5.075321901790385, Tau = -9.710085196622206
Iteration 3: Residual Norm = 12.647081241627847, Deviation = 17.614807269858133, Tau = 0.3654060383997934
Iteration 4: Residual Norm = 10.447742748352281, Deviation = 16.20671631810815, Tau = -0.19557702041804415
Iteration 5: Residual Norm = 14.592839292809803, Deviation = 17.8855834632457, Tau = -0.4808208815156215
Iteration 6: Residual Norm = 15.864886510857293, Deviation = 21.875356611657075, Tau = -0.36589202944585547
Iteration 7: Residual Norm = 19.38214778083515, Deviation = 25.741190054227218, Tau = -0.450679106997556
Iteration 8: Residual Norm = 21.416752177686497, Deviation = 30.947126423395552, Tau = -0.3550303371400915
Iteration 9: Residual Norm = 23.560777604261045, Deviation = 35.21373840129604, Tau = -0.38178405893279155
Iteration 10: Residual Norm = 37.84151676