[![Fixel Algorithms](https://fixelalgorithms.co/images/CCExt.png)](https://fixelalgorithms.gitlab.io/)

<!-- ![](https://i.imgur.com/qkg2E2D.png) -->

# Machine Learning Methods

## Introduction to Optimization - The Gradient Descent Algorithm

> Notebook by:
> - Royi Avital RoyiAvital@fixelalgorithms.com

## Revision History

| Version | Date       | User        |Content / Changes                                                   |
|---------|------------|-------------|--------------------------------------------------------------------|
| 1.0.001 | 02/07/2024 | Royi Avital | Added type notations to the gradient function                      |
| 1.0.001 | 02/07/2024 | Royi Avital | Added dimensions check for the gradient and function evaluation    |
| 1.0.000 | 18/01/2024 | Royi Avital | First version                                                      |

[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/FixelAlgorithmsTeam/FixelCourses/blob/master/AIProgram/2024_02/0009GradientDescent.ipynb)

In [None]:
# Import Packages

# General Tools
import numpy as np
import scipy as sp
import pandas as pd

# Miscellaneous
import datetime
import os
from platform import python_version
import random
import warnings
import yaml

# Visualization
import matplotlib as mpl
import matplotlib.pyplot as plt
import plotly.graph_objects as go
import plotly.io as pio
import seaborn as sns

# Jupyter
from IPython import get_ipython
from IPython.display import Image, display
from ipywidgets import Dropdown, FloatSlider, interact, interactive, IntSlider, Layout, VBox

## Notations

* <font color='red'>(**?**)</font> Question to answer interactively.
* <font color='blue'>(**!**)</font> Simple task to add code for the notebook.
* <font color='green'>(**@**)</font> Optional / Extra self practice.
* <font color='brown'>(**#**)</font> Note / Useful resource / Food for thought.

Code Notations:

```python
someVar    = 2; #<! Notation for a variable
vVector    = np.random.rand(4) #<! Notation for 1D array
mMatrix    = np.random.rand(4, 3) #<! Notation for 2D array
tTensor    = np.random.rand(4, 3, 2, 3) #<! Notation for nD array (Tensor)
tuTuple    = (1, 2, 3) #<! Notation for a tuple
lList      = [1, 2, 3] #<! Notation for a list
dDict      = {1: 3, 2: 2, 3: 1} #<! Notation for a dictionary
oObj       = MyClass() #<! Notation for an object
dfData     = pd.DataFrame() #<! Notation for a data frame
dsData     = pd.Series() #<! Notation for a series
hObj       = plt.Axes() #<! Notation for an object / handler / function handler
```

### Code Exercise

 - Single line fill

 ```python
 valToFill = ???
 ```

 - Multi Line to Fill (At least one)

 ```python
 # You need to start writing
 ????
 ```

 - Section to Fill

```python
#===========================Fill This===========================#
# 1. Explanation about what to do.
# !! Remarks to follow / take under consideration.
mX = ???

???
#===============================================================#
```

In [None]:
# Configuration
# IPython magic: Draw the Matplotlib figures inline in the notebook output.
%matplotlib inline

# Silences all warnings from this point on.
# NOTE(review): This also hides deprecation warnings of the imported packages - confirm it is intended.
warnings.filterwarnings("ignore")

# The same seed is set for NumPy's global generator and Python's `random` module.
seedNum = 512
np.random.seed(seedNum)
random.seed(seedNum)

# Matplotlib default color palette
lMatPltLibclr = ['#1f77b4', '#ff7f0e', '#2ca02c', '#d62728', '#9467bd', '#8c564b', '#e377c2', '#7f7f7f', '#bcbd22', '#17becf']
sns.set_theme() #<! Apply SeaBorn theme
# sns.set_palette("tab10")

# `True` when the string representation of the active IPython shell contains `google.colab`.
runInGoogleColab = 'google.colab' in str(get_ipython())

In [None]:
# Constants
# Default values, by their names intended for plotting.
# NOTE(review): None of them is referenced in the visible part of this notebook.

FIG_SIZE_DEF    = (8, 8) #<! Presumably the default figure size - TODO confirm the units
ELM_SIZE_DEF    = 50     #<! Presumably the default element (Marker) size - TODO confirm
CLASS_COLOR     = ('b', 'r') #<! Presumably a color per class (Matplotlib short codes) - TODO confirm
EDGE_COLOR      = 'k'    #<! Presumably the marker edge color - TODO confirm
MARKER_SIZE_DEF = 10     #<! Presumably the default marker size - TODO confirm
LINE_WIDTH_DEF  = 2      #<! Presumably the default line width - TODO confirm


In [None]:
# Course Packages


In [None]:
# Auxiliary Functions

In [None]:
# Parameters




## The Function

* Consider the function $f$:

$$ f \left( {x}_{1}, {x}_{2} \right) = {x}_{1}^{2} + 10 {x}_{2}^{2} $$

* The gradient of $f$:

$$ \nabla f \left( {x}_{1}, {x}_{2} \right) = \begin{bmatrix} 2 {x}_{1} \\ 20 {x}_{2} \end{bmatrix} $$


In [None]:
# Define the Function

def f(mX: np.ndarray) -> np.ndarray:
    """
    Evaluates the function f(x1, x2) = x1^2 + 10 * x2^2.

    Input:
        mX - A vector of 2 elements `(2,)` (A single point) or a matrix `(2, N)`
             where each column is a point. Any array like input is accepted.
    Output:
        A vector with the value of the function per point: `(N,)` for a matrix
        input, `(1,)` for a vector input.
    Raises:
        ValueError - If the input is not a vector / matrix or if its first
                     dimension is not 2.
    """

    mX = np.asarray(mX) #<! Accept array like inputs (Lists, tuples) as well

    if (mX.ndim < 1) or (mX.ndim > 2):
        raise ValueError('The input must be a vector or a matrix')

    if mX.shape[0] != 2:
        # Without this check a transposed input `(N, 2)` is silently evaluated on its first 2 rows
        raise ValueError(f'The first dimension of the input must be 2, got {mX.shape[0]}')

    if mX.ndim == 1:
        # Add a dimension to make the vector a column in a matrix
        mX = mX[:, None]

    vX1 = mX[0, :]
    vX2 = mX[1, :]

    return (vX1 ** 2) + (10 * (vX2 ** 2))


In [None]:
# Define the Gradient

def GradF(vX: np.ndarray) -> np.ndarray:
    """
    Evaluates the gradient of f(x1, x2) = x1^2 + 10 * x2^2 at a single point.

    Input:
        vX - A vector of 2 elements `(2,)`, the point [x1, x2]. Any array like
             input is accepted.
    Output:
        A vector `(2,)` with the gradient [2 * x1, 20 * x2].
    Raises:
        ValueError - If the input is not a vector or does not have exactly 2 elements.
    """

    vX = np.asarray(vX)

    if vX.ndim != 1:
        # Rejects matrices and scalars (A scalar used to fail later with an indexing error)
        raise ValueError('The input must be a vector')

    if vX.size != 2:
        # Longer vectors used to be silently truncated to their first 2 elements
        raise ValueError(f'The input must have 2 elements, got {vX.size}')

    x1     = vX[0]
    x2     = vX[1]
    vGradF = np.array([2 * x1, 20 * x2])

    return vGradF

## The Gradient Descent Algorithm

Given an initial point $\boldsymbol{x}_{0}$ and a step size $\mu > 0$, the algorithm is defined iteratively as:

$$ \boldsymbol{x}_{k+1} = \boldsymbol{x}_{k} - \mu \nabla f \left( \boldsymbol{x}_{k} \right) $$

In [None]:
# The Gradient Descent
vX0 = np.array([-9.8, 1.7]) #<! Initial point
K   = 50                    #<! Number of iterations (Keep 50 for the interactive part)
µ   = 0.09                  #<! Step size

# The path: Column `kk` holds the point of the `kk` -th iteration, the first column is the initial point
mX       = np.full(shape = (2, K), fill_value = np.nan)
mX[:, 0] = vX0

vX = np.copy(vX0) #<! A copy, so the in place update below does not alter `vX0`
for kk in range(1, K):
    vX -= µ * GradF(vX) #<! A single Gradient Descent step
    mX[:, kk] = vX

In [None]:
# Plotting the Path
# Draws the surface of `f` over a grid with the path of the Gradient Descent (`mX`) on top of it.

# Grid and Surface
v1         = np.linspace(-10, 10, 51)
v2         = np.linspace(-2, 2, 51)
mXX1, mXX2 = np.meshgrid(v1, v2)
mXX        = np.c_[mXX1.ravel(), mXX2.ravel()].T #<! The grid points as columns: (2, 51 * 51)
mY         = f(mXX).reshape(mXX1.shape)          #<! `reshape()` instead of assigning to `shape` (Discouraged by NumPy)

# Plotting  (PlotLy)
contours = dict(z = dict(show = True, start = -1, end = 100, size = 10, color = 'black'))
# A color value per point of the path (By iteration index), the length must match the number of columns of `mX`
marker   = dict(size = 5, color = list(range(mX.shape[1])), colorscale = ["magenta", "yellow"])
line     = dict(color = 'black', width = 2)
# title    = dict(text = r'$\mu =$' + str(µ), y = 0.7, x = 0.5, xanchor = 'center', yanchor = 'top')
title    = dict(text = r'μ = ' + str(μ), y = 0.7, x = 0.5, xanchor = 'center', yanchor = 'top')
font     = dict(size = 16)
camera   = dict(eye = dict(x = 0, y = -1, z = 4))
scene    = dict(xaxis = dict(title = 'x1', range = [-10, 10]),
                yaxis = dict(title = 'x2', range = [-2, 2]),
                zaxis = dict(title = 'f',  range = [-1/2, 200]))

# Trace 0 is the surface, trace 1 is the path
Surf1  = go.Surface(x = mXX1, y = mXX2, z = mY, colorscale = 'Viridis', opacity = 0.95, showscale = False, contours = contours)
Scat1  = go.Scatter3d(x = mX[0, :], y = mX[1, :], z = f(mX), marker = marker, line = line)

layout = go.Layout(width = 1000, height = 500, margin = dict(r = 0, l = 0, b = 0, t = 0),
                   title = title, font = font, scene = scene, scene_camera = camera,
                   scene_aspectmode = 'manual', scene_aspectratio = dict(x = 5, y = 1, z = 1))

fig   = go.Figure(data = [Surf1, Scat1], layout = layout)
fig.show()

In [None]:
# Interactive Visualization

def PlotGradientDescent(figWidget, µ, K = 15):
    """
    Runs the Gradient Descent from the global initial point `vX0` and draws the
    resulting path on the second trace of the figure widget.

    Input:
        figWidget - The figure widget to update. Its trace at index 1 holds the path.
        µ         - The step size.
        K         - The number of points in the path (Including the initial point).
    """

    # The path: One column per iteration, the first column is the initial point
    mPath       = np.full((2, K), np.nan)
    mPath[:, 0] = vX0
    for ii in range(1, K):
        vPrev        = mPath[:, ii - 1]
        mPath[:, ii] = vPrev - µ * GradF(vPrev) #<! A single Gradient Descent step

    vZ = f(mPath) #<! The function value along the path

    # Apply all the changes to the widget as a single batch
    with figWidget.batch_update():
        hPath   = figWidget.data[1]
        hPath.x = mPath[0, :]
        hPath.y = mPath[1, :]
        hPath.z = vZ
        figWidget.layout.title.text = f'µ = {µ}'

In [None]:
# PlotLy Widget
# Builds a `FigureWidget` from the traces and the layout of `fig`.
# `PlotGradientDescent()` updates this widget in place (Trace 1 and the title).
figWid = go.FigureWidget(data = fig.data, layout = fig.layout)

In [None]:
# Sliders
# Number of iterations: Integers in [1, 50], initial value 15
KSlider = IntSlider(min = 1, max = 50, step = 1, value = 15, layout = Layout(width = '30%'))
# Step size: Values in [0, 0.15] with a step of 0.01, initial value 0.01
µSlider = FloatSlider(min = 0, max = .15, step = .01, value = .01, layout = Layout(width = '30%'))

In [None]:
# Interactive Widget (Won't work on Google Colab)
def hPlotGradientDescent(µ, K):
    """
    The callback of the sliders: Redraws the path on `figWid` for the given
    step size `µ` and number of iterations `K`.
    A named function instead of a lambda bound to a name (PEP 8).
    """
    return PlotGradientDescent(figWid, µ, K)

# The figure on top, the sliders generated by `interactive()` below it
vertBox = VBox((figWid, interactive(hPlotGradientDescent, µ = µSlider, K = KSlider)))
vertBox