### 1.
Read the sections “Introducing the Julia Set” and “Calculating the Full Julia Set” on 
Chapter 2. Profiling to Find Bottlenecks from the book: M. Gorelick & I. Ozsvald 
(2020). High Performance Python. Practical Performant Programming for Humans. 
Second Edition. United States of America: O’Reilly Media, Inc. Implement the 
chapter functions (Example 2-1, 2-2, 2-3 and 2-4) on Python in order to calculate the 
Julia Set. Make the representation for the false gray and pure gray scale.  

In [1]:
import time
from PIL import Image # Pillow
import array

In [2]:
# area of space to be rendered
x1, x2, y1, y2 = -1.8, 1.8, -1.8, 1.8
c_real, c_imag = -0.62772, -.42193

In [3]:
def calculate_z_serial_purepython(maxiter, zs, cs):
    """Calculate list"""
    output = [0] * len(zs)
    for i in range(len(zs)):
        n = 0
        z = zs[i]
        c = cs[i]
        while abs(z) < 2 and n < maxiter:
            z = z * z + c
            n += 1
        output[i] = n
    return output

In [4]:
def calc_pure_python(draw_output, desired_width, max_iterations):
    """Create a list of zs and cs, build Julia set and display using PIL"""
    x_step = (float(x2 - x1) / float(desired_width))
    y_step = (float(y1 - y2) / float(desired_width))
    x = []
    y = []
    ycoord = y2
    while ycoord > y1:
        y.append(ycoord)
        ycoord += y_step
    xcoord = x1
    while xcoord < x2:
        x.append(xcoord)
        xcoord += x_step
    # build a list and the initial condition.
    zs = []
    cs = []
    for ycoord in y:
        for xcoord in x:
            zs.append(complex(xcoord, ycoord))
            cs.append(complex(c_real, c_imag))

    print("Length of x:", len(x))
    print("Total elements:", len(zs))
    start_time = time.time()
    output = calculate_z_serial_purepython(max_iterations, zs, cs)
    end_time = time.time()
    secs = end_time - start_time
    print(calculate_z_serial_purepython.__name__ + " took", secs, "seconds")

    # 1000^2 grid with 300 iterations
    assert sum(output) == 33219980

In [5]:
if __name__ == "__main__":
    # Calculate the Julia set 
    # set draw_output
    calc_pure_python(draw_output=False, desired_width=1000, max_iterations=300)

Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 4.320175647735596 seconds


In [6]:
# area of complex space to be rendered
x1, x2, y1, y2 = -1.8, 1.8, -1.8, 1.8
c_real, c_imag = -0.62772, -.42193

In [7]:
def show_greyscale(output_raw, width, height, max_iterations):
    """Convert list to array, show using PIL"""
    # convert scale to [0...255]
    max_iterations = float(max(output_raw))
    print(max_iterations)
    scale_factor = float(max_iterations)
    scaled = [int(o / scale_factor * 255) for o in output_raw]
    output = array.array('B', scaled)  # array of unsigned ints
    # display
    im = Image.new("L", (width, width))
    # Greyscale
    im.frombytes(output.tobytes(), "raw", "L", 0, -1)
    im.show(title="Greyscale Julia Set")

In [8]:
def show_false_greyscale(output_raw, width, height, max_iterations):
    """Convert list to array, show using PIL"""
    # convert scale to [0...255]
    assert width * height == len(output_raw)
    # normalise to 0-255
    max_value = float(max(output_raw))
    output_raw_limited = [int(float(o) / max_value * 255) for o in output_raw]
    # fancy RGB
    output_rgb = (
        (o + (256 * o) + (256 ** 2) * o) * 16 for o in output_raw_limited)  # fancier
    # convert to bytes
    output_rgb = array.array('I', output_rgb)
    # display
    im = Image.new("RGB", (width, height))
    # False colour
    im.frombytes(output_rgb.tobytes(), "raw", "RGBX", 0, -1)
    im.show(title="False Greyscale Julia Set")

In [9]:
def calculate_z_serial_purepython(maxiter, zs, cs):
    """Calculate list"""
    output = [0] * len(zs)
    for i in range(len(zs)):
        n = 0
        z = zs[i]
        c = cs[i]
        while abs(z) < 2 and n < maxiter:
            z = z * z + c
            n += 1
        output[i] = n
    return output

In [10]:
def calc_pure_python(draw_output, desired_width, max_iterations):
    """Create a list of zs and cs, build Julia set and display using PIL"""
    x_step = (float(x2 - x1) / float(desired_width))
    y_step = (float(y1 - y2) / float(desired_width))
    x = []
    y = []
    ycoord = y2
    while ycoord > y1:
        y.append(ycoord)
        ycoord += y_step
    xcoord = x1
    while xcoord < x2:
        x.append(xcoord)
        xcoord += x_step
    width = len(x)
    height = len(y)
    # build a list of co-ordinates and the initial condition 
    zs = []
    cs = []
    for ycoord in y:
        for xcoord in x:
            zs.append(complex(xcoord, ycoord))
            cs.append(complex(c_real, c_imag))

    print("Length of x:", len(x))
    print("Total elements:", len(zs))
    start_time = time.time()
    output = calculate_z_serial_purepython(max_iterations, zs, cs)
    end_time = time.time()
    secs = end_time - start_time
    print(calculate_z_serial_purepython.__name__ + " took", secs, "seconds")

    # 1000^2 grid with 300 iterations
    assert sum(output) == 33219980
    
    if draw_output:
        
        show_false_greyscale(output, width, height, max_iterations)
        show_greyscale(output, width, height, max_iterations)
        # use matplotlib to draw with falsegray and gray

In [11]:
if __name__ == "__main__":
    # Calculate the Julia set
    calc_pure_python(draw_output=True, desired_width=1000, max_iterations=300)

Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 4.330952405929565 seconds
300.0


/snap/core20/current/lib/x86_64-linux-gnu/libstdc++.so.6: version `GLIBCXX_3.4.29' not found (required by /lib/x86_64-linux-gnu/libproxy.so.1)
Failed to load module: /home/chris/snap/code/common/.cache/gio-modules/libgiolibproxy.so
eog: symbol lookup error: /snap/core20/current/lib/x86_64-linux-gnu/libpthread.so.0: undefined symbol: __libc_pthread_init, version GLIBC_PRIVATE
/snap/core20/current/lib/x86_64-linux-gnu/libstdc++.so.6: version `GLIBCXX_3.4.29' not found (required by /lib/x86_64-linux-gnu/libproxy.so.1)
Failed to load module: /home/chris/snap/code/common/.cache/gio-modules/libgiolibproxy.so


### 2.
Define a new function, timefn, which takes a function as an argument: the inner 
function, measure_time, takes *args (a variable number of positional arguments) 
and **kwargs (a variable number of key/value arguments) and passes them through 
to fn for execution. Decorate calculate_z_serial_purepython with @timefn to profile 
it. Implement Example 2-5 and adapt your current source code.

In [12]:
import time
from functools import wraps

In [13]:
def timefn(function):
    @wraps(function)
    def measure_time(*args, **kwargs):
        t1 = time.time()
        result = function(*args, **kwargs)
        t2 = time.time()
        total_time = t2 - t1
        print(f"{function.__name__} took {total_time} seconds")
        return result
    return measure_time
    
@timefn
def calculate_z_serial_purepython(maxiter, zs, cs):
    """Executes Julia set calculation"""
    output = [0] * len(zs)
    for i in range(len(zs)):
        n = 0
        z = zs[i]
        c = cs[i]
        while abs(z) < 2 and n < maxiter:
            z = z * z + c
            n += 1
        output[i] = n
    return output

In [14]:
if __name__ == "__main__":
     # Compute Julia set with Python only; settings optimized for laptops
    calc_pure_python(draw_output=False, desired_width=1000, max_iterations=300)

eog: symbol lookup error: /snap/core20/current/lib/x86_64-linux-gnu/libpthread.so.0: undefined symbol: __libc_pthread_init, version GLIBC_PRIVATE


Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 4.278077840805054 seconds
calculate_z_serial_purepython took 4.2781455516815186 seconds


### 3.
Use the timeit modeule to get a coarse measurement of the execution speed of the 
CPU-bound function. Runs 10 loops with 5 repetitions. Show how to do the 
measurement on the command line and on a Jupyter Notebook. 

In [15]:
%timeit -r 5 -n 10 calc_pure_python(draw_output=False,desired_width=1000, max_iterations=300)

Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 4.174441576004028 seconds
calculate_z_serial_purepython took 4.174518823623657 seconds
Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 4.087728023529053 seconds
calculate_z_serial_purepython took 4.087798118591309 seconds
Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 3.9615743160247803 seconds
calculate_z_serial_purepython took 3.9616429805755615 seconds
Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 3.9566292762756348 seconds
calculate_z_serial_purepython took 3.9566946029663086 seconds
Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 3.9580259323120117 seconds
calculate_z_serial_purepython took 3.958090305328369 seconds
Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 3.9476125240325928 seconds
calculate_z_serial_purepython took 3.947678565979004 seconds
Length of 

### 4.

Use the cProfile module to profile the source code (.py). Sort the results by the time 
spent inside each function. This will give a view into the slowest parts. Analyze the 
output and make a syntesis of the findings. Show how to use the cProfile module on 
the command line and on a Jupyter Notebook. 

In [16]:
import cProfile
import pstats

In [17]:
profiler = cProfile.Profile()
profiler.enable()
calc_pure_python(draw_output=False, desired_width=1000, max_iterations=300)
profiler.disable()
stats = pstats.Stats(profiler).sort_stats('cumulative')
stats.print_stats()

Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 10.678610801696777 seconds
calculate_z_serial_purepython took 10.678703308105469 seconds
         36222235 function calls in 11.247 seconds

   Ordered by: cumulative time

   ncalls  tottime  percall  cumtime  percall filename:lineno(function)
        2    0.000    0.000   11.270    5.635 /home/chris/miniconda3/envs/hpc3/lib/python3.11/site-packages/IPython/core/interactiveshell.py:3541(run_code)
        2    0.000    0.000   11.269    5.635 {built-in method builtins.exec}
        1    0.468    0.468   11.246   11.246 /tmp/ipykernel_5527/733580140.py:1(calc_pure_python)
        1    0.000    0.000   10.679   10.679 /tmp/ipykernel_5527/472432449.py:2(measure_time)
        1    8.158    8.158   10.679   10.679 /tmp/ipykernel_5527/472432449.py:12(calculate_z_serial_purepython)
 34219980    2.521    0.000    2.521    0.000 {built-in method builtins.abs}
  2002000    0.095    0.000    0.095    0.000 {method 'appen

<pstats.Stats at 0x78126c221a50>

### 5.

Use snakeviz to get a high-level understanding of the cPrifile statistics file. Analyze 
the output and make a syntesis of the findings. 

In [19]:
# using snakeviz
%load_ext snakeviz

if __name__ == "__main__":
    cProfile.run('calc_pure_python(draw_output=False, desired_width=1000, max_iterations=300)', 'Results') # save to file

# view the results on the browser
!snakeviz "Results"

Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 10.147825241088867 seconds
calculate_z_serial_purepython took 10.14790654182434 seconds
snakeviz web server started on 127.0.0.1:8080; enter Ctrl-C to exit
http://127.0.0.1:8080/snakeviz/%2Fhome%2Fchris%2FDesktop%2FHPC%2FHomework%2FCA3C%2FPart%201%20-%20Benchmarking%20and%20Profiling%2FResults
^C

Bye!


### 6.

Use the line_profiler and kernprof file to profile line-by-line the function 
calculate_z_serial_purepython. Analyze the output and make a syntesis of the 
findings. 

In [20]:
# use line_profiler to profile the code
%load_ext line_profiler

# profile the function
%lprun -f calculate_z_serial_purepython calc_pure_python(draw_output=False, desired_width=1000, max_iterations=300) 

  profile = LineProfiler(*funcs)


Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 13.802193641662598 seconds
calculate_z_serial_purepython took 13.802300691604614 seconds


Timer unit: 1e-09 s

Total time: 13.8023 s
File: /tmp/ipykernel_5527/472432449.py
Function: measure_time at line 2

Line #      Hits         Time  Per Hit   % Time  Line Contents
     2                                               @wraps(function)
     3                                               def measure_time(*args, **kwargs):
     4         1       2579.0   2579.0      0.0          t1 = time.time()
     5         1        1e+10    1e+10    100.0          result = function(*args, **kwargs)
     6         1       2476.0   2476.0      0.0          t2 = time.time()
     7         1        747.0    747.0      0.0          total_time = t2 - t1
     8         1      84496.0  84496.0      0.0          print(f"{function.__name__} took {total_time} seconds")
     9         1        210.0    210.0      0.0          return result

### 7.
Use the memory_profiler to diagnose memory usage. Analyze the output and make 
a syntesis of the findings. 


In [21]:
# use memory_profiler to profile the code
%reload_ext memory_profiler 

# profile the function
%memit calc_pure_python(draw_output=False, desired_width=1000, max_iterations=300)

Length of x: 1000
Total elements: 1000000
calculate_z_serial_purepython took 4.181931018829346 seconds
calculate_z_serial_purepython took 4.182017087936401 seconds
peak memory: 178.66 MiB, increment: 85.25 MiB
