In [1]:
# Receptive-field arithmetic for a stack of layers.
#
# For a layer with kernel size k, padding p and stride s, the output size
# (n_out), the jump in the output layer (j_out) and the receptive field
# (r_out) are computed from the previous layer's values as:
#   n_out = ((n_in + 2p - k) // s) + 1
#   j_out = j_in * s
#   r_out = r_in + (k - 1) * j_in


def _next_layer_stats(n_in, j_in, r_in, k, p, s):
    """Return ``(n_out, j_out, r_out)`` for one layer.

    Args:
        n_in: Input size of the layer.
        j_in: Jump of the layer's input.
        r_in: Receptive field of the layer's input.
        k: Kernel size.
        p: Padding.
        s: Stride.
    """
    n_out = ((n_in + 2 * p - k) // s) + 1
    j_out = j_in * s
    # The receptive field grows by (k - 1) steps of the *input* jump.
    r_out = r_in + (k - 1) * j_in
    return n_out, j_out, r_out


# Initial parameters for the input image
n_in = 28  # Input image size used here (i.e. a 28x28 image is assumed)
j_in = 1   # The jump is initially 1 as we start with the input image
r_in = 1   # The initial receptive field is 1x1

# Parameters for each layer, in network order.
# NOTE(review): the MaxPool rows are modelled with k=1, so they change the jump
# and output size but add nothing to the receptive field. If the pooling window
# is actually 2x2 these rows should use k=2 -- confirm against the model.
layers_params = [
    {'k': 3, 'p': 0, 's': 1},  # conv1
    {'k': 3, 'p': 0, 's': 1},  # conv2
    {'k': 1, 'p': 0, 's': 2},  # trans_block1 (MaxPool with stride 2 and Conv1x1)
    {'k': 3, 'p': 0, 's': 1},  # conv3 (Before MaxPool)
    {'k': 1, 'p': 0, 's': 2},  # conv3 (MaxPool with stride 2)
    {'k': 3, 'p': 0, 's': 1},  # conv4
    {'k': 3, 'p': 0, 's': 1},  # conv7
]

# Walk the layers, feeding each layer's outputs in as the next layer's inputs
for layer in layers_params:
    n_out, j_out, r_out = _next_layer_stats(
        n_in, j_in, r_in, layer['k'], layer['p'], layer['s']
    )

    # Update for next layer iteration
    n_in, j_in, r_in = n_out, j_out, r_out

    # Print the results for the current layer
    print(f"Output size (n_out): {n_out}, Jump in output (j_out): {j_out}, Receptive field (r_out): {r_out}")

# r_in holds the last computed r_out; unlike r_out it is also defined when
# layers_params is empty, in which case the receptive field is the initial one.
final_receptive_field = r_in
final_receptive_field


Output size (n_out): 26, Jump in output (j_out): 1, Receptive field (r_out): 3
Output size (n_out): 24, Jump in output (j_out): 1, Receptive field (r_out): 5
Output size (n_out): 12, Jump in output (j_out): 2, Receptive field (r_out): 5
Output size (n_out): 10, Jump in output (j_out): 2, Receptive field (r_out): 9
Output size (n_out): 5, Jump in output (j_out): 4, Receptive field (r_out): 9
Output size (n_out): 3, Jump in output (j_out): 4, Receptive field (r_out): 17
Output size (n_out): 1, Jump in output (j_out): 4, Receptive field (r_out): 25


25