# Practice Assignment: Understanding Distributions Through Sampling

***This assignment is optional, and I encourage you to share your solutions with me and your peers in the discussion forums!***


To complete this assignment, create a code cell that:
* Creates a number of subplots using the `pyplot subplots` or `matplotlib gridspec` functionality.
* Creates an animation, pulling between 100 and 1000 samples from each of the random variables (`x1`, `x2`, `x3`, `x4`) for each plot and plotting this as we did in the lecture on animation.
* **Bonus:** Go above and beyond and "wow" your classmates (and me!) by looking into matplotlib widgets and adding a widget which allows for parameterization of the distributions behind the sampling animations.


Tips:
* Before you start, think about the different ways you can create this visualization to be as interesting and effective as possible.
* Take a look at the histograms below to get an idea of what the random variables look like, as well as their positioning with respect to one another. This is just a guide, so be creative in how you lay things out!
* Try to keep the length of your animation reasonable (roughly between 10 and 30 seconds).

In [3]:
import matplotlib.pyplot as plt
import numpy as np

%matplotlib notebook

# draw 10,000 samples each from the normal, gamma, exponential, and uniform distributions
# (the exponential samples are shifted right by 7)
x1 = np.random.normal(loc=-2.5, scale=1, size=10000)
x2 = np.random.gamma(shape=2, scale=1.5, size=10000)
x3 = np.random.exponential(scale=2, size=10000) + 7
x4 = np.random.uniform(low=14, high=20, size=10000)

# overlay the four density histograms on one wide figure
plt.figure(figsize=(9, 3))
for sample in (x1, x2, x3, x4):
    plt.hist(sample, density=True, bins=20, alpha=0.5)
plt.axis([-7, 21, 0, 0.6])

# label every histogram 1.5 units to the left of its sample mean
plt.text(x1.mean() - 1.5, 0.5, 'x1\nNormal')
plt.text(x2.mean() - 1.5, 0.5, 'x2\nGamma')
plt.text(x3.mean() - 1.5, 0.5, 'x3\nExponential')
plt.text(x4.mean() - 1.5, 0.5, 'x4\nUniform')

<IPython.core.display.Javascript object>

Text(15.488134592326922, 0.5, 'x4\nUniform')

In [8]:
# draw 10,000 samples per distribution; the exponential samples are shifted right by 7
x1 = np.random.normal(loc=-2.5, scale=1, size=10000)
x2 = np.random.gamma(shape=2, scale=1.5, size=10000)
x3 = np.random.exponential(scale=2, size=10000) + 7
x4 = np.random.uniform(low=14, high=20, size=10000)

# 2x2 grid of subplots that share both the x- and the y-axis
fig, axs = plt.subplots(nrows=2, ncols=2, sharex=True, sharey=True)

def update(curr):
    """Redraw the x1 histogram on axs[0, 1] using the first `curr` samples.

    Frame callback for the animation stored in `a`; `curr` is the current
    frame. Reads the notebook globals `axs`, `x1` and `a`.
    """
    # stop the animation once all 10000 samples of x1 have been drawn
    if curr == 10000:
        a.event_source.stop()
    ax = axs[0, 1]
    ax.cla()
    ax.hist(x1[:curr], bins=25)
    ax.axis([-6, 0, 0, 250])
    # an Axes object has no gca(); titles and labels are set on the Axes itself
    ax.set_title('Sampling the Normal Distribution')
    ax.set_ylabel('Frequency')
    ax.set_xlabel('Value')
    # place the counter inside the visible range (x in -6..0, y in 0..250);
    # a data-coordinate annotation outside the axes is not drawn
    ax.annotate('n = {}'.format(curr), [-1.5, 225])
    
import matplotlib.animation as animation

# start the animation; the handle is kept in `a` because update() stops it via a.event_source
a = animation.FuncAnimation(fig=fig, func=update, interval=1000)

<IPython.core.display.Javascript object>

In [6]:
# sanity check: histogram the first 1000 samples of x1 on axs[0, 1]
axs[0, 1].hist(x1[:1000])

(array([ 10.,  16.,  52., 108., 193., 236., 174., 138.,  53.,  20.]),
 array([-5.5486053 , -4.99125671, -4.43390811, -3.87655951, -3.31921092,
        -2.76186232, -2.20451373, -1.64716513, -1.08981654, -0.53246794,
         0.02488066]),
 <a list of 10 Patch objects>)

In [10]:
def update(curr):
    """Redraw the x1 histogram on axs[0, 1] using the first `curr` samples.

    Frame callback for the animation stored in `a`; `curr` is the current
    frame. Reads the notebook globals `axs`, `x1` and `a`.
    """
    # stop the animation once frame 10000 is reached
    if curr == 10000:
        a.event_source.stop()
    ax = axs[0, 1]
    ax.cla()
    ax.hist(x1[:curr], bins=25)
    ax.axis([-6, 0, 0, 250])
    # an Axes object has no gca(); titles and labels are set on the Axes itself
    ax.set_title('Sampling the Normal Distribution')
    ax.set_ylabel('Frequency')
    ax.set_xlabel('Value')
    # place the counter inside the visible range (x in -6..0, y in 0..250);
    # a data-coordinate annotation outside the axes is not drawn
    ax.annotate('n = {}'.format(curr), [-1.5, 225])

In [11]:
import matplotlib.animation as animation

# start the animation; the handle is kept in `a` because update() stops it via a.event_source
a = animation.FuncAnimation(fig=fig, func=update, interval=10)

In [60]:
# the integers 1..8 as sample data
linear_data = np.arange(1, 9)
# build a 3x3 grid of subplots sharing both axes, then name each Axes row by row
fig, grid = plt.subplots(nrows=3, ncols=3, sharex=True, sharey=True)
(ax1, ax2, ax3), (ax4, ax5, ax6), (ax7, ax8, ax9) = grid
# draw linear_data as a solid line on the centre (5th) subplot
ax5.plot(linear_data, '-')

<IPython.core.display.Javascript object>

[<matplotlib.lines.Line2D at 0x12a8ee610>]

In [63]:
# make the x and y tick labels of every subplot in the current figure visible
for axes in plt.gcf().get_axes():
    tick_labels = axes.get_xticklabels() + axes.get_yticklabels()
    for tick_label in tick_labels:
        tick_label.set_visible(True)

In [64]:
# necessary on some systems to update the plot: force a redraw of the current figure's canvas
plt.gcf().canvas.draw() # gcf: get current figure

In [17]:
import matplotlib.animation as animation

# n samples drawn with np.random.randn; n is also the frame at which update() stops the animation
n = 100
x = np.random.randn(n)

# 2x2 grid of subplots sharing the y-axis
fig, axs = plt.subplots(nrows=2, ncols=2, sharey=True)

# create the function that will do the plotting, where curr is the current frame
def update(curr):
    """Redraw the histogram of the first `curr` samples of `x` on axs[0, 0].

    Frame callback for the animation stored in `a`; reads the notebook
    globals `axs`, `x`, `n` and `a`.
    """
    # check if the animation is at the last frame, and if so, stop the animation
    if curr == n:
        a.event_source.stop()
    ax = axs[0, 0]
    ax.cla()
    bins = np.arange(-4, 4, 0.5)
    ax.hist(x[:curr], bins=bins)
    ax.axis([-4, 4, 0, 30])
    # an Axes object has no gca(); titles and labels are set on the Axes itself
    ax.set_title('Sampling the Normal Distribution')
    ax.set_ylabel('Frequency')
    ax.set_xlabel('Value')
    ax.annotate('n = {}'.format(curr), [3, 27])

<IPython.core.display.Javascript object>

In [19]:
# start the animation; the handle is kept in `a` because update() stops it via a.event_source
a = animation.FuncAnimation(fig=fig, func=update, interval=100)

In [16]:
# sanity check: histogram all of x on axs[0, 0] with the default binning
axs[0,0].hist(x)

(array([ 1.,  2., 11., 16., 22., 22., 10., 10.,  4.,  2.]),
 array([-2.47514497, -1.97680999, -1.47847501, -0.98014003, -0.48180505,
         0.01652993,  0.5148649 ,  1.01319988,  1.51153486,  2.00986984,
         2.50820482]),
 <a list of 10 Patch objects>)

In [20]:
# inspect the type of the axes container returned by plt.subplots
type(axs)

numpy.ndarray

In [24]:
# inspect the first row of the axes grid
axs[0]

array([<matplotlib.axes._subplots.AxesSubplot object at 0x11da27850>,
       <matplotlib.axes._subplots.AxesSubplot object at 0x11da93150>],
      dtype=object)

Another try

In [58]:
import matplotlib.pyplot as plt
import numpy as np

%matplotlib notebook

# 2x2 grid with a shared x-axis; keep the four Axes in a flat list as well
fig, ((ax1, ax2), (ax3, ax4)) = plt.subplots(nrows=2, ncols=2, sharex=True)
axs = [ax1, ax2, ax3, ax4]

# draw 10,000 samples each from the normal, gamma, exponential, and uniform distributions
x1 = np.random.normal(loc=5, scale=1.5, size=10000)
x2 = np.random.gamma(shape=2, scale=1.5, size=10000)
x3 = np.random.exponential(scale=2, size=10000)
x4 = np.random.uniform(low=0, high=10, size=10000)

# one density histogram per subplot, each in its own colour
shades = ('lightblue', 'navajowhite', 'palegreen', 'lightsalmon')
for axes, sample, shade in zip(axs, (x1, x2, x3, x4), shades):
    axes.hist(sample, density=True, bins=20, alpha=1, color=shade)

# the x-axis is shared, so limiting the first subplot limits all of them
axs[0].set_xlim([0, 10])

axs[0].set_title('x1 - Normal')
axs[1].set_title('x2 - Gamma')
axs[2].set_title('x3 - Exponential')
axs[3].set_title('x4 - Uniform')

Traceback (most recent call last):
  File "/opt/anaconda3/lib/python3.7/site-packages/matplotlib/cbook/__init__.py", line 216, in process
    func(*args, **kwargs)
  File "/opt/anaconda3/lib/python3.7/site-packages/matplotlib/animation.py", line 1465, in _stop
    self.event_source.remove_callback(self._loop_delay)
AttributeError: 'NoneType' object has no attribute 'remove_callback'


<IPython.core.display.Javascript object>

Text(0.5, 1.0, 'x4 - Uniform')

In [74]:
import matplotlib.pyplot as plt
import numpy as np
import matplotlib.animation as animation

%matplotlib notebook

# n samples per distribution; n is also the frame at which update() stops the animation
n = 1000
x1 = np.random.normal(loc=-2.5, scale=1, size=n)
x2 = np.random.gamma(shape=2, scale=1.5, size=n)
x3 = np.random.exponential(scale=2, size=n)
x4 = np.random.uniform(low=0, high=10, size=n)

# create the function that will do the plotting, where curr is the current frame
def update(curr):
    """Redraw all four sampling histograms using the first `curr` samples.

    Frame callback for the animation stored in `a`; `curr` is the current
    frame. Reads the notebook globals `axs`, `x1`..`x4`, `n` and `a`.
    """
    # check if the animation is at the last frame, and if so, stop the animation
    if curr == n:
        a.event_source.stop()

    # One entry per subplot: samples, bin edges, axis limits, colour, title prefix.
    # Each panel gets bins over the range its own samples fall in, so that
    # density=True is normalised over (nearly) all samples instead of only
    # the part that happens to fall inside a shared -4..4 range.
    panels = [
        (x1, np.arange(-7, 3.5, 0.5), [-5, 2, 0, 3], 'lightblue', 'Normal'),
        (x2, np.arange(0, 10.5, 0.5), [0, 10, 0, 3], 'navajowhite', 'Gamma'),
        (x3, np.arange(0, 10.5, 0.5), [0, 10, 0, 3], 'palegreen', 'Exponential'),
        (x4, np.arange(0, 10.5, 0.5), [0, 10, 0, 1], 'lightsalmon', 'Uniform'),
    ]

    for ax, (samples, bins, limits, color, name) in zip(axs, panels):
        # clear this Axes explicitly: plt.cla() only clears the current Axes,
        # which left the other panels stacking a new histogram every frame
        ax.cla()
        ax.hist(samples[:curr], density=True, stacked=True, bins=bins, alpha=1, color=color)
        ax.axis(limits)
        ax.set_title('{} n = {}'.format(name, curr))

# lay out a 2x2 grid and keep the four Axes both by name and as a flat list
fig, axes_grid = plt.subplots(nrows=2, ncols=2)
(ax1, ax2), (ax3, ax4) = axes_grid
axs = [ax1, ax2, ax3, ax4]
# extra padding around the subplots
fig.tight_layout(pad=3.0)
# start the animation; the handle is kept in `a` because update() stops it via a.event_source
a = animation.FuncAnimation(fig=fig, func=update, interval=1)

<IPython.core.display.Javascript object>

In [49]:
# fresh 2x2 grid sharing the y-axis; histogram x4 in the last subplot
fig, axes_grid = plt.subplots(nrows=2, ncols=2, sharey=True)
(ax1, ax2), (ax3, ax4) = axes_grid
axs = [ax1, ax2, ax3, ax4]
axs[3].hist(x4, bins=25, alpha=1, color='lightsalmon')

<IPython.core.display.Javascript object>

(array([5., 4., 3., 3., 1., 5., 3., 4., 4., 5., 3., 3., 3., 7., 3., 5., 7.,
        5., 3., 4., 3., 1., 5., 5., 6.]),
 array([14.04228743, 14.27959986, 14.51691229, 14.75422472, 14.99153715,
        15.22884958, 15.46616201, 15.70347444, 15.94078687, 16.1780993 ,
        16.41541173, 16.65272417, 16.8900366 , 17.12734903, 17.36466146,
        17.60197389, 17.83928632, 18.07659875, 18.31391118, 18.55122361,
        18.78853604, 19.02584847, 19.2631609 , 19.50047333, 19.73778576,
        19.97509819]),
 <a list of 25 Patch objects>)