# Practice Assignment: Understanding Distributions Through Sampling

** *This assignment is optional, and I encourage you to share your solutions with me and your peers in the discussion forums!* **


To complete this assignment, create a code cell that:
* Creates a number of subplots using the `pyplot subplots` or `matplotlib gridspec` functionality.
* Creates an animation, pulling between 100 and 1000 samples from each of the random variables (`x1`, `x2`, `x3`, `x4`) for each plot and plotting this as we did in the lecture on animation.
* **Bonus:** Go above and beyond and "wow" your classmates (and me!) by looking into matplotlib widgets and adding a widget which allows for parameterization of the distributions behind the sampling animations.


Tips:
* Before you start, think about the different ways you can create this visualization to be as interesting and effective as possible.
* Take a look at the histograms below to get an idea of what the random variables look like, as well as their positioning with respect to one another. This is just a guide, so be creative in how you lay things out!
* Try to keep the length of your animation reasonable (roughly between 10 and 30 seconds).

In [1]:
import matplotlib.pyplot as plt
import numpy as np

%matplotlib notebook

# Draw 10,000 samples from each of four distributions: normal, gamma,
# exponential (shifted right by 7), and uniform.
x1 = np.random.normal(-2.5, 1, 10000)
x2 = np.random.gamma(2, 1.5, 10000)
x3 = np.random.exponential(2, 10000)+7
x4 = np.random.uniform(14,20, 10000)

# Plot the four histograms on one shared set of axes.
plt.figure(figsize=(9,3))
# `density=True` replaces the `normed=True` keyword, which current matplotlib
# releases no longer accept.
plt.hist(x1, density=True, bins=20, alpha=0.5)
plt.hist(x2, density=True, bins=20, alpha=0.5)
plt.hist(x3, density=True, bins=20, alpha=0.5)
plt.hist(x4, density=True, bins=20, alpha=0.5)
plt.axis([-7,21,0,0.6])

# Label each histogram slightly to the left of its sample mean.
plt.text(x1.mean()-1.5, 0.5, 'x1\nNormal')
plt.text(x2.mean()-1.5, 0.5, 'x2\nGamma')
plt.text(x3.mean()-1.5, 0.5, 'x3\nExponential')
plt.text(x4.mean()-1.5, 0.5, 'x4\nUniform')

<IPython.core.display.Javascript object>

<matplotlib.text.Text at 0x7fb9e852c860>

# Research Code

The following code was used to research the method of implementing the required function, it should be noted that the answer to the assignment question is at the bottom of the notebook

In [2]:
import matplotlib.pyplot as plt
import matplotlib.gridspec as gridspec
import pandas as pd
import mpl_toolkits.axes_grid1.inset_locator as mpl_il
import matplotlib.animation as animation


In [3]:
# Plot a histogram of each distribution (x1..x4) in its own subplot.
plt.figure(figsize=(10,3))
# Grid of 1 row and 4 columns; the third argument selects the current subplot.
# `density=True` replaces the `normed=True` keyword, which current matplotlib
# releases no longer accept.
plt.subplot(1, 4, 1)
plt.hist(x1, density=True, bins=20, alpha=0.5, color = "#75bbfd")
plt.axis([-7,1,0,0.6])
plt.title("Normal (x1)")

plt.subplot(1, 4, 2)
plt.hist(x2, density=True, bins=20, alpha=0.5, color = "#ff796c")
plt.axis([-1,14,0,0.6])
plt.title("Gamma (x2)")

plt.subplot(1, 4, 3)
plt.hist(x3, density=True, bins=20, alpha=0.5, color = "#c0737a")
plt.axis([5,21,0,0.6])
plt.title("Exponential (x3)")

plt.subplot(1, 4, 4)
plt.hist(x4, density=True, bins=20, alpha=0.5, color = "#88b378")
plt.axis([13,21,0,0.6])
plt.title("Uniform (x4)")



<IPython.core.display.Javascript object>

<matplotlib.text.Text at 0x7fb9ba3c4a20>

In [40]:
import matplotlib.animation as animation

def update_hist_normal(curr):
    """Redraw the histogram of the first `curr` samples of `x1` on the current axes.

    Intended as the per-frame callback of a `FuncAnimation`; `curr` is the
    frame number supplied by the animation.

    Reads the notebook-level names `x1`, `n` and `a`. When `curr` equals `n`
    the animation bound to `a` is stopped.
    NOTE(review): `n` is not assigned in any visible cell -- confirm it is
    defined before the animation starts.
    """
    # check if animation is at the last frame, and if so, stop the animation a
    if curr == n:
        a.event_source.stop()
    plt.cla()
    plt.hist(x1[:curr], bins=20, alpha=0.5, color="#75bbfd")
    plt.axis([-7, 1, 0, 20])
    plt.gca().set_title('Normal (x1)')
    # Place the sample counter in axes-fraction coordinates. The previous
    # data-coordinate position [3, 27] lay outside the axis limits set above,
    # so the label was never visible.
    plt.annotate('n = {}'.format(curr), xy=(0.05, 0.9), xycoords='axes fraction')

In [41]:
# Open a fresh figure and animate the x1 histogram with a 100 ms frame interval.
# The animation is bound to `a` because update_hist_normal stops it via that name.
fig = plt.figure()
a = animation.FuncAnimation(fig=fig, func=update_hist_normal, interval=100)

<IPython.core.display.Javascript object>

In [42]:
def update_hist_gamma(curr):
    """Redraw the histogram of the first `curr` samples of `x2` on the current axes.

    Intended as the per-frame callback of a `FuncAnimation`; `curr` is the
    frame number supplied by the animation.

    Reads the notebook-level names `x2`, `n` and `a`. When `curr` equals `n`
    the animation bound to `a` is stopped.
    NOTE(review): `n` is not assigned in any visible cell -- confirm it is
    defined before the animation starts.
    """
    # check if animation is at the last frame, and if so, stop the animation a
    if curr == n:
        a.event_source.stop()
    plt.cla()
    plt.hist(x2[:curr], bins=20, alpha=0.5, color="#ff796c")
    plt.axis([-1, 14, 0, 20])
    plt.gca().set_title('Gamma (x2)')
    # Place the sample counter in axes-fraction coordinates. The previous
    # data-coordinate position [3, 27] was above the y-limit of 20 set above,
    # so the label was never visible.
    plt.annotate('n = {}'.format(curr), xy=(0.05, 0.9), xycoords='axes fraction')


In [43]:
# Open a fresh figure and animate the x2 histogram with a 100 ms frame interval.
# The animation is bound to `a` because update_hist_gamma stops it via that name.
fig1 = plt.figure()
a = animation.FuncAnimation(fig=fig1, func=update_hist_gamma, interval=100)

<IPython.core.display.Javascript object>

In [44]:
def update_hist_exp(curr):
    """Redraw the histogram of the first `curr` samples of `x3` on the current axes.

    Intended as the per-frame callback of a `FuncAnimation`; `curr` is the
    frame number supplied by the animation.

    Reads the notebook-level names `x3`, `n` and `a`. When `curr` equals `n`
    the animation bound to `a` is stopped.
    NOTE(review): `n` is not assigned in any visible cell -- confirm it is
    defined before the animation starts.
    """
    # check if animation is at the last frame, and if so, stop the animation a
    if curr == n:
        a.event_source.stop()
    plt.cla()
    plt.hist(x3[:curr], bins=20, alpha=0.5, color="#c0737a")
    plt.axis([5, 21, 0, 20])
    plt.gca().set_title('Exponential (x3)')
    # Place the sample counter in axes-fraction coordinates. The previous
    # data-coordinate position [3, 27] lay outside the axis limits set above,
    # so the label was never visible.
    plt.annotate('n = {}'.format(curr), xy=(0.05, 0.9), xycoords='axes fraction')



In [45]:
# Open a fresh figure and animate the x3 histogram with a 100 ms frame interval.
# The animation is bound to `a` because update_hist_exp stops it via that name.
fig1 = plt.figure()
a = animation.FuncAnimation(fig=fig1, func=update_hist_exp, interval=100)

<IPython.core.display.Javascript object>

In [48]:
def update_hist_uni(curr):
    """Redraw the histogram of the first `curr` samples of `x4` on the current axes.

    Intended as the per-frame callback of a `FuncAnimation`; `curr` is the
    frame number supplied by the animation.

    Reads the notebook-level names `x4`, `n` and `a`. When `curr` equals `n`
    the animation bound to `a` is stopped.
    NOTE(review): `n` is not assigned in any visible cell -- confirm it is
    defined before the animation starts.
    """
    # check if animation is at the last frame, and if so, stop the animation a
    if curr == n:
        a.event_source.stop()
    plt.cla()
    plt.hist(x4[:curr], bins=20, alpha=0.5, color="#88b378")
    plt.axis([13, 21, 0, 20])
    plt.gca().set_title('Uniform (x4)')
    # Place the sample counter in axes-fraction coordinates. The previous
    # data-coordinate position [3, 27] lay outside the axis limits set above,
    # so the label was never visible.
    plt.annotate('n = {}'.format(curr), xy=(0.05, 0.9), xycoords='axes fraction')




In [49]:
# Open a fresh figure and animate the x4 histogram with a 100 ms frame interval.
# The animation is bound to `a` because update_hist_uni stops it via that name.
fig1 = plt.figure()
a = animation.FuncAnimation(fig=fig1, func=update_hist_uni, interval=100)

<IPython.core.display.Javascript object>

# The Assignment code

The following function implements the following set of requirements 

1. Creates a number of subplots using the pyplot subplots or matplotlib gridspec functionality.
2. Creates an animation, pulling between 100 and 1000 samples from each of the random variables (x1, x2, x3, x4) for each plot and plotting this as we did in the lecture on animation.


In [81]:
#Now function for multiple plots
def update_hist(curr):
    """Redraw all four sample histograms for animation frame `curr`.

    Each panel of a 2x2 subplot grid shows the first `curr` samples of one of
    `x1`..`x4`. Intended as the per-frame callback of a `FuncAnimation`.

    Reads the notebook-level names `x1`, `x2`, `x3`, `x4`, `n` and `a`. When
    `curr` equals `n` the animation bound to `a` is stopped.
    NOTE(review): `n` is not assigned in any visible cell -- confirm it is
    defined before the animation starts.
    """
    if curr == n:
        a.event_source.stop()

    # (samples, title, bar colour, axis limits) for each panel, in grid order.
    panels = [
        (x1, 'Normal (x1)', "#75bbfd", [-7, 1, 0, 10]),
        (x2, 'Gamma (x2)', "#ff796c", [-1, 14, 0, 10]),
        (x3, 'Exponential (x3)', "#c0737a", [5, 21, 0, 10]),
        (x4, 'Uniform (x4)', "#88b378", [13, 21, 0, 10]),
    ]
    for position, (samples, title, colour, limits) in enumerate(panels, start=1):
        plt.subplot(2, 2, position)
        # Clear the panel only after selecting it. A single cla() at the top of
        # the function clears just whichever axes is current, so the other
        # panels would pile up a new set of bars on every frame.
        plt.cla()
        plt.hist(samples[:curr], bins=20, alpha=0.5, color=colour)
        plt.axis(limits)
        plt.gca().set_title(title)

        

The following function call produces the required output

In [82]:
# Open a 10x8 figure and animate all four histograms with a 1000 ms frame interval.
# The animation is bound to `a` because update_hist stops it via that name.
my_fig = plt.figure(figsize=(10, 8))
a = animation.FuncAnimation(fig=my_fig, func=update_hist, interval=1000)

<IPython.core.display.Javascript object>