# Practice Assignment: Understanding Distributions Through Sampling

***This assignment is optional, and I encourage you to share your solutions with me and your peers in the discussion forums!***


To complete this assignment, create a code cell that:
* Creates a number of subplots using the `pyplot subplots` or `matplotlib gridspec` functionality.
* Creates an animation, pulling between 100 and 1000 samples from each of the random variables (`x1`, `x2`, `x3`, `x4`) for each plot and plotting this as we did in the lecture on animation.
* **Bonus:** Go above and beyond and "wow" your classmates (and me!) by looking into matplotlib widgets and adding a widget which allows for parameterization of the distributions behind the sampling animations.


Tips:
* Before you start, think about the different ways you can create this visualization to be as interesting and effective as possible.
* Take a look at the histograms below to get an idea of what the random variables look like, as well as their positioning with respect to one another. This is just a guide, so be creative in how you lay things out!
* Try to keep the length of your animation reasonable (roughly between 10 and 30 seconds).

In [17]:
import matplotlib.pyplot as plt
import numpy as np

%matplotlib notebook

# generate 4 random variables from the normal, gamma, exponential, and uniform distributions
x1 = np.random.normal(-2.5, 1, 10000)
x2 = np.random.gamma(2, 1.5, 10000)
x3 = np.random.exponential(2, 10000)+7
x4 = np.random.uniform(14,20, 10000)

# plot the four histograms on one shared set of axes
# density=True replaces normed=True, which was deprecated in Matplotlib 2.1
# and removed in 3.1; both normalise each histogram to unit area.
fig_1 = plt.figure(figsize=(9,3))
plt.hist(x1, density=True, bins=20, alpha=0.3)
plt.hist(x2, density=True, bins=20, alpha=0.4)
plt.hist(x3, density=True, bins=20, alpha=0.5)
plt.hist(x4, density=True, bins=20, alpha=0.6)
plt.axis([-7,21,0,0.6])

# label each distribution slightly to the left of its sample mean
plt.text(x1.mean()-1.5, 0.5, 'x1\nNormal')
plt.text(x2.mean()-1.5, 0.5, 'x2\nGamma')
plt.text(x3.mean()-1.5, 0.5, 'x3\nExponential')
plt.text(x4.mean()-1.5, 0.5, 'x4\nUniform')

<IPython.core.display.Javascript object>

<matplotlib.text.Text at 0x1139a02b0>

In [18]:
fig_2 = plt.figure(figsize=(7,5))

# generate 4 random variables from the normal, gamma, exponential, and uniform distributions
x1 = np.random.normal(-2.5, 1, 10000)
x2 = np.random.gamma(2, 1.5, 10000)
x3 = np.random.exponential(2, 10000)+7
x4 = np.random.uniform(14,20, 10000)

# plot one histogram per panel of a 2x2 grid; every panel shares the y-axis
# of the first so the densities are directly comparable.
# density=True replaces normed=True, which was deprecated in Matplotlib 2.1
# and removed in 3.1.
ax1 = plt.subplot(2, 2, 1)
plt.hist(x1, density=True, bins=20, alpha=0.4, color='blue')
plt.subplot(2, 2, 2, sharey=ax1)
plt.hist(x2, density=True, bins=20, alpha=0.4, color='orange')
plt.subplot(2, 2, 3, sharey=ax1)
plt.hist(x3, density=True, bins=20, alpha=0.4, color='green')
plt.subplot(2, 2, 4, sharey=ax1)
plt.hist(x4, density=True, bins=20, alpha=0.4, color='red')

<IPython.core.display.Javascript object>

(array([0.17002396, 0.17235762, 0.16535664, 0.1660234 , 0.16802368,
        0.16669016, 0.16702354, 0.17502467, 0.16235621, 0.14968776,
        0.17935861, 0.18202565, 0.1506879 , 0.15802227, 0.15835565,
        0.16969058, 0.17202424, 0.16535664, 0.1693572 , 0.16635678]),
 array([14.00028572, 14.30024344, 14.60020116, 14.90015888, 15.2001166 ,
        15.50007432, 15.80003204, 16.09998976, 16.39994748, 16.69990521,
        16.99986293, 17.29982065, 17.59977837, 17.89973609, 18.19969381,
        18.49965153, 18.79960925, 19.09956697, 19.39952469, 19.69948242,
        19.99944014]),
 <a list of 20 Patch objects>)

- **Creates a number of subplots using the pyplot subplots or matplotlib gridspec functionality.**

In [19]:
import matplotlib.gridspec as gridspec
# gridspec?
# Lay out a 2x2 grid of axes on a new figure; the three remaining panels
# share their y-axis with the top-left one.
fig_3 = plt.figure()
gspec = gridspec.GridSpec(nrows=2, ncols=2)

top_left = plt.subplot(gspec[0, 0])
top_right, lower_left, lower_right = (
    plt.subplot(gspec[row, col], sharey=top_left)
    for row, col in ((0, 1), (1, 0), (1, 1))
)

<IPython.core.display.Javascript object>

In [20]:
# generate 4 random variables from the normal, gamma, exponential, and uniform distributions
x1 = np.random.normal(-2.5, 1, 10000)
x2 = np.random.gamma(2, 1.5, 10000)
x3 = np.random.exponential(2, 10000)+7
x4 = np.random.uniform(14,20, 10000)

# draw one normalised histogram on each of the four GridSpec axes
# density=True replaces normed=True, which was deprecated in Matplotlib 2.1
# and removed in 3.1.
top_left.hist(x1, density=True, bins=20, alpha=0.4, color='blue')
top_right.hist(x2, density=True, bins=20, alpha=0.4, color='orange')
lower_left.hist(x3, density=True, bins=20, alpha=0.4, color='green')
lower_right.hist(x4, density=True, bins=20, alpha=0.4, color='red')

(array([0.16003895, 0.17937699, 0.17770991, 0.17770991, 0.15803846,
        0.16003895, 0.16403992, 0.16704065, 0.17370894, 0.16970797,
        0.15537114, 0.1473692 , 0.16203943, 0.15370407, 0.16203943,
        0.1820443 , 0.16737407, 0.17637626, 0.16870772, 0.17170845]),
 array([14.00105852, 14.30098552, 14.60091251, 14.9008395 , 15.20076649,
        15.50069349, 15.80062048, 16.10054747, 16.40047446, 16.70040146,
        17.00032845, 17.30025544, 17.60018243, 17.90010943, 18.20003642,
        18.49996341, 18.7998904 , 19.0998174 , 19.39974439, 19.69967138,
        19.99959837]),
 <a list of 20 Patch objects>)

- **Creates an animation, pulling between 100 and 1000 samples from each of the random variables (x1, x2, x3, x4) for each plot and plotting this as we did in the lecture on animation.**

In [8]:
import matplotlib.animation as animation

In [1]:
# Number of samples to animate: a random integer chosen with 100 <= n < 1000.
n = np.random.randint(low=100, high=1000)
print(n)

# NOTE: the lecture example sampled a single array, x = np.random.randn(n);
# here the existing x1, x2, x3 and x4 are used instead.

# create the function that will do the plotting, where curr is the current frame
def update(curr):
    """Redraw all four sampling histograms for animation frame ``curr``.

    Intended as the frame callback passed to ``FuncAnimation``. Each panel
    shows a histogram of the first ``curr`` samples of its random variable.

    Relies on these module-level names: ``n`` (the frame at which to stop),
    ``a`` (the running animation), the axes ``top_left``, ``top_right``,
    ``lower_left`` and ``lower_right``, and the sample arrays ``x1``..``x4``.

    Parameters
    ----------
    curr : int
        Current frame number, used as the number of samples to plot.
    """
    # Stop the animation once the last frame has been reached.
    if curr == n:
        a.event_source.stop()

    bins = 20
    panels = (
        (top_left, x1, 'Normal'),
        (top_right, x2, 'Gamma'),
        (lower_left, x3, 'Exponential'),
        (lower_right, x4, 'Uniform'),
    )
    for ax, samples, dist_name in panels:
        # Clear every axes explicitly. plt.cla() only clears the current
        # one, which left the other panels stacking a new set of bars on
        # top of the old ones at every frame.
        ax.cla()
        ax.hist(samples[:curr], bins=bins)
        # No fixed limits: the lecture's [-4, 4, 0, 30] window only suits a
        # standard normal and would hide most of x2, x3 and x4.
        ax.set_title('Sampling the {} Distribution'.format(dist_name))
        ax.set_ylabel('Frequency')
        ax.set_xlabel('Value')
        # Axes-fraction coordinates keep the counter in the same corner of
        # each panel regardless of that panel's data range.
        ax.annotate('n = {}'.format(curr), xy=(0.7, 0.85),
                    xycoords='axes fraction')

NameError: name 'np' is not defined

In [25]:
# Animate fig_3 by calling update every 100 ms. The result is bound to `a`
# because update() stops the animation through a.event_source.
a = animation.FuncAnimation(fig=fig_3, func=update, interval=100)

In [54]:
# Reference the three figures created in the earlier cells.
# NOTE(review): a notebook cell normally echoes only its last expression, so
# presumably just fig_3 is displayed here — confirm, or use display(...) on
# each figure if all three are wanted.
fig_1
fig_2
fig_3

<IPython.core.display.Javascript object>