# The Poisson distribution - discrete (counting events)

In [2]:
# Events appear to happen at a certain average rate, but
# completely at random

# ** Number of animals adopted per week
# ** Number of people arriving at a restaurant per hour

# or --
# How likely it is for a certain number of events to happen within a 
# fixed amount of time or space, given the average rate at which those events occur
# It's commonly used in situations where events happen randomly and independently of each other.

In [None]:
# Helps you predict the likelihood of seeing different numbers
# of cars in any given hour, like 5 cars, 10 cars, or 15 cars.

# Probability of >= 5 animals adopted per week

In [3]:
# The Poisson distribution - is described by "Lambda"
# "Lambda" - average number of events per time interval
# This is also the expected value of the distribution

![image.png](attachment:image.png)

In [12]:
# Probability of a single value and of ranges of values
# poisson.pmf / poisson.cdf take (k, mu): k is the event count and
# mu is lambda, the average number of events per interval.
# Only the last expression's value is echoed when this runs as one cell.
from scipy.stats import poisson

# Avg number of adoptions per week is 8

# 1. What is Probability(of exactly 5 adoptions per week)?
poisson.pmf(5, 8) #9%

# 2. What is Probability(of 5 or fewer adoptions per week)?
poisson.cdf(5, 8) #19%

# 3. What is Probability(of more than 5 adoptions per week)?
# cdf(5, 8) already includes k = 5, so its complement is P(X > 5),
# i.e. 6 or more. "5 or more" would be 1 - poisson.cdf(4, 8), roughly 90%.
1 - poisson.cdf(5, 8) #81%

0.8087639379203747

In [13]:
# Sampling from a Poisson distribution - just like other distributions

# poisson.rvs(avg, size = n) draws n random counts from a Poisson
# distribution whose average (lambda) is avg
poisson.rvs(8, size = 10) # simulate 10 different weeks, each drawn with an average of 8 events

array([ 9,  8,  5,  9,  7,  8, 10,  4, 10, 10], dtype=int64)

In [None]:
# The CLT still applies !!!

# The Exponential Distribution - continuous

In [None]:
# Probability of time between Poisson events
# The exponential distribution describes the time it takes for something to happen. 
# It's often used when events happen randomly, but on average, at a constant rate.

# ** Probability of  > 1 day between adoptions
# ** Probability of  < 10min between restaurant arrivals
# ** Probability of 1 bus between 20 minutes

# ** Amount of time until the next customer makes a purchase
# ** Amount of time until someone pays off their loan

![image.png](attachment:image.png)

In [19]:
# Expected value

# In terms of rate:
# lambda = 0.5 requests per minute

# In terms of time between events:
# 1/lambda = 1/0.5 = 2 minutes between requests

In [18]:
# How long until a new request is created?
# expon is parameterised by scale = 1/lambda, the mean time between
# events; scale = 2 means 2 minutes between requests on average.
# Only the last expression's value is echoed when this runs as one cell.
from scipy.stats import expon

# Probability of waiting less than 1 minute
expon.cdf(1, scale = 2) #39%

# Probability of waiting more than 4 minutes
# (complement of "4 minutes or less")
1 - expon.cdf(4, scale = 2) #14%

# Probability of waiting 1-4 minutes
# (difference of the two cumulative probabilities)
expon.cdf(4, scale = 2) - expon.cdf(1, scale = 2) #47%

0.4711953764760207

# Student's t-distribution - continuous

In [1]:
# Has similar shape to The Normal distribution, but the t-distribution's
# tails are thicker. Which means that in a t-distribution, observations
# are more likely to fall further from the mean

![image.png](attachment:image.png)

In [20]:
# Degrees of freedom - parameter of t-distribution, which affects
# the thickness of the tails

# *lower degrees of freedom -- thicker tails, higher standard deviation
# *higher degrees of freedom -- closer to normal distribution

# Log-normal distribution - continuous

In [None]:
# Variables that follow a log-normal distribution
# have a logarithm that is normally distributed

# *Results in distributions that are skewed

# ** Length of chess games
# ** Adult blood pressure

![image.png](attachment:image.png)