For any random experiment, we try to define a numerical mapping that represents the outcomes of the experiment. For example, when we flip a coin, the outcomes are heads or tails, and we define a mapping $X$ with values in $\{0,1\}$, where $X=0$ if we obtain tails and $X=1$ if we obtain heads.
Such a mapping $X$ is then called a numerical random variable.
Definition A random variable $X$ is a function from the set $\Omega$ of outcomes of the random experiment to a subset of the real numbers: $$X\,:\,\Omega \longrightarrow \mathbb{R}\;\;\; \omega \longmapsto X(\omega)\in \mathbb{R}$$
There are two types of random variables: discrete and continuous. Here are some examples.
We flip a coin and the outcomes are either heads or tails, so the values of $X$ are either $0$ or $1$. $X$ is called a Bernoulli random variable. We will be interested in the probability of observing heads, $\mathbb{P}(X=1)$, and the probability of observing tails, $\mathbb{P}(X=0)$.
If we set $p=\mathbb{P}(X=1)$, we say that $X$ is a Bernoulli random variable with parameter $p$.
When we roll a die, the outcomes are the numbers $1,2,3,4,5,6$. We can then define a random variable $X$ with values in $\{1,2,\ldots,6\}$, where we will be interested in the probabilities: $$\mathbb{P}(X=i)=p_i,\;\;\forall \,i=1,\ldots,6$$
Assume that we are interested in the number of customers arriving at a store during one hour. Let's denote this number by $X$. It is a random number, and it can be any number in the set of integers $\mathbb{N}$.
$X$ is then a discrete random variable with values in $\mathbb{N}$. It can be shown that there exists a positive constant $\lambda>0$ such that for all $n\in \mathbb{N}$, we have $$\mathbb{P}(X=n)=e^{-\lambda} \displaystyle\frac{\lambda^n}{n!}$$
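As a quick sketch of this formula, we can compute these probabilities directly (the rate $\lambda=2$ here is a hypothetical value chosen for illustration):

```python
import math

def poisson_pmf(n, lam):
    # P(X = n) = e^(-lambda) * lambda^n / n!
    return math.exp(-lam) * lam ** n / math.factorial(n)

# hypothetical rate: on average 2 customers per hour
p3 = poisson_pmf(3, 2.0)   # probability of exactly 3 customers in one hour
```

Note that these probabilities sum to $1$ over all $n\in\mathbb{N}$, as required for a probability distribution.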
In this example, we are interested in the lifetime of electronic components. A positive random variable $X$ can represent this random experiment, where the event $\{X>t\}$, for any positive $t$, means that the electronic component is still working after time $t$, and the event $\{X<t\}$ means that the component stopped working before time $t$.
The random variable $X$ is then a continuous random variable, and we will be interested in computing, for any positive numbers $a<b$, the following probability: $$\mathbb{P}(a<X<b)$$
It can be shown that there exists a positive constant $\lambda>0$ such that for all $a<b$: $$\mathbb{P}(a<X<b)=\displaystyle\int_a^b \lambda e^{-\lambda x}dx$$
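This integral has a closed form, $e^{-\lambda a}-e^{-\lambda b}$. A minimal check of that identity, comparing numerical integration against the closed form ($\lambda$, $a$, $b$ are illustrative values):

```python
import math
from scipy import integrate

lam = 0.5        # hypothetical rate constant
a, b = 1.0, 3.0

# numerical integration of the density lambda * e^(-lambda x) over (a, b)
numeric, _ = integrate.quad(lambda x: lam * math.exp(-lam * x), a, b)

# closed form of the same integral: e^(-lambda a) - e^(-lambda b)
closed = math.exp(-lam * a) - math.exp(-lam * b)
```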
Any random variable is characterized by its probability distribution that can be described by the cumulative distribution function (CDF) $F_X$: $$\begin{array}{lll} F_X & : & \mathbb{R} \longrightarrow [0,1] \\ & & t\longmapsto F_X(t)=\mathbb{P}(X\leq t) \end{array}$$
If $X$ is discrete, we define from $F_X$ the probability function: $$\forall\, t\;\; f_X(t)=F_X(t)-\lim_{x\rightarrow t,\, x<t} F_X(x)=\mathbb{P}(X\leq t)-\mathbb{P}(X<t)=\mathbb{P}(X=t)$$
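In other words, $\mathbb{P}(X=t)$ is the size of the jump of $F_X$ at $t$. A minimal check of this, using SciPy's Poisson distribution (the parameter and point are chosen for illustration; for an integer-valued $X$, the left limit $F_X(t^-)$ equals $F_X(t-1)$):

```python
from scipy import stats

X = stats.poisson(1.4)

t = 2
# F(t) - F(t-) = P(X = t); for integer-valued X, F(t-) = F(t - 1)
jump = X.cdf(t) - X.cdf(t - 1)
```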
If $X$ is a continuous random variable, we can define from $F_X$ the probability density function (pdf) $f_X$: it is the derivative of $F_X$, $f_X=F_X'$.
The probability density function can be used to derive the probability that $X$ falls in an interval $(a,b)$: $$\mathbb{P}(X\in (a,b))=\mathbb{P}(a<X<b)=\displaystyle\int_a^b f_X(t)dt$$
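A minimal check of this relation, using the standard normal distribution as an illustrative example: the integral of the density over $(a,b)$ should equal $F_X(b)-F_X(a)$.

```python
from scipy import stats, integrate

X = stats.norm(loc=0, scale=1)   # standard normal, as an example

a, b = -1.0, 1.0
area, _ = integrate.quad(X.pdf, a, b)   # integral of the density over (a, b)
via_cdf = X.cdf(b) - X.cdf(a)           # same probability from the CDF
```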
A random variable is fully determined if we know either its CDF or its PDF. We will also write code that imitates the random experiment providing the outcomes of $X$. We call this process simulating the random variable.
We will now see, with the SciPy library, Python functions that help us compute the CDF and the PDF, and simulate numbers from the probability distribution of a random variable.
We first install SciPy:
!pip install scipy
SciPy is a free and open-source library for scientific computing built on top of NumPy. We have already seen that NumPy can draw samples from many common distributions (type help(np.random)
in the Python interpreter), but SciPy has the added capability of computing the probability of observing events, and it can perform computations directly on the probability mass/density functions.
import numpy as np
from scipy import stats
We define a Bernoulli random variable with parameter $p=0.3$
X= stats.bernoulli(.3)
The Probability function
$\mathbb{P}(X=1)$
X.pmf(1)
0.3
$\mathbb{P}(X=0)$
X.pmf(0)
0.7
For any $x\not \in \{0,1\}$, $\mathbb{P}(X=x)=0$
X.pmf(4)
0.0
X.pmf(-2)
0.0
The cumulative distribution function $F_X(x)=\mathbb{P}(X\leq x)$
X.cdf(-1)
0.0
X.cdf(0)
0.7
X.cdf(0.2)
0.7
X.cdf(1)
1.0
X.cdf(10)
1.0
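The values above trace out the piecewise-constant CDF of a Bernoulli random variable: $0$ for $t<0$, then $1-p$ on $[0,1)$, then $1$ for $t\geq 1$. As a sketch, we can write it down explicitly and compare it with SciPy:

```python
from scipy import stats

def bernoulli_cdf(t, p):
    # piecewise CDF: 0 for t < 0, 1 - p for 0 <= t < 1, 1 for t >= 1
    if t < 0:
        return 0.0
    if t < 1:
        return 1.0 - p
    return 1.0

X = stats.bernoulli(0.3)
```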
Let's draw the CDF of a Bernoulli random variable. We will first generate random numbers in $\mathbb{R}$.
import numpy as np
data = np.random.random(1000)
data[1:10]
array([0.62485778, 0.12170412, 0.25287054, 0.78623599, 0.34879936, 0.74056271, 0.42610447, 0.2546339 , 0.63981476])
data.min()
0.0005284937096231568
data.max()
0.9998493971559735
data = -3*(2*data - 1)   # map values from (0,1) to (-3,3)
data.min()
-2.999096382935841
data.max()
2.996829037742261
data[:8]
array([-2.05663816, -0.74914665, 2.26977529, 1.48277674, -1.71741591, 0.90720382, -1.44337625, 0.4433732 ])
We sort the data
x = np.sort(data)
x[:8]
array([-2.99909638, -2.99394417, -2.97917872, -2.97467941, -2.97431385, -2.97152315, -2.96997004, -2.95919471])
We then calculate the CDF values. We compute here $F_X(x)$ when $X$ follows a Bernoulli distribution with parameter $p=0.4$
import scipy
y = scipy.stats.bernoulli.cdf(x,.4)
import matplotlib.pyplot as plt
plt.step(x, y,'r*', where='post')
plt.xlabel('x')
Text(0.5, 0, 'x')
The mean of $X$, $\mathbb{E}(X)=p$
X.mean()
0.3
The variance of $X$, $\mbox{Var}(X)=p(1-p)$
X.var()
0.21
We can also generate random numbers according to the Bernoulli distribution
X.rvs()
1
X.rvs(20)
array([1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0])
z=X.rvs(100)
z.mean()
0.37
z.var()
0.23309999999999995
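By the law of large numbers, these empirical estimates approach $p$ and $p(1-p)$ as the sample size grows. A sketch with a larger sample (the seed is arbitrary, chosen only for reproducibility):

```python
from scipy import stats

p = 0.3
z = stats.bernoulli(p).rvs(100_000, random_state=0)
phat = z.mean()   # empirical estimate of p = 0.3
vhat = z.var()    # empirical estimate of p * (1 - p) = 0.21
```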
A random variable $X$ with Poisson distribution, with parameter $\lambda>0$, is a discrete random variable with values in $\mathbb{N}$, with probability function: for all $k\in \mathbb{N}$, $$p(k)=\mathbb{P}(X=k)=e^{-\lambda} \displaystyle\frac{\lambda^k}{k!}$$
$\mathbb{E}(X)=\lambda$ and $\mbox{Var}(X)=\lambda$
from scipy import stats
We consider $X$ a random variable with Poisson distribution with parameter $\lambda=1.4$
X= stats.poisson(1.4)
X.pmf(3)
0.11277701150929471
X.pmf(4)
0.039471954028253146
Let's draw the probability function of a Poisson random variable
x=np.arange(0,20)
y = scipy.stats.poisson.pmf(x,1.4)
y
array([2.46596964e-01, 3.45235750e-01, 2.41665025e-01, 1.12777012e-01, 3.94719540e-02, 1.10521471e-02, 2.57883433e-03, 5.15766866e-04, 9.02592015e-05, 1.40403202e-05, 1.96564483e-06, 2.50172979e-07, 2.91868475e-08, 3.14319896e-09, 3.14319896e-10, 2.93365237e-11, 2.56694582e-12, 2.11395538e-13, 1.64418752e-14, 1.21150659e-15])
plt.bar(x, y)
plt.xticks(x)
plt.show()
X.mean()
1.4
X.var()
1.4
Cumulative distribution function
X.cdf(2)
0.8334977381226298
X.cdf(5)
0.9967988507880886
Let's draw the CDF then
data = np.random.random(1000)
data=7*data
x=np.sort(data)
y = scipy.stats.poisson.cdf(x,1.4)
plt.step(x, y,'r*', where='post')
plt.xlabel('x')
Text(0.5, 0, 'x')
Generate Poisson random numbers
X.rvs()
5
X.rvs(20)
array([0, 0, 2, 1, 2, 2, 3, 0, 0, 2, 4, 2, 1, 1, 1, 3, 0, 1, 2, 2])
z=X.rvs(100)
z.mean()
1.47
z.var()
1.5090999999999999
Let's estimate the probability $\mathbb{P}(X<3)$ and compare it with the theoretical value. We will call this an empirical estimate of $\mathbb{P}(X<3)$
z<3
array([False, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, False, True, True, True, True, False, False, True, True, True, True, True, True, True, True, True, False, True, True, False, True, False, True, False, True, True, True, True, False, True, True, True, True, True, True, True, True, False, True, False, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, False, True, True, False, True, True, False, True, True, True, True, True])
zz=z<3
zz.sum()
83
phat=zz.sum()/len(zz)
phat
0.83
The theoretical value is
X.cdf(2.999)
0.8334977381226298
We will now show that the empirical estimate approximates the theoretical probability with good accuracy as the number of generated samples increases
x=np.arange(1,1001)
z=X.rvs(1000)
zz=z<3
phat=zz.cumsum()/x
plt.plot(x, phat)
plt.axhline(y=X.cdf(2.999), color='red', linestyle='--')
plt.xlabel('Number of generations')
Exercise
The following table provides the Python command corresponding to each of these discrete probability distributions
Name | Python command | parameters |
---|---|---|
Geometric $p$ | stats.geom(p) | $p$ is the probability |
Binomial $(n,p)$ | stats.binom(n, p) | $n$ is the size and $p$ is the probability |
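As a starting point for the exercise, here is a minimal sketch of how these commands are used (the parameter values are illustrative):

```python
from scipy import stats

# Geometric(p): number of trials until the first success
G = stats.geom(0.25)
pg = G.pmf(1)            # P(G = 1) = p = 0.25

# Binomial(n, p): number of successes among n independent trials
B = stats.binom(10, 0.5)
pb = B.pmf(5)            # P(B = 5) = C(10, 5) / 2^10
```

Both objects also provide mean(), var(), cdf() and rvs(), exactly as for the Bernoulli and Poisson variables above.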
A random variable $X$ has a Normal distribution if its probability density function is defined as follows: $$f(x)=\displaystyle\frac{1}{\sqrt{2\pi}\,\sigma} \exp\left[ -\frac{1}{2}\left(\displaystyle\frac{x-\mu}{\sigma}\right)^2\right]$$
where $\mu\in \mathbb{R}$ and $\sigma>0$.
$X$ is a continuous random variable with values in $\mathbb{R}$. We write $X\sim \mathcal{N}(\mu,\sigma^2)$.
$\mathbb{E}(X)=\mu$ and $\mbox{Var}(X)=\sigma^2$
$\mathbb{P}\left(\mu-1.96\sigma \leq X\leq \mu+1.96\sigma\right)=.95$
$Z=\displaystyle\frac{X-\mu}{\sigma}$ follows the Normal distribution $\mathcal{N}(0,1)$.
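A minimal numerical check of this standardization property, with illustrative parameters $\mu=1.4$ and $\sigma=2$: $\mathbb{P}(X\leq t)$ should equal $\mathbb{P}(Z\leq (t-\mu)/\sigma)$ for the standard normal $Z$.

```python
from scipy import stats

mu, sigma = 1.4, 2.0
X = stats.norm(loc=mu, scale=sigma)
Z = stats.norm(0, 1)

t = 3.0
lhs = X.cdf(t)                   # P(X <= t)
rhs = Z.cdf((t - mu) / sigma)    # P(Z <= (t - mu)/sigma)
```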
We consider a Normal random variable with mean $\mu=1.4$ and variance $\sigma^2=2^2=4$
import math
from scipy import stats
X= stats.norm(loc=1.4,scale=2)
X.cdf(3)
0.7881446014166034
X.mean()
1.4
X.var()
4.0
X.pdf(3)
0.14484577638074136
X.pdf(1.4)
0.19947114020071635
1/math.sqrt(2*math.pi*4)
0.19947114020071635
X.cdf(-10)
5.99037140106353e-09
X.cdf(0)
0.24196365222307303
X.cdf(1.4)
0.5
X.cdf(1.4-1.96*2).round(3)
0.025
X.cdf(1.4+1.96*2).round(3)
0.975
X.rvs()
-1.4972065404834658
data = X.rvs(1000)
import numpy as np
data = np.random.normal(size=1000,loc=0,scale=2)
x = np.sort(data)
x[0:8]
array([-7.00527363, -6.40776959, -5.53323088, -5.22003149, -5.07977012, -4.95514965, -4.87125955, -4.83750203])
import scipy
y = scipy.stats.norm.cdf(x,1.4,2)
y[0:8]
array([1.31911847e-05, 4.73304266e-05, 2.63527680e-04, 4.66453618e-04, 5.97889450e-04, 7.42561820e-04, 8.57427691e-04, 9.08096829e-04])
import matplotlib.pyplot as plt
plt.step(x, y)
plt.xlabel('x')
plt.ylabel('CDF of X')
Text(0, 0.5, 'CDF of X')
A random variable $X$ has an Exponential distribution if its probability density function is defined as follows: $$f(x)=(1/\lambda)\, \exp\left(-x/\lambda \right),$$ if $x\geq 0$, and $f(x)=0$ if $x< 0$, where $\lambda>0$ is called the scale parameter.
$X$ is a continuous random variable with values in $\mathbb{R}^*_+$. We write $X\sim \mathcal{E}(\lambda)$.
$\mathbb{E}(X)=\lambda$ and $\mbox{Var}(X)=\lambda^2$.
import math
from scipy import stats
X= stats.expon(scale=2.2)
X.mean()
2.2
X.var()
4.840000000000001
2.2**2
4.840000000000001
X.pdf(2)
0.1831319643314241
X.pdf(-1)
0.0
The cumulative distribution function of an exponential random variable is expressed as following: $$F_X(x)=1-e^{-x/\lambda}$$ when $x>0$ and $F_X(x)=0$, when $x\leq 0$.
X.cdf(3)
0.7442708400868994
1-math.exp(-3/2.2)
0.7442708400868994
math.exp(0)
1.0
X.pdf(0)
0.45454545454545453
1/2.2
0.45454545454545453
X.pdf(3)
0.11624052723322756
(1/2.2)*math.exp(-3/2.2)
0.11624052723322756
X.rvs()
2.2496880342664096
Let's draw the curve of the CDF of $X$
import numpy as np
We simulate 1000 random numbers from a Normal distribution with mean $\mu=0$ and standard deviation $\sigma=20$.
data = np.random.normal(size=1000,loc=0,scale=20)
x=np.sort(data)
x.min()
-56.402034243025184
x.max()
58.70478274607458
We compute the CDF of each element in x
y = scipy.stats.expon.cdf(x,scale=2.2)
import matplotlib.pyplot as plt
plt.step(x, y)
plt.xlabel('x')
plt.ylabel('CDF of X')
Text(0, 0.5, 'CDF of X')