Looking back: a review¶

Fall 2022: Peter Ralph

https://uodsci.github.io/dsci345

Distribution roundup¶

  • Bernoulli: $X \in \{0, 1\}$ and $X = 1$ with probability $p$: (flipping coins; random trials)

      rng.random() < p
  • Binomial: $0 \le X \le n$: (number of successes in $n$ independent trials if the probability of success is $p$)

      rng.binomial(n=n, p=p)
  • Normal: $- \infty < X < \infty$, has mean $\mu$ and SD $\sigma$: (sums of many independent things of similar size)

      rng.normal(loc=mu, scale=sigma)
  • Poisson: $X \in \{0, 1, 2, 3, \ldots\}$: (number of rare events)

      rng.poisson(lam=mu)
  • Exponential: $X \ge 0$, and $\P\{X > x\} = \exp(-x/\theta)$, so the mean is $\theta$: (waiting times, distributions piled up near zero)

      rng.exponential(scale=theta)
  • Gamma: $X \ge 0$; with $\text{shape}=k$ and $\text{scale}=\theta$ it is the sum of $k$ independent Exponentials with scale $\theta$: (waiting times, nonnegative numbers)

      rng.gamma(shape=k, scale=theta)
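
These snippets assume a numpy random Generator named rng; a minimal setup (the parameter values below are arbitrary examples, not from the course):

    import numpy as np

    rng = np.random.default_rng()

    p, n, mu, sigma, k, theta = 0.5, 10, 2.0, 1.5, 3, 2.0
    rng.random() < p                  # Bernoulli(p)
    rng.binomial(n=n, p=p)            # Binomial(n, p)
    rng.normal(loc=mu, scale=sigma)   # Normal(mu, sigma)
    rng.poisson(lam=mu)               # Poisson with mean mu
    rng.exponential(scale=theta)      # Exponential with mean theta
    rng.gamma(shape=k, scale=theta)   # Gamma(shape k, scale theta)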

On computation¶

For continuous distributions, the probability density function (pdf):

from scipy.stats import norm
norm.pdf( )

For discrete distributions, the probability mass function (pmf):

from scipy.stats import binom
binom.pmf( )

For either, the cumulative distribution function (cdf):

norm.cdf( )
binom.cdf( )
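
For example (a minimal sketch; the argument values are arbitrary):

    from scipy.stats import norm, binom

    norm.pdf(0.0, loc=0, scale=1)   # density of Normal(0, 1) at 0: ~0.399
    binom.pmf(3, n=10, p=0.5)       # P{Binomial(10, 0.5) = 3}: ~0.117
    norm.cdf(1.96)                  # P{Normal(0, 1) <= 1.96}: ~0.975
    binom.cdf(3, n=10, p=0.5)       # P{Binomial(10, 0.5) <= 3}: ~0.172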

Mathematics of probability¶

Probability can be thought of as relative area, and so:

  1. Probabilities are proportions: $\hspace{2em} 0 \le \P\{A\} \le 1$

  2. Everything: $\hspace{2em} \P\{ \Omega \} = 1$

  3. Complements: $\hspace{2em} \P\{ \text{not } A\} = 1 - \P\{A\}$

  4. Disjoint events: If $\hspace{2em} \P\{A \text{ and } B\} = 0$ then $\hspace{2em} \P\{A \text{ or } B\} = \P\{A\} + \P\{B\}$.

  5. Independence: $A$ and $B$ are independent iff $\P\{A \text{ and } B\} = \P\{A\} \P\{B\}$.

  6. Conditional probability: $$\P\{A \;|\; B\} = \frac{\P\{A \text{ and } B\}}{ \P\{B\} }$$

Bayes' rule¶

A consequence is that

$$\P\{B \;|\; A\} = \frac{\P\{B\} \P\{A \;|\; B\}}{ \P\{A\} } .$$
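
For instance, a quick numeric check with made-up numbers (a 1% base rate for $B$, a 95% chance of $A$ given $B$, and a 5% chance of $A$ given not $B$; these numbers are hypothetical):

    p_B = 0.01             # P{B}: base rate
    p_A_given_B = 0.95     # P{A | B}
    p_A_given_notB = 0.05  # P{A | not B}

    # P{A}, by the law of total probability
    p_A = p_B * p_A_given_B + (1 - p_B) * p_A_given_notB
    # Bayes' rule
    p_B_given_A = p_B * p_A_given_B / p_A
    print(p_B_given_A)     # ~0.161: most occurrences of A come from "not B"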

Random variables¶

The mean of $X$ is $$ \E[X] = \sum_x x \P\{X = x\}, $$ or, if $X$ has probability density $f_X(x)$, $$ \E[X] = \int x f_X(x) dx . $$

The variance of $X$ is the square of its standard deviation, $\var[X] = \sd[X]^2$, and satisfies $$ \var[X] = \E[X^2] - \E[X]^2 .$$

It is always true that $$ \E[X + Y] = \E[X] + \E[Y] .$$

If $X$ and $Y$ are independent then $$ \var[X + Y] = \var[X] + \var[Y] . $$
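
A simulation sanity check of both rules (a sketch; the distributions are chosen arbitrarily):

    import numpy as np

    rng = np.random.default_rng()
    X = rng.exponential(scale=2.0, size=100_000)      # mean 2, variance 4
    Y = rng.normal(loc=1.0, scale=3.0, size=100_000)  # mean 1, variance 9; independent of X

    print(np.mean(X + Y), np.mean(X) + np.mean(Y))    # both ~3
    print(np.var(X + Y), np.var(X) + np.var(Y))       # both ~13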

Poisson limits¶

If we have a large number of almost independent trials, each with a small chance of success, then

  • the total number of successes is Poisson, and
  • the time$^*$ between successes is Exponential.

$^*$ measured in suitable units
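
For example, a sketch comparing the count of successes in many low-probability trials to the Poisson (parameter values arbitrary):

    import numpy as np

    rng = np.random.default_rng()
    n, lam = 10_000, 3.0
    # number of successes in n trials, each with probability lam/n
    successes = rng.binomial(n=n, p=lam / n, size=100_000)
    pois = rng.poisson(lam=lam, size=100_000)
    print(np.mean(successes), np.mean(pois))  # both ~3
    print(np.var(successes), np.var(pois))    # both ~3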

Central limits¶

If $X_1, \ldots, X_n$ are independent with mean $\mu$ and SD $\sigma$ then $$ \frac{1}{n} \left( X_1 + \cdots + X_n \right) \approx \text{Normal}(\mu, \sigma/\sqrt{n}) . $$
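
A simulation sketch (using Exponentials, whose mean and SD are both 2; the values are arbitrary):

    import numpy as np

    rng = np.random.default_rng()
    n, mu, sigma = 100, 2.0, 2.0
    # 100,000 sample means, each of n iid Exponential(scale=2) draws
    means = rng.exponential(scale=mu, size=(100_000, n)).mean(axis=1)
    print(np.mean(means), mu)                 # ~2.0
    print(np.std(means), sigma / np.sqrt(n))  # ~0.2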

Facts about Normals¶

  1. If $a$ and $b$ are numbers and $X \sim \text{Normal}(\mu, \sigma)$ then $$ aX + b \sim \text{Normal}(a \mu + b, |a|\sigma) . $$

  2. If $X \sim \text{Normal}(\mu_X, \sigma_X)$ and $Y \sim \text{Normal}(\mu_Y, \sigma_Y)$ are independent then $$ X + Y \sim \text{Normal}(\mu_X + \mu_Y, \sqrt{\sigma_X^2 + \sigma_Y^2}) . $$
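
Both facts are easy to check by simulation, e.g. (a sketch with arbitrary choices of $a$, $b$, $\mu$, and $\sigma$):

    import numpy as np

    rng = np.random.default_rng()
    # fact 1: aX + b, with a = 2, b = 1, X ~ Normal(3, 0.5)
    a, b = 2.0, 1.0
    X = rng.normal(loc=3.0, scale=0.5, size=100_000)
    print(np.mean(a * X + b), np.std(a * X + b))    # ~7.0 and ~1.0

    # fact 2: X + Y for independent Normals with SDs 3 and 4
    X = rng.normal(loc=1.0, scale=3.0, size=100_000)
    Y = rng.normal(loc=2.0, scale=4.0, size=100_000)
    print(np.std(X + Y), np.sqrt(3.0**2 + 4.0**2))  # both ~5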

$t$ statistics¶

Also thanks to the Central Limit Theorem, if

  • $X_1, \ldots, X_n$ are a bunch of independent samples from some distribution with mean $\mu$,
  • $\bar X$ is the sample mean, and
  • $S$ is the sample standard deviation,

then the difference between the sample mean and $\mu$, in units of the estimated standard error $S/\sqrt{n}$: $$ T = \frac{\bar X - \mu}{S/\sqrt{n}} $$ has, approximately$^*$, Student's t distribution with $n-1$ degrees of freedom.

$^*$ and exactly, if the samples are Normal
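
A quick check by simulation (here with Normal samples, so the $t$ distribution is exact; $n$ and the tail cutoff are arbitrary):

    import numpy as np
    from scipy.stats import t as t_dist

    rng = np.random.default_rng()
    n, mu, sigma = 10, 2.0, 1.0
    # T statistics from 100,000 datasets of n Normal samples
    xs = rng.normal(loc=mu, scale=sigma, size=(100_000, n))
    T = (xs.mean(axis=1) - mu) / (xs.std(axis=1, ddof=1) / np.sqrt(n))
    print(np.mean(T < -2.0), t_dist.cdf(-2.0, df=n - 1))  # both ~0.038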

Concepts¶

Method of moments¶

To fit a distribution to data with the method of moments,

  1. Pick a particular form of the distribution.
  2. Choose parameter values for the distribution so that the "moments" (e.g., the mean) match.
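
For instance, a sketch of a method-of-moments fit of a Gamma, using that its mean is $k\theta$ and its variance is $k\theta^2$:

    import numpy as np

    def gamma_mom(x):
        # match mean = k * theta and variance = k * theta**2
        m, v = np.mean(x), np.var(x)
        theta = v / m
        k = m / theta
        return k, theta

    rng = np.random.default_rng()
    x = rng.gamma(shape=3, scale=2.0, size=10_000)
    print(gamma_mom(x))  # ~(3.0, 2.0)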

Maximum likelihood¶

To fit a model by maximum likelihood:

  1. formulate a generative model that could plausibly have produced the data, with some free parameters describing what we want to learn,
  2. write down the likelihood (i.e., probability) of generating our actual data as a function of the parameter(s), and
  3. choose the parameter values that make the data look most probable.

The $p$-value¶

is

the probability of seeing a result at least as surprising as what we observed in the data, if the null hypothesis is true.

The parts of this are:

  • the probability ... if the null hypothesis is true: we need a concrete model we can compute probabilities with

  • a result: a statistic summarizing how strongly our data suggest that model is not right

  • at least as surprising: usually, the statistic is chosen so that larger values are more surprising
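
For example (a sketch with made-up data: 60 heads in 100 flips, null hypothesis of a fair coin, statistic = number of heads, two-sided):

    from scipy.stats import binom

    # P{a result at least as surprising as 60 heads} under Binomial(100, 0.5):
    # that is, 60 or more heads, or 40 or fewer
    p_value = (1 - binom.cdf(59, n=100, p=0.5)) + binom.cdf(40, n=100, p=0.5)
    print(p_value)  # ~0.057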

Confidence intervals¶

A 95% confidence interval for the mean is $$ \text{from}\quad \bar x - t_* s / \sqrt{n} \quad \text{to} \quad \bar x + t_* s / \sqrt{n}, $$ where $t_*$ is chosen so that $\P\{T < t_*\} = 0.975$ for $T$ with Student's $t$ distribution with $n-1$ degrees of freedom.

Across many such confidence intervals constructed on many datasets of independent samples, the true mean will fall within the confidence interval 95% of the time.
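
In code (a sketch; the data here are simulated Exponentials with true mean 10):

    import numpy as np
    from scipy.stats import t as t_dist

    rng = np.random.default_rng()
    x = rng.exponential(scale=10, size=50)
    n, xbar, s = len(x), np.mean(x), np.std(x, ddof=1)
    t_star = t_dist.ppf(0.975, df=n - 1)   # P{t < t_star} = 0.975
    print(xbar - t_star * s / np.sqrt(n), xbar + t_star * s / np.sqrt(n))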

A simulation problem¶

Let's say we make a random number as follows: shuffle a deck of cards, draw the first card, and add the number on the card to your total (A=1, J=11, Q=12, and K=13). Draw another card: if it is the same suit as the first, add it to your total. Continue until you get a card of a different suit.

  1. Write a function to simulate from this and use it to make a histogram of the distribution.

  2. What is the largest possible value? What is the probability of getting this largest value?

In [30]:
import numpy as np
import matplotlib.pyplot as plt

rng = np.random.default_rng()

def sim_cards():
    # build a 52-card deck as (number, suit) pairs
    deck = [
        (num, suit)
        for num in range(1, 14)
        for suit in np.arange(4)
    ]
    # shuffle the deck
    deck = rng.choice(deck, replace=False, size=52)
    j = 0
    card = deck[j]
    total = card[0]
    # keep drawing while each new card matches the first card's suit
    while j + 1 < 52:
        next_card = deck[j + 1]
        if next_card[1] != card[1]:
            break
        total += next_card[0]
        j += 1
    return total

sim_cards()
Out[30]:
10
In [33]:
values = [sim_cards() for _ in range(10000)]
from dsci345 import pretty

plt.hist(values, bins=pretty(values, 40));
(histogram of the 10,000 simulated totals: most of the mass is below 14, with a long right tail reaching past 50)

The largest possible value is $1 + 2 + \cdots + 13 = 91$, and the chance of getting this value is $$ \frac{12}{51} \times \frac{11}{50} \times \cdots \times \frac{1}{40} \approx 6.3 \times 10^{-12} . $$

A new distribution¶

Suppose we have a coin that comes up heads with probability $p$ (and tails with probability $1-p$). Let $X$ be the number of times we have to flip the coin until the $k$-th heads. Then, $X$ has the negative binomial distribution.

  1. Write a function to simulate from this distribution following this description.

  2. Check your function by simulating at least 10,000 random draws with $k=3$ and $p=0.3$, and making a table comparing the observed and expected proportions of these draws that are $n$ for each $0 \le n \le 20$.

In [ ]:
 
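One possible solution sketch (the simulation follows the description directly; for the check, note that scipy's nbinom counts failures before the $k$-th success, so the total number of flips is that count plus $k$):

    import numpy as np
    from scipy.stats import nbinom

    rng = np.random.default_rng()

    def sim_negbinom(k, p):
        # flip until the k-th heads; return the total number of flips
        flips, heads = 0, 0
        while heads < k:
            flips += 1
            if rng.random() < p:
                heads += 1
        return flips

    k, p = 3, 0.3
    draws = np.array([sim_negbinom(k, p) for _ in range(10_000)])
    for n in range(21):
        observed = np.mean(draws == n)
        expected = nbinom.pmf(n - k, k, p)  # P{total flips = n}
        print(n, observed, expected)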

Tips¶

The amount of money a barista gets in tips each day has a mean of \$52 and an SD of \$15. Over 8 weeks of 5-day work weeks, what are the mean and SD of the total amount of tips they will have received? Assuming the tips each day are independent, estimate the probability that the total exceeds \$2,300.

The mean total is $40 \times \$52 = \$2,080$ and the variance is $40 \times 15^2 = 9000$, so the standard deviation is $\sqrt{9000} \approx \$94.86$.

Since we're adding up many independent things (each day's tips), we can use the Normal approximation:

In [65]:
from scipy.stats import norm
1 - norm.cdf(2300, loc=2080, scale=94.86)
Out[65]:
0.010191900701979173

Fitting an exponential¶

Suppose that we have 20 independent observations:

2.51, 44.16,  6.1 , 42.4,  3.49,  1.62, 25.37, 50.58, 41.11, 15.25,
6.64,  6.54, 14.64,  7.33,  7.11, 61.53, 7.26, 13.34,  1.88, 10.67

Make up a story that could have produced these numbers, and then use maximum likelihood to fit an Exponential distribution to these data.

In [46]:
x = [2.51, 44.16,  6.1 , 42.4,  3.49,  1.62, 25.37, 50.58, 41.11, 15.25,
    6.64,  6.54, 14.64,  7.33,  7.11, 61.53, 7.26, 13.34,  1.88, 10.67]
plt.hist(x)
Out[46]:
(array([10.,  2.,  2.,  1.,  0.,  0.,  2.,  1.,  1.,  1.]),
 array([ 1.62 ,  7.611, 13.602, 19.593, 25.584, 31.575, 37.566, 43.557,
        49.548, 55.539, 61.53 ]),
 <BarContainer object of 10 artists>)
In [56]:
# 1. write a log-likelihood function
from scipy.stats import expon

def log_likelihood(scale):
    return np.sum(expon.logpdf(x, scale=scale))
In [57]:
log_likelihood(3)
Out[57]:
-145.14891244002885
In [59]:
xvals = np.linspace(5, 40, 101)
lvals = [log_likelihood(a) for a in xvals]
plt.plot(xvals, lvals)
plt.xlabel("scale parameter")
plt.ylabel("log-likelihood");
In [61]:
import scipy

def f(scale):
    return -1 * log_likelihood(scale)

scipy.optimize.minimize(
    f,
    10
)
Out[61]:
      fun: 78.32999308675163
 hess_inv: array([[16.95651328]])
      jac: array([-9.53674316e-07])
  message: 'Optimization terminated successfully.'
     nfev: 18
      nit: 8
     njev: 9
   status: 0
  success: True
        x: array([18.47647761])

The maximum likelihood estimate for the scale parameter of the Exponential is about 18.5. (This matches the analytic answer: for the Exponential, the MLE of the scale is the sample mean, here $\bar x \approx 18.48$.)

The beta distribution: introduction¶

In [39]:
rng.beta(a=0.5, b=0.5, size=10)
Out[39]:
array([0.70247288, 0.06706727, 0.98810507, 0.32376168, 0.35145546,
       0.13162128, 0.30439685, 0.36214   , 0.99997619, 0.75311264])
In [41]:
x = rng.beta(a=0.5, b=0.5, size=100000)
plt.hist(x, bins=40);
In [42]:
x = rng.beta(a=5, b=5, size=100000)
plt.hist(x, bins=40);
In [45]:
from scipy.stats import beta
xvals = np.linspace(0, 1, 101)
fx = beta.pdf(xvals, a=5, b=1)  # vectorized over xvals

plt.plot(xvals, fx);
plt.xlabel("value")
plt.ylabel("density of a Beta distribution");
In [38]:
help(rng.beta)
Help on built-in function beta:

beta(...) method of numpy.random._generator.Generator instance
    beta(a, b, size=None)
    
    Draw samples from a Beta distribution.
    
    The Beta distribution is a special case of the Dirichlet distribution,
    and is related to the Gamma distribution.  It has the probability
    distribution function
    
    .. math:: f(x; a,b) = \frac{1}{B(\alpha, \beta)} x^{\alpha - 1}
                                                     (1 - x)^{\beta - 1},
    
    where the normalization, B, is the beta function,
    
    .. math:: B(\alpha, \beta) = \int_0^1 t^{\alpha - 1}
                                 (1 - t)^{\beta - 1} dt.
    
    It is often seen in Bayesian inference and order statistics.
    
    Parameters
    ----------
    a : float or array_like of floats
        Alpha, positive (>0).
    b : float or array_like of floats
        Beta, positive (>0).
    size : int or tuple of ints, optional
        Output shape.  If the given shape is, e.g., ``(m, n, k)``, then
        ``m * n * k`` samples are drawn.  If size is ``None`` (default),
        a single value is returned if ``a`` and ``b`` are both scalars.
        Otherwise, ``np.broadcast(a, b).size`` samples are drawn.
    
    Returns
    -------
    out : ndarray or scalar
        Drawn samples from the parameterized beta distribution.