Example: Maximum Likelihood with the Binomial
We've got a weird-looking coin, and we'd like to figure out the probability that it comes up Heads when it's flipped. How do we do this?
(More generally: from independent draws of a 0/1-valued random variable $Y$ with $\P\{Y = 1\} = p$, infer $p$.)
Let's say out of 20 flips it came up Heads 15 times. What's your best guess at $p$?
Well, since the number of heads, $X$, is $\text{Binomial}(20, p)$, $$
\P\{ X = 15 \}
=
\binom{20}{15} p^{15} (1-p)^5.
$$ Let's call this $L(p)$.
Maximizing $L(p)$ is the same as maximizing $\log L(p)$, and $$ \frac{d}{dp} \log L(p) = \frac{15}{p} - \frac{5}{1-p} , $$ which is equal to 0 at $p = 15/20 = 3/4$.
Okay, so our guess is $p = 0.75$ "by maximum likelihood". How sure are we?
import math
import numpy as np
import matplotlib.pyplot as plt

def L(p):
    # binomial likelihood of seeing 15 heads out of 20 flips
    C = math.factorial(20) / (math.factorial(15) * math.factorial(5))
    return C * p**15 * (1 - p)**5

pvals = np.linspace(0, 1, 51)
plt.plot(pvals, L(pvals))
plt.xlabel("probability of heads (p)")
plt.ylabel("likelihood")
plt.axvline(0.75, c='red');
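As a quick numerical sanity check on the calculus, we can also let scipy find the maximum for us. A minimal sketch, reusing the L defined above:

from scipy.optimize import minimize_scalar

# maximize L(p) by minimizing -L(p) over (0, 1);
# this should land very close to the analytical answer, p = 0.75
res = minimize_scalar(lambda p: -L(p), bounds=(0.001, 0.999), method='bounded')
print(res.x)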
Example: Maximum Likelihood with the Gaussian
I weighed 5 apples off my tree yesterday; their weights were 112g, 145g, 131g, 98g, and 104g. I've got about 200 apples on the tree; what's our estimate of their total weight?
x = [112, 145, 131, 98, 104]
np.mean(x)
118.0
Well, the average weight of those was 118g, so... probably around 200 * 118g = 23600g = 23.6kg?
More formally: let's assume the distribution of the weights (across all the apples) is Normal. If the mean is $\mu$ grams and the standard deviation is $\sigma$ grams, then the chance of getting an apple that weighs $x$ grams is $$ L(x; \mu, \sigma) = \frac{1}{\sqrt{2 \pi \sigma^2}} \exp\left(-\frac{(x - \mu)^2}{2 \sigma^2}\right) . $$ (Okay, this is actually a probability density, but let's go with it.)
So, the chance of getting apples weighing $x_1, \ldots, x_n$ is
$$ \prod_{i=1}^n L(x_i; \mu, \sigma) = \frac{1}{(2 \pi \sigma^2)^{n/2}} \exp\left(- \frac{\sum_{i=1}^n (x_i - \mu)^2}{2 \sigma^2} \right) . $$ So, the log-likelihood is $$ \log L(x; \mu, \sigma) = - \frac{1}{2 \sigma^2}\sum_{i=1}^n (x_i - \mu)^2 - \frac{n}{2} \log(2 \pi \sigma^2) , $$ and $$\begin{aligned} \frac{d}{d\mu} \log L(x; \mu, \sigma) &= \frac{1}{\sigma^2} \sum_{i=1}^n (x_i - \mu) \\ &= \frac{n}{\sigma^2} \left( \bar x - \mu \right) , \end{aligned}$$ which equals 0 at $\mu = \bar x = \frac{1}{n} \sum_{i=1}^n x_i$.
So, $L(x;\mu,\sigma)$ is maximized at $\mu = \bar x$. (But first: check for yourself that this critical point is a maximum, not a minimum.) Remarkably, this doesn't depend on $\sigma$! (We'll verify that numerically below.)
We've learned that:

- Given independent samples from a Normal($\mu$, $\sigma$) distribution, the maximum-likelihood estimate of $\mu$ is the sample mean.
- Maximizing the likelihood under a Normal model is the same as minimizing the sum of squared errors.
- The maximum-likelihood estimate of the mean apple weight on my tree is 118g.
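And, as promised, a quick numerical check that the maximizing $\mu$ doesn't depend on $\sigma$: a sketch using scipy.optimize.minimize_scalar and the log-likelihood formula above (the bounds and the values of sigma are arbitrary choices for illustration).

from scipy.optimize import minimize_scalar

x = np.array([112, 145, 131, 98, 104])

def neg_logL_mu(mu, sigma):
    # negative Gaussian log-likelihood as a function of mu, with sigma held fixed
    return np.sum((x - mu)**2) / (2 * sigma**2) + len(x) * np.log(2 * np.pi * sigma**2) / 2

for sigma in [5, 25, 100]:
    res = minimize_scalar(neg_logL_mu, bounds=(50, 200), method='bounded', args=(sigma,))
    print(f"sigma = {sigma}: best mu = {res.x:.2f}")
    # whatever sigma we fix, this should report the sample mean, 118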
Again: how certain are we? Now, the answer depends on $\sigma$.
muvals = np.linspace(100, 140, 51)
x = np.array([112, 145, 131, 98, 104])

def normal_L(mu, sigma):
    # product of Normal(mu, sigma) densities over the observed weights
    C = np.sqrt(2 * np.pi * sigma**2)
    return np.prod(np.exp(-(x - mu)**2 / (2 * sigma**2)) / C)

sigvals = [5, 25]
fig, axes = plt.subplots(1, len(sigvals))
for sig, ax in zip(sigvals, axes):
    ax.plot(muvals, [normal_L(m, sig) for m in muvals])
    ax.axvline(np.mean(x), c='r')
    ax.set_title(f"sigma={sig}")
Exercise: make the same plots using scipy.stats.norm. First, a check that norm.pdf agrees with our normal_L:
from scipy.stats import norm
mu, sigma = 150, 50
print(normal_L(mu, sigma), np.prod(norm.pdf(x, loc=mu, scale=sigma)))
8.552412635759266e-12 8.552412635759269e-12
muvals = np.linspace(100, 140, 51)
x = np.array([112, 145, 131, 98, 104])
sigvals = [5, 25]
fig, axes = plt.subplots(1, len(sigvals))
for sig, ax in zip(sigvals, axes):
    ax.plot(muvals, [np.prod(norm.pdf(x, loc=m, scale=sig)) for m in muvals])
    ax.axvline(np.mean(x), c='r')
    ax.set_title(f"sigma={sig}")
So, what did we just do? We wrote down the probability of our data as a function of the unknown parameters (the likelihood), and then found the parameter values that made that probability as large as possible.
Formally: given data $D$ and a model $M$ with parameters $\theta \in A$ and likelihood function $$ L_M(D|\theta) = \P_M\{D|\theta\} , $$ a maximum likelihood estimate of $\theta$ is $$ \theta^* = \text{argmax}_{\theta \in A}\{ L_M(D|\theta) \}, $$ i.e., $\theta^*$ is the parameter value that maximizes the likelihood.
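In code, this recipe is always the same, whatever the model: write a function computing the negative log-likelihood and hand it to an optimizer. A minimal generic sketch (the helper name max_likelihood is just for illustration):

from scipy.optimize import minimize

def max_likelihood(neg_logL, theta0):
    # generic recipe: a maximum-likelihood estimate is a minimizer
    # of the negative log-likelihood, found starting from guess theta0
    res = minimize(neg_logL, x0=theta0)
    return res.x

# e.g., the rainfall example below amounts to:
#   max_likelihood(lambda params: -logL(*params), (24, 1.8))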
Let's say we have hourly rainfall measurements throughout a winter storm. We'd like to (a) estimate the average rainfall for the storm (across a wider region, taking our location as representative), and (b) fit a distribution to describe the hourly variation.
Let $X_i$ be the number of millimeters of rain that fell in the $i^\text{th}$ hour. Since $X_i \ge 0$, let's take $$ X_i \sim \text{Gamma}(\text{scale}=\theta, \text{shape}=k) . $$ Our goal will be to find a $\theta$ and $k$ that describe the data well; since a Gamma distribution with shape $k$ and scale $\theta$ has mean $k\theta$, this will also give us an estimate of the average rainfall. And, here's our data:
rain
array([ 17., 99., 79., 24., 32., 45., 93., 83., 113., 32., 3., 114., 71., 98., 56., 31., 95., 31., 76., 83., 70., 107., 23., 40., 168., 43., 43., 28., 20., 49., 26., 32., 10., 58., 52., 35., 81., 124., 28., 46., 25., 120., 24., 17., 57., 96., 59., 100., 33., 74., 27., 33., 33., 35., 76., 104., 31., 24., 33., 24., 73., 34., 50., 53., 50., 33., 106., 125., 44., 94., 35., 54.])
We could look up the likelihood function for the Gamma distribution and try to solve for its maximum analytically. But we're only optimizing over two parameters, so it's easy to do numerically:
from scipy.stats import gamma

def logL(theta, k):
    lpdfs = gamma.logpdf(rain, a=k, scale=theta)  # "a" is the shape parameter here
    return np.sum(lpdfs)
from scipy.optimize import minimize

# maximize logL by minimizing its negative, starting from a rough initial guess
max_L = minimize(lambda params: -logL(*params), x0=(24, 1.8))
mle_theta, mle_k = max_L['x']
max_L
      fun: 348.1884538503342
 hess_inv: array([[14.27925121, -1.48033603],
       [-1.48033603,  0.18579412]])
      jac: array([0.00000000e+00, 7.62939453e-06])
  message: 'Optimization terminated successfully.'
     nfev: 33
      nit: 9
     njev: 11
   status: 0
  success: True
        x: array([21.17999438,  2.71089168])
thetavals = np.round(np.linspace(10, 40, 20), 1)
kvals = np.round(np.linspace(0.5, 3, 10), 2)
Lmap = np.array(
    [[logL(theta, k) for theta in thetavals] for k in kvals]
)
fig, ax = plt.subplots()
im = ax.imshow(Lmap)
cbar = ax.figure.colorbar(im, ax=ax)
ax.set_xlabel("scale (theta)"); ax.set_ylabel("shape (k)")
ax.set_xticks(np.arange(len(thetavals)), labels=thetavals)
ax.set_yticks(np.arange(len(kvals)), labels=kvals)
ax.set_title(f"maximum at theta = {mle_theta:.2f}, k = {mle_k:.2f}");
Comparison: the method-of-moments estimator instead matches the Gamma's theoretical mean ($k\theta$) and variance ($k\theta^2$) to the observed mean and variance. For this data:
obs_mean = np.mean(rain)
obs_sd = np.std(rain)
theta = obs_sd**2 / obs_mean   # solve mean = k * theta, variance = k * theta^2
k = obs_mean / theta
print(f"MOM estimates: theta = {theta:.2f}, k = {k:.2f}.")
print(f"MLE estimates: theta = {max_L['x'][0]:.2f}, k = {max_L['x'][1]:.2f}.")
MOM estimates: theta = 20.25, k = 2.84.
MLE estimates: theta = 21.18, k = 2.71.
What about our question? Well,
print(f"The observed mean rainfall/hour is {obs_mean:.3f} mm and the MLE-predicted mean is {(mle_theta * mle_k):.3f} mm.")
The observed mean rainfall/hour is 57.417 mm and the MLE-predicted mean is 57.417 mm.
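That the observed and MLE-predicted means agree exactly is not a coincidence: setting the $\theta$-derivative of the Gamma log-likelihood to zero forces the fitted mean, $k\theta$, to equal the sample mean: $$ \frac{\partial}{\partial \theta} \log L = \frac{\sum_{i=1}^n x_i}{\theta^2} - \frac{nk}{\theta} = 0 \qquad \Longrightarrow \qquad k\theta = \frac{1}{n} \sum_{i=1}^n x_i = \bar x . $$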
This gives a good answer. But again: how sure are we? Next, one way of approaching this question: $p$-values.