When it's not straight lines, part 1¶
We've spent a fair bit of time on fitting linear relationships. What about when they aren't linear? For instance, what if the data look like this?
import numpy as np
import matplotlib.pyplot as plt
rng = np.random.default_rng()

t = np.linspace(0, 20, 101)
y = 2 + np.cos(t) + rng.normal(scale=0.2, size=101)
plt.scatter(t, y); plt.xlabel("t"); plt.ylabel("y");
Solution: the data are of this form: $$ y_i = a + b \cos(t_i) + \epsilon_i $$ ... which is linear, in $\cos(t)$!
Solution: transform the predictor to get back a linear model.
In class: fit this.
# least-squares slope and intercept of y against cos(t)
r = np.corrcoef(np.cos(t), y)[0, 1]
b = r * np.std(y, ddof=1) / np.std(np.cos(t), ddof=1)
a = np.mean(y) - b * np.mean(np.cos(t))
tt = np.linspace(0, 20, 201)  # fine grid for predictions
yhat = a + b * np.cos(tt)
fig, ax = plt.subplots()
ax.scatter(np.cos(t), y, label='data')
ax.scatter(np.cos(tt), yhat, label='prediction')
ax.legend();
fig, ax = plt.subplots()
ax.scatter(t, y)
ax.scatter(tt, yhat)
ax.set_xlabel("t"); ax.set_ylabel("y");
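Equivalently, np.polyfit on the transformed predictor should give the same line; here's a quick check (using the t, y, a, and b from above):
# degree-1 polynomial fit of y against cos(t); polyfit returns (slope, intercept)
b_check, a_check = np.polyfit(np.cos(t), y, 1)
print(a_check, b_check)  # should match a and b computed above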
Example: sines and cosines¶
Suppose we have measured the intensities of radio waves received from a nearby star. The measured intensity at time $t_i$ is $y_i$, for $1 \le i \le n$. We would like to fit a periodic form to the data, like: $$ y(t) = \sum_{j=0}^{k} \alpha_j \cos(\pi t / 2^j) + \beta_j \sin(\pi t / 2^j) + \epsilon , $$ where $\epsilon$ is mean-zero noise. How can we do this?
We can in fact transform this into a problem of fitting a linear model: let $y = (y_1, \ldots, y_n)$ and define the matrix $X$ to be $$ X = \begin{bmatrix} \cos(\pi t_1) & \sin(\pi t_1) & \cos(\pi t_1 / 2) & \sin(\pi t_1 / 2) & \cdots & \cos(\pi t_1 / 2^k) & \sin(\pi t_1 / 2^k) \\ \cos(\pi t_2) & \sin(\pi t_2) & \cos(\pi t_2 / 2) & \sin(\pi t_2 / 2) & \cdots & \cos(\pi t_2 / 2^k) & \sin(\pi t_2 / 2^k) \\ \vdots & \vdots & & & & \vdots & \vdots \\ \cos(\pi t_n) & \sin(\pi t_n) & \cos(\pi t_n / 2) & \sin(\pi t_n / 2) & \cdots & \cos(\pi t_n / 2^k) & \sin(\pi t_n / 2^k) \end{bmatrix}. $$ Now, if we define $a = (\alpha_0, \beta_0, \alpha_1, \beta_1, \ldots, \alpha_k, \beta_k)$, then our model is $$ y = X a + \epsilon , $$ so we can solve the problem using the tools we've learned.
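Concretely, the least-squares estimate minimizes $\|y - Xa\|^2$, and (as long as $X$ has full column rank) it solves the normal equations: $$ X^\top X \hat a = X^\top y , \qquad \text{i.e.,} \qquad \hat a = (X^\top X)^{-1} X^\top y . $$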
Let's try it out! First, we'll simulate some data:
n = 150
# (alpha_j, beta_j) for j = 0, 1, 2, 3; all other frequencies have zero coefficients
true_coefs = [(1, 0), (3.2, 2.5), (0, 0), (10, 0)]
tvec = np.sort(rng.uniform(low=0, high=15, size=n))
mean_yvec = np.zeros(n)
for j, (alpha, beta) in enumerate(true_coefs):
    mean_yvec += alpha * np.cos(np.pi * tvec / 2**j) + beta * np.sin(np.pi * tvec / 2**j)
yvec = mean_yvec + rng.normal(scale=2.0, size=n)
fig, ax = plt.subplots()
ax.scatter(tvec, yvec, label="data (y)")
ax.plot(tvec, mean_yvec, label="true signal")
ax.legend();
Now, we fit the model by least squares:
k = 5
# Columns come in (cos, sin) pairs for each frequency j = 0, ..., k,
# matching the matrix X and the coefficient ordering above.
X = np.array([
    [trig(np.pi * t / 2**j) for j in range(k + 1) for trig in (np.cos, np.sin)]
    for t in tvec
])
# solve the normal equations (X^T X) a = X^T y
a_hat = np.linalg.solve(X.T @ X, X.T @ yvec)
y_hat = X @ a_hat
fig, ax = plt.subplots()
ax.scatter(tvec, yvec, label="data (y)")
ax.plot(tvec, mean_yvec, label="true signal")
ax.plot(tvec, y_hat, label="estimated signal")
ax.legend();
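As a sanity check (a sketch, relying on the (cos, sin) column ordering used to build X), we can line up $\hat a$ against the true coefficients, padded with zeros at the frequencies that weren't in the simulated signal:
# true coefficients in the same (alpha_0, beta_0, alpha_1, beta_1, ...) order as a_hat
true_a = np.zeros(2 * (k + 1))
for j, (alpha, beta) in enumerate(true_coefs):
    true_a[2 * j] = alpha
    true_a[2 * j + 1] = beta
print(np.column_stack([true_a, a_hat]).round(2))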
When it's not straight lines, part 2¶
Okay, what if the data look like this?
x = np.linspace(0, 2, 101)
y = np.exp(2 + x + rng.normal(scale=0.1, size=101))
plt.scatter(x, y); plt.xlabel("x"); plt.ylabel("y");
Here the model is $$ y_i = \exp(a + b x_i + \epsilon_i) , $$ and so $$ \log(y_i) = a + b x_i + \epsilon_i . $$
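So we can fit a straight line to $(x, \log(y))$. Here's a minimal sketch with np.polyfit (using the simulated x and y just above):
# fit log(y) = a + b x by least squares; polyfit returns (slope, intercept)
b_hat, a_hat = np.polyfit(x, np.log(y), 1)
plt.scatter(x, y, label='data')
plt.plot(x, np.exp(a_hat + b_hat * x), color='C1', label='fit')
plt.legend();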
Exercise:¶
Suppose the output of viruses $x$ hours after infection is $$ y = \exp(a + bx + \epsilon), $$ where $\epsilon \sim \text{Normal}(0, \sigma)$. Estimate $a$, $b$, and $\sigma$ using the following data:
x = np.array([28., 67., 7., 47., 15., 65., 29., 21., 49., 41., 56., 1., 32.,
25., 49., 27., 40., 54., 22., 9.])
y = np.array([ 32., 119., 9., 90., 18., 107., 23., 14., 56., 40., 85.,
8., 42., 19., 48., 30., 38., 110., 27., 8.])
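One possible approach (a sketch, not the only way): fit on the log scale as above, then estimate $\sigma$ from the residual standard deviation.
# fit log(y) = a + b x, then estimate sigma from the log-scale residuals
b_hat, a_hat = np.polyfit(x, np.log(y), 1)
log_resids = np.log(y) - (a_hat + b_hat * x)
sigma_hat = np.std(log_resids, ddof=2)  # ddof=2: we estimated two parameters
print(a_hat, b_hat, sigma_hat)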
Nonlinear, for reals¶
Now suppose the output of viruses $x$ hours after infection is $$ y = e^{a + bx} + \epsilon , $$ where $\epsilon \sim \text{Normal}(0, \sigma)$.
Can we solve this with a standard linear model?
No: the noise is now added outside the exponential, so $\log(y_i)$ is no longer a linear function of $x_i$ plus mean-zero noise.
Solution: straightforward minimization, with scipy.optimize, for instance.
from scipy.optimize import least_squares

def resids(u):
    # residuals y - f(x; u), with parameters u = (a, b)
    return y - np.exp(u[0] + u[1] * x)

ls_fit = least_squares(
    resids,
    x0=(1, 1),  # initial guess for (a, b)
)
ls_fit
     message: `ftol` termination condition is satisfied.
     success: True
      status: 2
         fun: [ 2.462e+00 -6.009e+00 ...  3.341e+00 -6.627e+00]
           x: [ 2.350e+00  3.699e-02]
        cost: 1457.0070960833966
         jac: [[-2.954e+01 -8.271e+02]
               [-1.250e+02 -8.376e+03]
               ...
               [-2.366e+01 -5.205e+02]
               [-1.463e+01 -1.316e+02]]
        grad: [-1.209e-05  4.690e-01]
  optimality: 0.4689870746078668
 active_mask: [ 0.000e+00  0.000e+00]
        nfev: 76
        njev: 73
est_a, est_b = ls_fit.x
y_hat = np.exp(est_a + est_b * x)
plt.scatter(x, y, label='data')
plt.scatter(x, y_hat, label='predicted')
xx = np.linspace(0, 70, 101)
plt.plot(xx, np.exp(est_a + est_b * xx), label='fit')
plt.legend();
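We can also back out an estimate of $\sigma$: least_squares reports cost equal to half the sum of squared residuals, so (a sketch, dividing by $n - 2$ for the two fitted parameters):
rss = 2 * ls_fit.cost                    # cost = 0.5 * sum of squared residuals
sigma_hat = np.sqrt(rss / (len(x) - 2))  # residual degrees of freedom: n - 2
print(sigma_hat)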