AERSP 597 - Machine Learning in Aerospace Engineering¶

Lecture 4, Linear Regression: Formulation by optimization¶

Instructor: Daning Huang¶

TODAY: Linear Regression - I¶

  • Least squares
  • Accuracy assessment

References:¶

  • [PRML] Chp. 3.1

Supervised Learning¶

  • Goal
    • Given data $X$ in feature space and the labels $Y$
    • Learn to predict $Y$ from $X$
  • Labels could be discrete or continuous
    • Continuous-valued labels: Regression
    • Discrete-valued labels: Classification (not our focus in this lecture)

No Free Lunch Theorem¶

Wolpert and Macready (1997)

We have dubbed the associated results NFL theorems because they demonstrate that if an algorithm performs well on a certain class of problems then it necessarily pays for that with degraded performance on the set of all remaining problems.

Classical ML vs. Deep Learning¶

Notation¶

In this lecture, we will use

  • Data $x \in R^D$ (scalar- or vector-valued)
  • Features $\phi(x) \in R^M$ for data $x$
  • Continuous-valued labels $t \in R$ (target values)

We will interchangeably use

  • $x^{(n)}, x_n$ to denote the $n^\text{th}$ training example.
  • $t^{(n)}, t_n$ to denote the $n^\text{th}$ target value.

Linear Regression (1d inputs)¶

  • Consider the 1d case (i.e., $D=1$)
    • Given a set of observations $x_1, \dots, x_N$
    • and corresponding target values $t_1, \dots, t_N$
  • We want to learn a function $y(x, \vec{w}) \approx t$ to predict future values.
$$ y(x, \vec{w}) = w_0 + w_1 x + w_2 x^2 + \dots + w_M x^M = \sum_{k=0}^M w_k x^k $$

Regression: Noisy Data¶

In [3]:
# Truth, without noise
xx, yy = generateData(100, False)

# Noisy observation, training samples
x, y = generateData(13, True)

# plot data
plt.plot(xx, yy, 'g--')
plt.plot(x, y, 'ro')

Regression: 0th Order Polynomial¶

In [4]:
# Here we are going to take advantage of numpy's 'polyfit' function
# This implements a "polynomial fitting" algorithm
# coeffs are the optimal coefficients of the polynomial
coeffs = np.polyfit(x, y, 0)  # 0 is the degree of the poly

# We construct poly(), the polynomial with "learned" coefficients
poly = np.poly1d(coeffs)

plt.plot(xx, yy, "g--")
plt.plot(x, y, "ro")
plt.plot(xx, poly(xx), "b-")

Regression: 1st Order Polynomial¶

In [5]:
coeffs = np.polyfit(x, y, 1) # Now let's try degree = 1
poly = np.poly1d(coeffs)
plt.plot(xx, yy, "g--")
plt.plot(x, y, "ro")
plt.plot(xx, poly(xx), "b-")

Regression: 3rd Order Polynomial¶

In [6]:
coeffs = np.polyfit(x, y, 3) # Now degree = 3
poly = np.poly1d(coeffs)

plt.plot(xx, yy, "g--")
plt.plot(x, y, "ro")
plt.plot(xx, poly(xx), "b-")

Linear Regression (General Case)¶

The function $y(\vec{x}, \vec{w})$ is linear in parameters $\vec{w}$.

  • Goal: Find the best value for the weights, $\vec{w}$.
  • For simplicity, absorb the bias $w_0$ into the sum by defining a constant basis function $\phi_0(\vec{x}) = 1$.
$$ y(\vec{x}, \vec{w}) = w_0 + \sum_{j=1}^{M-1} w_j \phi_j(\vec{x}) = \sum_{j=0}^{M-1} w_j \phi_j(\vec{x}) = \vec{w}^T \phi(\vec{x}) $$
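As a concrete illustration, here is a minimal sketch of this model (the list `basis`, the helper `predict`, and the weights `w_demo` below are made up for illustration; they are not part of the lecture code):

In [ ]:
import numpy as np

# Hypothetical basis: phi_0(x) = 1 (bias), phi_1(x) = x, phi_2(x) = x**2
basis = [lambda x: np.ones_like(x), lambda x: x, lambda x: x**2]

def predict(x, w, basis):
    """Evaluate y(x, w) = w^T phi(x) for an array of 1d inputs x."""
    Phi = np.column_stack([phi(x) for phi in basis])  # N x M feature matrix
    return Phi @ w

x_demo = np.linspace(-1, 1, 5)
w_demo = np.array([0.5, -1.0, 2.0])   # arbitrary weights, for illustration only
print(predict(x_demo, w_demo, basis))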

Basis Functions¶

The basis functions $\phi_j(\vec{x})$ need not be linear.

In [8]:
r = np.linspace(-1,1,100)
f, axs = plt.subplots(1, 3, figsize=(12,4))
for j in range(8):
    axs[0].plot(r, np.power(r, j))                                 # polynomial basis: r^j
    axs[1].plot(r, np.exp(-(r - j/7.0 + 0.5)**2 / (2 * 0.2**2)))   # Gaussian basis, width 0.2
    axs[2].plot(r, 1 / (1 + np.exp(-(r - j/5.0 + 0.5) * 5)))       # sigmoidal (logistic) basis

set_nice_plot_labels(axs) # I'm hiding some helper code that adds labels

Least Squares: Objective Function¶

Minimize the residual error over the training data.

$$ E(\vec{w}) = \frac12 \sum_{n=1}^N (y(x_n, \vec{w}) - t_n)^2 = \frac12 \sum_{n=1}^N \left( \sum_{j=0}^{M-1} w_j\phi_j(\vec{x}^{(n)}) - t^{(n)} \right)^2 $$
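In code this objective is essentially a one-liner. Here is a minimal sketch (the helper `sse` is hypothetical, not part of the lecture code), written in terms of the design matrix $\Phi$ defined on the next slide and a target vector $\vec{t}$:

In [ ]:
import numpy as np

def sse(w, Phi, t):
    """Sum-of-squares error E(w) = 1/2 * ||Phi w - t||^2."""
    r = Phi @ w - t           # residual vector
    return 0.5 * (r @ r)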

Closed Form Solution: Derivation¶

$$ \begin{align} \mbox{Scalar Form: } E(\vec{w}) &= \frac12 \sum_{n=1}^N \left( \sum_{j=0}^{M-1} w_j \phi_j(\vec{x}^{(n)}) - t^{(n)} \right)^2 \\ &= \frac12 \sum_{n=1}^N \left( \vec{w}^T \phi(\vec{x}^{(n)}) - t^{(n)} \right)^2 \\ &= \frac12 \sum_{n=1}^N (\vec{w}^T \phi( \vec{x}^{(n)} ) )^2 - \sum_{n=1}^N t^{(n)} \vec{w}^T \phi( \vec{x}^{(n)} ) + \frac12 \sum_{n=1}^N (t^{(n)})^2 \\ \mbox{Vector Form: } E(\vec{w}) &= \frac12 \|\Phi \vec{w} - \vec{t}\|^2 \\ &= \frac12 \vec{w}^T \Phi^T \Phi \vec{w} - \vec{w}^T \Phi^T \vec{t} + \frac12 \vec{t}^T \vec{t} \end{align}$$
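A quick numerical sanity check that the scalar and vector forms agree (toy data, generated only for this check; none of these names appear in the lecture code):

In [ ]:
import numpy as np

rng = np.random.default_rng(0)
Phi_toy = rng.normal(size=(10, 4))    # toy design matrix, N=10, M=4
t_toy = rng.normal(size=10)
w_toy = rng.normal(size=4)

E_scalar = 0.5 * sum((w_toy @ Phi_toy[n] - t_toy[n])**2 for n in range(10))
E_vector = 0.5 * np.linalg.norm(Phi_toy @ w_toy - t_toy)**2
print(np.isclose(E_scalar, E_vector))  # True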

Closed Form Solution: Data Matrix¶

The design matrix $\Phi \in R^{N \times M}$ is built by applying

  • the $M$ basis functions (columns)
  • to $N$ data points (rows)
$$ \Phi = \begin{bmatrix} \phi_0(\vec{x}_1) & \phi_1(\vec{x}_1) & \cdots & \phi_{M-1}(\vec{x}_1) \\ \phi_0(\vec{x}_2) & \phi_1(\vec{x}_2) & \cdots & \phi_{M-1}(\vec{x}_2) \\ \vdots & \vdots & \ddots & \vdots \\ \phi_0(\vec{x}_N) & \phi_1(\vec{x}_N) & \cdots & \phi_{M-1}(\vec{x}_N) \\ \end{bmatrix} $$

Goal: $\Phi \vec{w} \approx \vec{t}$
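For example, with the polynomial basis $\phi_j(x) = x^j$ this matrix can be built directly. A sketch (the helpers `design_matrix` and `poly_basis` are just for illustration), reusing the 1d training inputs `x` from the earlier cells:

In [ ]:
import numpy as np

def design_matrix(x, basis):
    """Apply the M basis functions (columns) to the N data points (rows)."""
    return np.column_stack([phi(x) for phi in basis])

# Polynomial basis of order 3: phi_j(x) = x^j, j = 0,...,3 (phi_0 is the bias)
poly_basis = [lambda x, j=j: x**j for j in range(4)]
Phi = design_matrix(np.asarray(x), poly_basis)    # shape (N, 4)

# Equivalently for this basis: Phi = np.vander(x, 4, increasing=True)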

Least Squares: Gradient via Matrix Calculus¶

  • Compute the gradient and set to zero
\begin{align} \nabla_w E(w) &= \nabla_w \left[ \frac12 w^T \Phi^T \Phi w - w^T \Phi^T t + \frac12 t^T t \right] \\ &= \Phi^T \Phi w - \Phi^T t = 0 \end{align}
  • Solve the resulting normal equation: $$ \Phi^T \Phi w = \Phi^T t \\ w = (\Phi^T \Phi)^{-1} \Phi^T t $$

This is the Moore-Penrose pseudoinverse, $\Phi^\dagger = (\Phi^T \Phi)^{-1} \Phi^T$ applied to solve the linear system $\Phi w \approx t$.
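As a sanity check (a sketch, reusing `Phi` from the previous sketch and the training targets `y` as $\vec{t}$), the same weights come out of several equivalent routes; in practice `np.linalg.lstsq` is preferred over forming $(\Phi^T\Phi)^{-1}$ explicitly:

In [ ]:
t = np.asarray(y)

# 1. Normal equations (fine for small, well-conditioned problems)
w_normal = np.linalg.solve(Phi.T @ Phi, Phi.T @ t)

# 2. Moore-Penrose pseudoinverse
w_pinv = np.linalg.pinv(Phi) @ t

# 3. Least-squares solver (numerically preferred)
w_lstsq, *_ = np.linalg.lstsq(Phi, t, rcond=None)

print(np.allclose(w_normal, w_lstsq), np.allclose(w_pinv, w_lstsq))

These should also match `np.polyfit(x, y, 3)` up to the ordering of the coefficients (`polyfit` returns the highest degree first).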

Digression: Moore-Penrose Pseudoinverse¶

  • When a matrix $A$ is non-invertible, or not even square, we may still want something that behaves like an inverse
  • For these situations we use $A^\dagger$, the Moore-Penrose Pseudoinverse of $A$
  • When $A$ has lin. indep. columns then $A^\dagger = (A^\top A)^{-1} A^\top$
  • In general, we can get $A^\dagger$ by SVD: if we write $A = U \Sigma V^\top$ then $A^\dagger = V \Sigma^\dagger U^\top$, where $\Sigma^\dagger$ is obtained by taking reciprocals of non-zero entries of $\Sigma$.
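A minimal sketch of the SVD route, checked against `np.linalg.pinv` (the matrix `A` below is made up purely for illustration):

In [ ]:
import numpy as np

A = np.array([[1., 2.],
              [2., 4.],
              [0., 1.]])               # 3 x 2: not square, so no ordinary inverse
U, s, Vt = np.linalg.svd(A, full_matrices=False)

# Reciprocate only the non-negligible singular values
s_inv = np.where(s > 1e-12 * s.max(), 1.0 / s, 0.0)
A_dagger = Vt.T @ np.diag(s_inv) @ U.T

print(np.allclose(A_dagger, np.linalg.pinv(A)))   # True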

Alternative View: Projection onto subspace¶

  • The columns of $\Phi$ span a subspace, and solving $\Phi \vec{w} \approx \vec{t}$ amounts to projecting $\vec{t}$ onto that subspace (the column space of $\Phi$)
  • The SVD $\Phi=U\Sigma V^T$ provides an orthonormal basis $U$ for this subspace and a transformation matrix $T=\Sigma V^T$
  • Recall from the linear algebra review: let $\vec{y}=T\vec{w}$; then we need $U\vec{y}\approx\vec{t}$, and since $U$ has orthonormal columns the best choice is $\vec{y}=U^T\vec{t}$
  • Then $\vec{w}=T^{-1}\vec{y}=V\Sigma^\dagger U^T\vec{t}=\Phi^\dagger\vec{t}$
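A quick numerical check of this picture (a sketch, reusing `Phi`, `t`, and `w_lstsq` from the sketches above): $\Phi\Phi^\dagger$ is the orthogonal projector onto the column space of $\Phi$, and the fitted values $\Phi\vec{w}$ are exactly the projection of $\vec{t}$.

In [ ]:
P = Phi @ np.linalg.pinv(Phi)             # projector onto the column space of Phi

print(np.allclose(P @ P, P))              # idempotent: P^2 = P
print(np.allclose(P, P.T))                # symmetric: an orthogonal projection
print(np.allclose(P @ t, Phi @ w_lstsq))  # projecting t gives the least-squares fit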

Accuracy Assessment¶

Back to the polynomial example¶

In [10]:
stys = ['k-', 'k-.', 'm-', 'm-.']
plt.plot(xx, yy, "g--")
plt.plot(x, y, "ro", label="Training data")
for _i in range(4):
    plt.plot(xx, tsts[_i], stys[_i], label='Order {0}'.format(_i))
plt.legend()

Root-Mean-Square Error (RMSE)¶

$$ E_{RMS} = \sqrt{2E(w^*) / N} = \sqrt{\frac{1}{N}\sum_{i=1}^N[f(x_i)-t_i]^2} $$
  • Easy to compute
  • Potential issue: it carries the scale and units of the targets, so its magnitude is hard to compare across datasets or differently scaled targets
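A minimal sketch of the computation (`rmse` and `pred` are illustrative names, not from the lecture code; `pred` stands for the model's predictions at the training inputs):

In [ ]:
import numpy as np

def rmse(pred, t):
    """Root-mean-square error between predictions pred and targets t."""
    pred, t = np.asarray(pred), np.asarray(t)
    return np.sqrt(np.mean((pred - t)**2))

# e.g. rmse(poly(x), y) for the order-3 fit above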
In [11]:
f, ax = plt.subplots(ncols=4, sharey=True, figsize=(16,4))
for _i in range(4):
    ax[_i].plot(xx, yy, "g--")
    ax[_i].plot(x, y, "ro")
    ax[_i].plot(xx, tsts[_i])
    ax[_i].set_title('Order {0}, RMSE={1:4.3f}'.format(_i, es[_i]))

Coefficient of determination¶

$$ R^2 = 1 - \frac{SS_{res}}{SS_{tot}} $$
  • Let $\bar{t}$ be average of $\{t_i\}$
  • Residual sum of squares: $$SS_{res}=\sum_i[f(x_i)-t_i]^2$$
  • Total sum of squares: $$SS_{tot}=\sum_i[t_i-\bar{t}]^2$$
  • Explained sum of squares: $$SS_{reg}=\sum_i[f(x_i)-\bar{t}]^2$$
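A minimal sketch of the computation, following the definitions above (`r_squared` and `pred` are illustrative names, not from the lecture code):

In [ ]:
import numpy as np

def r_squared(pred, t):
    """Coefficient of determination R^2 = 1 - SS_res / SS_tot."""
    pred, t = np.asarray(pred), np.asarray(t)
    ss_res = np.sum((pred - t)**2)        # residual sum of squares
    ss_tot = np.sum((t - t.mean())**2)    # total sum of squares
    return 1.0 - ss_res / ss_tot

# e.g. r_squared(poly(x), y) for the order-3 fit above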
In [12]:
f, ax = plt.subplots(ncols=4, sharey=True, figsize=(16,4))
for _i in range(4):
    ax[_i].plot(y, y, "r-")
    ax[_i].plot(y, trns[_i], "bo")
    ax[_i].set_title('Order {0}, R2={1:4.3f}'.format(_i, rs[_i]))

Geometrical interpretation of R2¶

  • Blue: Squared residuals w.r.t. the linear regression.
  • Red: Squared residuals w.r.t. the average value.
$$ R^2 = 1 - \frac{\color{blue}{SS_{res}}}{\color{red}{SS_{tot}}} $$
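A useful fact: when the model contains a bias term and is fit by least squares (as here), the total variation decomposes exactly on the training data,
$$ SS_{tot} = SS_{res} + SS_{reg} \quad\Rightarrow\quad R^2 = \frac{SS_{reg}}{SS_{tot}} \in [0, 1], $$
so $R^2$ can be read as the fraction of the targets' variance explained by the fit.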
