(Binary) Supervised Learning¶

Supervised Learning Setup¶

Learn how to generalize a function from examples: given a novel input, we want the trained system to produce the correct output reliably.

  1. Gather labeled data $D = \{X, Y\}$, where $X$ is the set of data points and $Y$ their labels.

  2. We need a space of functions $\mathcal{F}$ from which we can choose a function to fit the data.

  3. Devise a way of scoring a particular function choice $f$ for how well it fits the data. We use a loss function $\ell$ (an objective function) to do this; the loss is minimized when our chosen function best fits the data.

$f^* = \text{argmin}_{f \in \mathcal{F}} \ell(f, \{X, Y\})$¶

Example: Separating Points on a Number Line¶

In [1]:
import numpy as np
import matplotlib.pyplot as plt

# Create a synthetic dataset of a bunch of numbers labeled 0
# interspersed with another bunch of numbers labeled 1

N = 50
np.random.seed(0)
# x holds the data points, labels their 0/1 class labels
x = np.random.randn(N) - 1
labels = np.zeros(N)
x = np.concatenate((x, np.random.randn(N)+2))
labels = np.concatenate((labels, np.ones(N)))

plt.figure(figsize=(12, 3))
plt.scatter(x, np.zeros(x.size), c=labels)
plt.colorbar()
plt.gca().set_yticks([]);

Function space¶

$f_{c}(x) = \begin{cases} 1 & x > c \\ 0 & x \leq c \end{cases}$¶

In [2]:
def fc(c, x):
    return np.array(x > c, dtype=float)

pts = np.linspace(-4, 4, 200)
c = -1
y = fc(c=c, x=pts)


plt.figure(figsize=(12, 3))
plt.scatter(x, np.zeros(x.size), c=labels)
plt.colorbar()
plt.plot(pts, y)
plt.title("Example: c = {}".format(c))
Out[2]:
Text(0.5, 1.0, 'Example: c = -1')

Loss function¶

$\ell(f_c, D) = \sum_{(x, y) \in D} (y - f_c(x))^2 $¶

In [3]:
def loss_squared(X, Y, f):
    return np.sum((Y - f(X))**2)

cs = np.linspace(-3, 3, 1000)
losses = np.zeros_like(cs)
for i in range(len(cs)):
    c = cs[i]
    f = lambda x: fc(c=c, x=x)
    losses[i] = loss_squared(x, labels, f)

Let's numerically try a bunch of different candidate functions $f_c$ and see which one minimizes the loss function.

In [4]:
plt.figure(figsize=(12, 3))
plt.scatter(x, np.zeros(x.size), c=labels)
plt.colorbar()
plt.plot(cs, losses)
plt.legend(["Data Points", "Loss Function"])
Out[4]:
<matplotlib.legend.Legend at 0x7f8ec9b78d00>

It looks like a choice of $c \approx 0.75$ is about the best we can do.
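Rather than eyeballing the loss curve, we can read the minimizer off directly with `np.argmin`. The sketch below repeats the dataset and function definitions from the cells above so it runs standalone; since the two classes are unit-variance Gaussians centered at $-1$ and $2$, we would expect the best threshold to land somewhere near their midpoint of $0.5$.

```python
import numpy as np

# Recreate the dataset from above (seed 0, 50 points per class)
np.random.seed(0)
N = 50
x = np.concatenate((np.random.randn(N) - 1, np.random.randn(N) + 2))
labels = np.concatenate((np.zeros(N), np.ones(N)))

def fc(c, x):
    # Step function: 1 to the right of the threshold c, 0 otherwise
    return np.array(x > c, dtype=float)

def loss_squared(X, Y, f):
    # Sum of squared errors; for 0/1 labels and a 0/1 classifier
    # this equals the number of misclassified points
    return np.sum((Y - f(X))**2)

# Scan candidate thresholds and pick the one with the smallest loss
cs = np.linspace(-3, 3, 1000)
losses = np.array([loss_squared(x, labels, lambda pts: fc(c, pts)) for c in cs])
best_c = cs[np.argmin(losses)]
print("best c = {:.3f}, misclassified points = {:d}".format(best_c, int(losses.min())))
```

Note that when the two classes overlap, a whole interval of thresholds can achieve the same minimal loss; `np.argmin` simply returns the first such index, so the exact value reported depends on the grid.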
