Skip to content

Instantly share code, notes, and snippets.

Last active August 25, 2020 01:47
Show Gist options
  • Save kingjr/7cf9973676fe3e0bda30 to your computer and use it in GitHub Desktop.
Save kingjr/7cf9973676fe3e0bda30 to your computer and use it in GitHub Desktop.
Illustrate how SVM and Logistic Regression are very similar except that SVM strictly relies on a subset of the data.
# Author: Jean-Remi King <>
"""
Illustrate how the hinge loss and the log loss functions,
typically used in SVM and Logistic Regression respectively,
focus on a variable number of samples.

For simplification purposes, we won't consider the
regularization or penalty (C) factors.
"""
import numpy as np
import matplotlib.animation as animation
import matplotlib.pyplot as plt
# Setup data
# We'll try to fit the linear model y = w*X
n_sample, n_dim = 40, 2
X = np.random.randn(n_sample, n_dim)
coefs = np.random.randn(n_dim)  # set informative feature
# Label every sample with the sign of its projection on ``coefs``. This is
# done on the clean data, before the noise below is added, so the two classes
# are not perfectly separable in the final X.
y = np.sign(np.dot(X, coefs))  # add information to data
X += np.random.randn(n_sample, n_dim) / 2.  # add noise
def hinge(w, X, y):
    """Hinge loss, as used in SVM.

    Parameters
    ----------
    w : array-like, shape (n_dim + 1,)
        Linear weights followed by the intercept as last element.
    X : array-like, shape (n_sample, n_dim)
        Samples.
    y : array-like, shape (n_sample,)
        Class label of each sample (-1 or +1).

    Returns
    -------
    loss : ndarray, shape (n_sample,)
        ``max(0, 1 - y * pred)`` for each sample: zero for samples that are
        correctly classified with a margin of at least 1.
    """
    # Append a column of ones so that the last weight acts as the intercept.
    pred = np.dot(np.c_[X, np.ones(len(X))], w)
    return np.maximum(0., 1. - pred * np.asarray(y))
def log(w, X, y):
    """Log loss, as used in logistic regression.

    Parameters
    ----------
    w : array-like, shape (n_dim + 1,)
        Linear weights followed by the intercept as last element.
    X : array-like, shape (n_sample, n_dim)
        Samples.
    y : array-like, shape (n_sample,)
        Class label of each sample (-1 or +1).

    Returns
    -------
    loss : ndarray, shape (n_sample,)
        ``log2(1 + exp(-y * dist))`` for each sample; strictly positive for
        any finite decision value, unlike the hinge loss.
    """
    # Append a column of ones so that the last weight acts as the intercept.
    dist = np.dot(np.c_[X, np.ones(len(X))], w)
    # log2(1 + exp(z)) == logaddexp(0, z) / ln(2). logaddexp stays finite
    # where the naive exp(z) overflows to inf for badly misclassified samples.
    return np.logaddexp(0., -np.asarray(y) * dist) / np.log(2.)
# Registry mapping a loss name to the function computing per-sample losses.
loss_funcs = {'hinge': hinge, 'log': log}
def sum_loss(w, X, y, loss):
    """Sum losses across samples.

    Parameters
    ----------
    w : array-like
        Weights handed to the loss function.
    X : array-like
        Samples handed to the loss function.
    y : array-like
        Labels handed to the loss function.
    loss : str or callable
        Either a key of ``loss_funcs`` ('hinge' or 'log'), or directly a
        function ``f(w, X, y)`` returning the per-sample losses.

    Returns
    -------
    total : float
        Sum of the per-sample losses; the scalar objective to minimise.
    """
    loss_func = loss if callable(loss) else loss_funcs[loss]
    return np.sum(loss_func(w, X, y))
def fit(X, y, loss, maxiter):
    """Find the weights w that minimise the summed loss over the samples.

    Parameters
    ----------
    X : ndarray, shape (n_sample, n_dim)
        Samples.
    y : ndarray, shape (n_sample,)
        Class label of each sample.
    loss : str
        Key of ``loss_funcs`` selecting the loss to minimise.
    maxiter : int
        Maximum number of iterations of the optimiser.

    Returns
    -------
    w : ndarray, shape (n_dim + 1,)
        Weights (intercept last) reached after at most ``maxiter``
        iterations of ``scipy.optimize.fmin`` (Nelder-Mead simplex).
    """
    from scipy.optimize import fmin
    # Always start from the same point: fit is called once per animation
    # frame with a growing maxiter, and a fresh random start on every call
    # would make consecutive frames incomparable. A private RandomState is
    # used so the global numpy random stream is left untouched.
    w0 = np.random.RandomState(0).rand(X.shape[1] + 1)
    # disp=False: hitting maxiter is expected here, so the optimiser's
    # per-call convergence message would only flood the console.
    return fmin(sum_loss, w0, args=(X, y, loss), maxiter=maxiter, disp=False)
def plot(loss, ax, maxiter):
    """Fit one loss and draw the samples, the boundary and the losses.

    Parameters
    ----------
    loss : str
        Key of ``loss_funcs`` selecting the loss to fit and display.
    ax : matplotlib.axes.Axes
        Axes to draw on. It is cleared first, so the function can be called
        repeatedly on the same axes.
    maxiter : int
        Maximum number of optimiser iterations, passed on to ``fit``.
    """
    # This function runs once per animation frame: without clearing, every
    # frame would pile new markers and lines on top of the previous ones.
    ax.clear()

    # Fit
    w = fit(X, y, loss, maxiter)

    # Get individual losses, scaled by their spread to size markers and lines
    losses = loss_funcs[loss](w, X, y)
    spread = np.std(losses)
    if spread > 0:
        widths = losses / spread
    else:
        # All losses are identical: avoid dividing by zero and simply flag
        # the samples that carry a non-zero loss.
        widths = (losses > 0).astype(float)

    # Plot data: a black halo growing with the loss, under a class-coloured dot
    ax.scatter(X[:, 0], X[:, 1], s=widths * 50, c='k', zorder=-1)
    ax.scatter(X[:, 0], X[:, 1], s=40, c=y, cmap=plt.cm.RdBu_r,
               edgecolor=None)

    # Plot coef (line): the boundary is the set coefs . x + intercept = 0
    coefs, intercept = w[:-1], w[-1]
    norm_sq = np.dot(coefs, coefs)
    if norm_sq > 0:  # with all-zero weights there is no boundary to draw
        if coefs[1] != 0:
            xx = np.linspace(-2, 2)
            yy = -(coefs[0] * xx + intercept) / coefs[1]
        else:
            # Vertical boundary: x is constant, y spans the view
            yy = np.linspace(-2, 2)
            xx = np.full_like(yy, -intercept / coefs[0])
        ax.plot(xx, yy, 'k', linewidth=2)

        # Plot data distances to coef: link each sample to its orthogonal
        # projection on the boundary. The vector form gives the same point
        # as intersecting the two lines, without dividing by the slope.
        offsets = (np.dot(X, coefs) + intercept) / norm_sq
        feet = X - np.outer(offsets, coefs)
        for ii in np.flatnonzero(widths > 0):
            ax.plot([X[ii, 0], feet[ii, 0]], [X[ii, 1], feet[ii, 1]],
                    linewidth=widths[ii] * 2, color='k', zorder=-2)

    ax.set_xlim(-2, 2)
    ax.set_ylim(-2, 2)
# One row of two panels (one per loss) sharing both axes, on a white figure.
fig, axes = plt.subplots(nrows=1, ncols=2, figsize=[8., 4.], facecolor='w',
                         sharex=True, sharey=True)
def animate(maxiter):
    """Redraw both panels for one animation frame.

    Parameters
    ----------
    maxiter : int
        Frame value, used as the optimiser's iteration budget: the first
        panel shows the log loss fit, the second the hinge loss fit.
    """
    panels = zip(axes, ['log', 'hinge'])
    for panel, loss_name in panels:
        plot(loss_name, panel, maxiter=maxiter)
# Each frame value (1..49) is passed to animate() as the iteration budget.
# The animation object is bound to a name so that it stays referenced.
ani = animation.FuncAnimation(fig, animate, frames=range(1, 50),
                              interval=100, repeat=True, blit=False)
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment