Ordinal Regression¶

Ordinal regression aims at fitting a model to some data $(X, Y)$, where $Y$ is an ordinal variable. To do so, we use a VPG model with a specific likelihood (gpflow.likelihoods.Ordinal).

In [1]:

import gpflow
import numpy as np
import matplotlib
%matplotlib inline
matplotlib.rcParams['figure.figsize'] = (12, 6)
plt = matplotlib.pyplot

In [2]:

#make a one dimensional ordinal regression problem

# This function generates a set of inputs X, 
# quantitative output f (latent) and ordinal values Y

def generate_data(num_data):
    # First generate random inputs
    X = np.random.rand(num_data, 1)
    
    # Now generate values of a latent GP
    kern = gpflow.kernels.RBF(1, lengthscales=0.1)
    K = kern.compute_K_symm(X)
    f = np.random.multivariate_normal(mean=np.zeros(num_data), cov=K).reshape(-1, 1)
    
    # Finally convert f values into ordinal values Y
    Y = np.round((f + f.min())*3)
    Y = Y - Y.min()
    Y = np.asarray(Y, np.float64)

    return X, f, Y

np.random.seed(1)
num_data = 20
X, f, Y = generate_data(num_data)

plt.figure(figsize=(11, 6))
plt.plot(X, f, '.')
plt.ylabel('latent function value')

plt.twinx()
plt.plot(X, Y, 'kx', mew=1.5)
plt.ylabel('observed data value')

Out[2]:

Text(0, 0.5, 'observed data value')

In [3]:

# construct ordinal likelihood - bin_edges is the same as unique(Y) but centered
bin_edges = np.array(np.arange(np.unique(Y).size + 1), dtype=float)
bin_edges = bin_edges - bin_edges.mean()
likelihood=gpflow.likelihoods.Ordinal(bin_edges)

# build a model with this likelihood
m = gpflow.models.VGP(X, Y, 
                   kern=gpflow.kernels.Matern32(1),
                   likelihood=likelihood)

# fit the model
gpflow.train.ScipyOptimizer().minimize(m)

INFO:tensorflow:Optimization terminated with:
  Message: b'CONVERGENCE: REL_REDUCTION_OF_F_<=_FACTR*EPSMCH'
  Objective function value: 25.484796
  Number of iterations: 199
  Number of functions evaluations: 220

INFO:tensorflow:Optimization terminated with:
  Message: b'CONVERGENCE: REL_REDUCTION_OF_F_<=_FACTR*EPSMCH'
  Objective function value: 25.484796
  Number of iterations: 199
  Number of functions evaluations: 220

In [4]:

# here we'll plot the expected value of Y +- 2 std deviations, as if the distribution were Gaussian
plt.figure(figsize=(11, 6))
Xtest = np.linspace(m.X.read_value().min(), m.X.read_value().max(), 100).reshape(-1, 1)
mu, var = m.predict_y(Xtest)
line, = plt.plot(Xtest, mu, lw=2)
col=line.get_color()
plt.plot(Xtest, mu+2*np.sqrt(var), '--', lw=2, color=col)
plt.plot(Xtest, mu-2*np.sqrt(var), '--', lw=2, color=col)
plt.plot(m.X.read_value(), m.Y.read_value(), 'kx', mew=2)

Out[4]:

[<matplotlib.lines.Line2D at 0x7f5320b53908>]

In [5]:

# to see the predictive density, try predicting every possible discrete value for Y.
def pred_density(m):
    Xtest = np.linspace(m.X.read_value().min(), m.X.read_value().max(), 100).reshape(-1, 1)
    ys = np.arange(m.Y.read_value().max()+1)
    densities = []
    for y in ys:
        Ytest = np.ones_like(Xtest) * y
        # Predict the log density
        densities.append(m.predict_density(Xtest, Ytest))
    return np.hstack(densities).T

In [6]:

fig = plt.figure(figsize=(14, 6))
plt.imshow(np.exp(pred_density(m)), interpolation='nearest',
           extent=[m.X.read_value().min(), m.X.read_value().max(), -0.5, m.Y.read_value().max()+0.5],
           origin='lower', aspect='auto', cmap=plt.cm.viridis)
plt.colorbar()
plt.plot(X, Y, 'kx', mew=2, scalex=False, scaley=False)

Out[6]:

[<matplotlib.lines.Line2D at 0x7f53208364a8>]

In [7]:

# Predictive density for a single input x=0.5
x_new = 0.5
ys = np.arange(np.max(m.Y.value+1)).reshape([-1, 1])
x_new_vec = x_new*np.ones_like(ys)
# for predict_density x and y need to have the same number of rows
dens_new = np.exp(m.predict_density(x_new_vec, ys))
fig = plt.figure(figsize=(8, 4))
plt.bar(x=ys.flatten(), height=dens_new.flatten())

Out[7]:

<BarContainer object of 8 artists>

In [ ]: