import os
data_folder = os.path.join(os.path.expanduser("~"), "Data", "cifar-10-batches-py")
batch1_filename = os.path.join(data_folder, "data_batch_1")
import pickle
# Bugfix thanks to: http://stackoverflow.com/questions/11305790/pickle-incompatability-of-numpy-arrays-between-python-2-and-3
def unpickle(filename):
    """Load a Python-2 pickled CIFAR-10 batch file under Python 3.

    The latin1 encoding works around the pickle incompatibility for
    numpy arrays serialized under Python 2 (see the link above).
    """
    with open(filename, 'rb') as batch_file:
        return pickle.load(batch_file, encoding='latin1')
# Sanity check: pull one image out of the first batch and display it.
batch1 = unpickle(batch1_filename)
image_index = 100  # arbitrary sample index to visualise
image = batch1['data'][image_index]
# CIFAR-10 stores each image as a flat 3072-value row; Fortran order ('F')
# is used so the three colour channels separate correctly on reshape.
image = image.reshape((32,32, 3), order='F')
import numpy as np
# The Fortran-order reshape leaves the image rotated 90 degrees;
# rotate clockwise once to display it upright.
image = np.rot90(image, -1)
# IPython magic (notebook only): render matplotlib figures inline.
%matplotlib inline
from matplotlib import pyplot as plt
plt.imshow(image)
<matplotlib.image.AxesImage at 0x7fe57222a2e8>
import numpy as np
# Load the CIFAR-10 training batches into `batches`. Because of the
# `break`, only batch 1 is actually loaded -- see chapter for explanation.
batches = []
for i in range(1, 6):
    batch_filename = os.path.join(data_folder, "data_batch_{}".format(i))
    # BUG FIX: the original appended unpickle(batch1_filename), silently
    # ignoring the per-iteration filename built on the previous line, so
    # removing the `break` would have loaded batch 1 five times.
    batches.append(unpickle(batch_filename))
    break  # IMPORTANT -- see chapter for explanation of this line
# Stack the loaded batches into one (n_samples, 3072) matrix and scale
# pixel values into [0, 1] as float32 for the network.
X = np.vstack([batch['data'] for batch in batches])
X = np.array(X) / X.max()
X = X.astype(np.float32)
from sklearn.preprocessing import OneHotEncoder
# Collect the class labels from every loaded batch.
# FIX: np.hstack requires a sequence of arrays; passing a bare generator
# is deprecated and raises TypeError on modern NumPy, so wrap it in a list.
y = np.hstack([batch['labels'] for batch in batches]).flatten()
# One-hot encode the 10 classes into a dense float32 matrix
# (required because the network below is trained with regression/MSE).
y = OneHotEncoder().fit_transform(y.reshape(y.shape[0],1)).todense()
y = y.astype(np.float32)
# NOTE(review): sklearn.cross_validation was removed in scikit-learn 0.20;
# newer versions use sklearn.model_selection.
from sklearn.cross_validation import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2)
# Reshape flat 3072-value rows into (channels, height, width) for Conv2D layers.
X_train = X_train.reshape(-1, 3, 32, 32)
X_test = X_test.reshape(-1, 3, 32, 32)
from lasagne import layers
# (name, layer class) pairs consumed by nolearn's NeuralNet below;
# per-layer parameters are passed to NeuralNet using these names as prefixes.
# NOTE(review): this list rebinds the name `layers`, shadowing the module
# imported on the line above. It works only because the module attributes
# are resolved while the list literal is evaluated, but a distinct name
# (e.g. `layer_spec`) would be clearer.
layers=[
    ('input', layers.InputLayer),
    ('conv1', layers.Conv2DLayer),
    ('pool1', layers.MaxPool2DLayer),
    ('conv2', layers.Conv2DLayer),
    ('pool2', layers.MaxPool2DLayer),
    ('conv3', layers.Conv2DLayer),
    ('pool3', layers.MaxPool2DLayer),
    ('hidden4', layers.DenseLayer),
    ('hidden5', layers.DenseLayer),
    ('output', layers.DenseLayer),
    ]
from nolearn.lasagne import NeuralNet
from lasagne.nonlinearities import sigmoid, softmax
# Three conv/pool stages followed by two dense layers and a softmax output.
# Per-layer keyword arguments are matched by prefix to the names declared
# in `layers` above (e.g. conv1_* configures the 'conv1' layer).
nnet = NeuralNet(layers=layers,
                 # (batch, channels, height, width); None = variable batch size
                 input_shape=(None, 3, 32, 32),
                 conv1_num_filters=32,
                 conv1_filter_size=(3, 3),
                 conv2_num_filters=64,
                 conv2_filter_size=(2, 2),
                 conv3_num_filters=128,
                 conv3_filter_size=(2, 2),
                 # pool*_ds is the (old-API) downsampling factor of each max-pool
                 pool1_ds=(2,2),
                 pool2_ds=(2,2),
                 pool3_ds=(2,2),
                 hidden4_num_units=500,
                 hidden5_num_units=500,
                 output_num_units=10,  # one unit per CIFAR-10 class
                 output_nonlinearity=softmax,
                 update_learning_rate=0.01,
                 update_momentum=0.9,
                 # regression=True trains with MSE against the one-hot targets
                 # instead of a classification objective.
                 regression=True,
                 max_epochs=3,
                 verbose=1)
nnet.fit(X_train, y_train)
input (None, 3, 32, 32) produces 3072 outputs conv1 (None, 32, 30, 30) produces 28800 outputs pool1 (None, 32, 15, 15) produces 7200 outputs conv2 (None, 64, 14, 14) produces 12544 outputs pool2 (None, 64, 7, 7) produces 3136 outputs conv3 (None, 128, 6, 6) produces 4608 outputs pool3 (None, 128, 3, 3) produces 1152 outputs hidden4 (None, 500) produces 500 outputs hidden5 (None, 500) produces 500 outputs output (None, 10) produces 10 outputs Epoch | Train loss | Valid loss | Train / Val | Valid acc | Dur --------|--------------|--------------|---------------|-------------|------- 1 | 0.090018 | 0.090022 | 0.999963 | | 103.9s 2 | 0.089988 | 0.090000 | 0.999858 | | 103.8s 3 | 0.089961 | 0.089982 | 0.999759 | | 104.2s
/usr/local/lib/python3.4/dist-packages/Lasagne-0.1dev-py3.4.egg/lasagne/init.py:30: UserWarning: The uniform initializer no longer uses Glorot et al.'s approach to determine the bounds, but defaults to the range (-0.01, 0.01) instead. Please use the new GlorotUniform initializer to get the old behavior. GlorotUniform is now the default for all layers. warnings.warn("The uniform initializer no longer uses Glorot et al.'s "
NeuralNet(X_tensor_type=<function tensor4 at 0x7fe55b73a0d0>, batch_iterator_test=<nolearn.lasagne.BatchIterator object at 0x7fe559e70710>, batch_iterator_train=<nolearn.lasagne.BatchIterator object at 0x7fe559e706d8>, conv1_filter_size=(3, 3), conv1_num_filters=32, conv2_filter_size=(2, 2), conv2_num_filters=64, conv3_filter_size=(2, 2), conv3_num_filters=128, eval_size=0.2, hidden4_num_units=500, hidden5_num_units=500, input_shape=(None, 3, 32, 32), layers=[('input', <class 'lasagne.layers.input.InputLayer'>), ('conv1', <class 'lasagne.layers.conv.Conv2DLayer'>), ('pool1', <class 'lasagne.layers.pool.MaxPool2DLayer'>), ('conv2', <class 'lasagne.layers.conv.Conv2DLayer'>), ('pool2', <class 'lasagne.layers.pool.MaxPool2DLayer'>), ('conv3', <class..., <class 'lasagne.layers.dense.DenseLayer'>), ('output', <class 'lasagne.layers.dense.DenseLayer'>)], loss=None, max_epochs=3, more_params={}, objective=<class 'lasagne.objectives.Objective'>, objective_loss_function=<function mse at 0x7fe559e622f0>, on_epoch_finished=(), on_training_finished=(), output_nonlinearity=<theano.tensor.nnet.nnet.Softmax object at 0x7fe57cfddba8>, output_num_units=10, pool1_ds=(2, 2), pool2_ds=(2, 2), pool3_ds=(2, 2), regression=True, update=<function nesterov_momentum at 0x7fe559e628c8>, update_learning_rate=0.01, update_momentum=0.9, use_label_encoder=False, verbose=1, y_tensor_type=TensorType(float32, matrix))
from sklearn.metrics import f1_score
# The network outputs a probability-like row per sample; argmax converts
# both predictions and one-hot ground truth back to class indices.
y_pred = nnet.predict(X_test)
print(f1_score(y_test.argmax(axis=1), y_pred.argmax(axis=1)))
0.0364246254873
/usr/local/lib/python3.4/dist-packages/sklearn/metrics/metrics.py:1771: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no predicted samples. 'precision', 'predicted', average, warn_for)
import os
data_folder = os.path.join(os.path.expanduser("~"), "Data", "cifar-10-batches-py")
batch1_filename = os.path.join(data_folder, "data_batch_1")
import pickle
# Bugfix thanks to: http://stackoverflow.com/questions/11305790/pickle-incompatability-of-numpy-arrays-between-python-2-and-3
def unpickle(filename):
    """Deserialize a CIFAR-10 batch pickled under Python 2.

    Uses encoding='latin1' so numpy byte arrays survive the
    Python 2 -> Python 3 pickle incompatibility.
    """
    with open(filename, 'rb') as handle:
        return pickle.load(handle, encoding='latin1')
# Repeat of the earlier sanity check: load and display one sample image.
batch1 = unpickle(batch1_filename)
image_index = 100  # arbitrary sample index to visualise
image = batch1['data'][image_index]
# Fortran order ('F') separates the colour channels correctly when
# reshaping the flat 3072-value row into (32, 32, 3).
image = image.reshape((32,32, 3), order='F')
import numpy as np
# Undo the rotation introduced by the Fortran-order reshape.
image = np.rot90(image, -1)
# IPython magic (notebook only): render matplotlib figures inline.
%matplotlib inline
from matplotlib import pyplot as plt
plt.imshow(image)
<matplotlib.image.AxesImage at 0x7f12f47efac8>
import theano
from theano import tensor as T
# Minimal Theano example: build a symbolic graph computing the hypotenuse
# of a right triangle, then compile it into a callable function.
a = T.dscalar()  # symbolic double-precision scalar
b = T.dscalar()
c = T.sqrt(a ** 2 + b ** 2)
f = theano.function([a,b], c)
f(3, 4)  # expected result: 5.0
array(5.0)
from sklearn.datasets import load_iris
iris = load_iris()
# Lasagne/Theano expect float32 features and int32 integer targets.
X = iris.data.astype(np.float32)
y_true = iris.target.astype(np.int32)
# NOTE(review): sklearn.cross_validation was removed in scikit-learn 0.20;
# newer versions use sklearn.model_selection.
from sklearn.cross_validation import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y_true, random_state=14)
import lasagne
# Input layer declared as (10, n_features).
# NOTE(review): training below passes the full X_train at once, so the
# declared batch size of 10 appears not to be enforced here -- confirm
# against the Lasagne version in use.
input_layer = lasagne.layers.InputLayer(shape=(10, X.shape[1]))
# Hidden layer: 12 sigmoid units fed from the input layer.
hidden_layer = lasagne.layers.DenseLayer(input_layer, num_units=12, nonlinearity=lasagne.nonlinearities.sigmoid)
/usr/local/lib/python3.4/dist-packages/Lasagne-0.1dev-py3.4.egg/lasagne/init.py:30: UserWarning: The uniform initializer no longer uses Glorot et al.'s approach to determine the bounds, but defaults to the range (-0.01, 0.01) instead. Please use the new GlorotUniform initializer to get the old behavior. GlorotUniform is now the default for all layers. warnings.warn("The uniform initializer no longer uses Glorot et al.'s "
# Output layer: 3 softmax units, one per iris class.
output_layer = lasagne.layers.DenseLayer(hidden_layer, num_units=3,
                                         nonlinearity=lasagne.nonlinearities.softmax)
import theano.tensor as T
# Symbolic placeholders for the network input and the true class labels.
net_input = T.matrix('net_input')
# NOTE(review): layer.get_output(...) is the pre-release Lasagne API;
# later versions replaced it with lasagne.layers.get_output(layer, inputs).
net_output = output_layer.get_output(net_input)
true_output = T.ivector('true_output')
# Mean categorical cross-entropy between predicted probabilities and labels.
loss = T.mean(T.nnet.categorical_crossentropy(net_output, true_output))
# Collect every trainable parameter in the network and build SGD updates.
all_params = lasagne.layers.get_all_params(output_layer)
updates = lasagne.updates.sgd(loss, all_params, learning_rate=0.1)
/usr/local/lib/python3.4/dist-packages/Lasagne-0.1dev-py3.4.egg/lasagne/layers/helper.py:52: UserWarning: get_all_layers() has been changed to return layers in topological order. The former implementation is still available as get_all_layers_old(), but will be removed before the first release of Lasagne. To ignore this warning, use `warnings.filterwarnings('ignore', '.*topo.*')`. warnings.warn("get_all_layers() has been changed to return layers in "
import theano
# Compile two functions: `train` performs one gradient step (applies
# `updates` as a side effect and returns the loss); `get_output` is the
# plain forward pass.
train = theano.function([net_input, true_output], loss, updates=updates)
get_output = theano.function([net_input], net_output)
# Full-batch gradient descent for 1000 iterations.
for n in range(1000):
    train(X_train, y_train)
y_output = get_output(X_test)
import numpy as np
# Convert per-class probabilities to predicted class indices.
y_pred = np.argmax(y_output, axis=1)
from sklearn.metrics import f1_score
print(f1_score(y_test, y_pred))
1.0
import numpy as np
from PIL import Image, ImageDraw, ImageFont
from skimage.transform import resize
from skimage import transform as tf
from skimage.measure import label, regionprops
from sklearn.utils import check_random_state
from sklearn.preprocessing import OneHotEncoder
from sklearn.cross_validation import train_test_split
def create_captcha(text, shear=0, size=(100, 24)):
    """Render `text` as a grayscale CAPTCHA image with an optional shear.

    Parameters
    ----------
    text : str
        The string to draw.
    shear : float
        Shear factor passed to skimage's AffineTransform.
    size : tuple of int
        (width, height) of the generated image.

    Returns
    -------
    2-D float array with values normalized into [0, 1].
    """
    im = Image.new("L", size, "black")
    draw = ImageDraw.Draw(im)
    # NOTE(review): requires the Coval.otf font file in the working directory.
    font = ImageFont.truetype(r"Coval.otf", 22)
    draw.text((2, 2), text, fill=1, font=font)
    image = np.array(im)
    affine_tf = tf.AffineTransform(shear=shear)
    image = tf.warp(image, affine_tf)
    # FIX: guard against a blank render (max == 0) -- e.g. a glyph sheared
    # out of frame -- which would otherwise produce a NaN array from 0/0.
    max_value = image.max()
    return image / max_value if max_value > 0 else image
def segment_image(image):
    """Split `image` into subimages, one per connected non-zero region.

    Falls back to returning the whole image in a one-element list when
    no connected region is found, so callers always get at least one
    subimage.
    """
    labelled = label(image > 0)
    pieces = []
    for region in regionprops(labelled):
        min_row, min_col, max_row, max_col = region.bbox
        pieces.append(image[min_row:max_row, min_col:max_col])
    # Guarantee a non-empty result.
    return pieces if pieces else [image]
# Seeded RNG so the generated CAPTCHA dataset is reproducible.
random_state = check_random_state(14)
# Target classes: the 26 uppercase letters.
letters = list("ABCDEFGHIJKLMNOPQRSTUVWXYZ")
# Candidate shear factors applied when rendering each CAPTCHA: 0.0 to 0.45.
shear_values = np.arange(0, 0.5, 0.05)
def generate_sample(random_state=None):
    """Generate one training sample.

    Returns a (captcha_image, target) pair where the image is a 20x20
    rendering of a randomly chosen letter with a random shear, and the
    target is that letter's index into `letters`.
    """
    rng = check_random_state(random_state)
    chosen_letter = rng.choice(letters)
    chosen_shear = rng.choice(shear_values)
    image = create_captcha(chosen_letter, shear=chosen_shear, size=(20, 20))
    return image, letters.index(chosen_letter)
# Generate 3000 (image, letter-index) samples with the shared seeded RNG.
dataset, targets = zip(*(generate_sample(random_state) for i in range(3000)))
dataset = np.array(dataset, dtype='float')
targets = np.array(targets)
# One-hot encode the 26 letter classes into a dense float32 matrix
# (the network is trained as regression against these targets).
onehot = OneHotEncoder()
y = onehot.fit_transform(targets.reshape(targets.shape[0],1))
y = y.todense().astype(np.float32)
# Keep only the first segmented region of each image, resized to 20x20.
# NOTE(review): assumes each captcha segments into a single letter region.
dataset = np.array([resize(segment_image(sample)[0], (20, 20)) for sample in dataset])
# Flatten the 20x20 images into 400-feature rows scaled into [0, 1].
X = dataset.reshape((dataset.shape[0], dataset.shape[1] * dataset.shape[2]))
X = X / X.max()
X = X.astype(np.float32)
# 90/10 train/test split, seeded for reproducibility.
X_train, X_test, y_train, y_test = \
    train_test_split(X, y, train_size=0.9, random_state=14)
from lasagne import layers
# (name, layer class) pairs consumed by nolearn's NeuralNet below.
# NOTE(review): rebinding `layers` shadows the module imported on the line
# above; it works because the module attributes are resolved while the
# list literal is evaluated, but a distinct name would be clearer.
layers=[
    ('input', layers.InputLayer),
    ('hidden', layers.DenseLayer),
    ('output', layers.DenseLayer),
    ]
from lasagne import updates
from nolearn.lasagne import NeuralNet
from lasagne.nonlinearities import sigmoid, softmax
# Single-hidden-layer network: 400 inputs -> 100 sigmoid units -> 26 softmax.
net1 = NeuralNet(layers=layers,
                 # (n_samples, 400); nolearn takes the feature count from here
                 input_shape=X.shape,
                 hidden_num_units=100,
                 output_num_units=26,  # one output unit per letter
                 hidden_nonlinearity=sigmoid,
                 output_nonlinearity=softmax,
                 # Explicit zero initial bias for the hidden layer.
                 # NOTE(review): dtype is float64 while the rest of the data
                 # is float32 -- confirm this mix is intended.
                 hidden_b=np.zeros((100,), dtype=np.float64),
                 update=updates.momentum,
                 update_learning_rate=0.9,
                 update_momentum=0.1,
                 # regression=True trains with MSE against the one-hot targets.
                 regression=True,
                 max_epochs=1000,
                 )
net1.fit(X_train, y_train)
NeuralNet(X_tensor_type=<function matrix at 0x7f12ed0819d8>, batch_iterator_test=<nolearn.lasagne.BatchIterator object at 0x7f12e5039c50>, batch_iterator_train=<nolearn.lasagne.BatchIterator object at 0x7f12e5039c18>, eval_size=0.2, hidden_b=array([ 0., 0., ..., 0., 0.]), hidden_nonlinearity=<theano.tensor.elemwise.Elemwise object at 0x7f12ecd109e8>, hidden_num_units=100, input_shape=(3000, 400), layers=[('input', <class 'lasagne.layers.input.InputLayer'>), ('hidden', <class 'lasagne.layers.dense.DenseLayer'>), ('output', <class 'lasagne.layers.dense.DenseLayer'>)], loss=None, max_epochs=1000, more_params={}, objective=<class 'lasagne.objectives.Objective'>, objective_loss_function=<function mse at 0x7f12e8300598>, on_epoch_finished=(), on_training_finished=(), output_nonlinearity=<theano.tensor.nnet.nnet.Softmax object at 0x7f12ecd195c0>, output_num_units=26, regression=True, update=<function momentum at 0x7f12e8300ae8>, update_learning_rate=0.9, update_momentum=0.1, use_label_encoder=False, verbose=0, y_tensor_type=TensorType(float32, matrix))
# Predict probability rows for the test set and reduce to class indices.
y_pred = net1.predict(X_test)
y_pred = y_pred.argmax(axis=1)
assert len(y_pred) == len(X_test)
# y_test is one-hot (2-D); convert it to class indices to match y_pred.
if len(y_test.shape) > 1:
    y_test = y_test.argmax(axis=1)
print(f1_score(y_test, y_pred))
1.0