%pylab inline
import lasagne
import theano
import theano.tensor as T
Populating the interactive namespace from numpy and matplotlib
# Symbolic Theano variables standing in for one minibatch of inputs
# and its integer class labels (actual values are supplied at call time).
hr = 120 * "-"  # horizontal rule string, reused below to separate displayed values
input_var = T.tensor4('X')   # 4-D float tensor (minibatch of images)
target_var = T.ivector('y')  # 1-D int32 vector (one label per example)
input_var, hr, target_var
(X, '------------------------------------------------------------------------------------------------------------------------', y)
# Build a small CNN: two conv layers, a max-pool, then two dense layers,
# each dense layer preceded by 50% dropout; softmax output over 10 classes.
from lasagne.nonlinearities import leaky_rectify, softmax

network = lasagne.layers.InputLayer((None, 3, 32, 32), input_var)
network = lasagne.layers.Conv2DLayer(network, 64, (3, 3), nonlinearity=leaky_rectify)
network = lasagne.layers.Conv2DLayer(network, 32, (3, 3), nonlinearity=leaky_rectify)
network = lasagne.layers.Pool2DLayer(network, (3, 3), stride=2, mode='max')
# Orthogonal init on the first dense layer; dropout regularizes both.
network = lasagne.layers.DenseLayer(
    lasagne.layers.dropout(network, 0.5), 128,
    nonlinearity=leaky_rectify, W=lasagne.init.Orthogonal())
network = lasagne.layers.DenseLayer(
    lasagne.layers.dropout(network, 0.5), 10, nonlinearity=softmax)
network
<lasagne.layers.dense.DenseLayer at 0x4280e50>
# Training objective: mean categorical cross-entropy against target_var,
# plus a small (1e-4) L2 penalty over all network parameters.
prediction = lasagne.layers.get_output(network)
crossentropy = lasagne.objectives.categorical_crossentropy(prediction, target_var)
l2_penalty = lasagne.regularization.regularize_network_params(
    network, lasagne.regularization.l2)
loss = crossentropy.mean() + 1e-4 * l2_penalty
loss
Elemwise{add,no_inplace}.0
# Nesterov-momentum SGD update rules over all trainable parameters.
params = lasagne.layers.get_all_params(network, trainable=True)
updates = lasagne.updates.nesterov_momentum(
    loss, params, learning_rate=0.01, momentum=0.9)
# Compiled training step: one call applies the updates in place and
# returns the training loss for the given minibatch.
train_fn = theano.function([input_var, target_var], loss, updates=updates)
params, hr, updates, hr, train_fn
([W, b, W, b, W, b, W, b], '------------------------------------------------------------------------------------------------------------------------', OrderedDict([(W, Elemwise{add,no_inplace}.0), (b, Elemwise{add,no_inplace}.0), (W, Elemwise{add,no_inplace}.0), (b, Elemwise{add,no_inplace}.0), (W, Elemwise{add,no_inplace}.0), (b, Elemwise{add,no_inplace}.0), (W, Elemwise{add,no_inplace}.0), (b, Elemwise{add,no_inplace}.0), (<TensorType(float64, 4D)>, Elemwise{sub,no_inplace}.0), (<TensorType(float64, vector)>, Elemwise{sub,no_inplace}.0), (<TensorType(float64, 4D)>, Elemwise{sub,no_inplace}.0), (<TensorType(float64, vector)>, Elemwise{sub,no_inplace}.0), (<TensorType(float64, matrix)>, Elemwise{sub,no_inplace}.0), (<TensorType(float64, vector)>, Elemwise{sub,no_inplace}.0), (<TensorType(float64, matrix)>, Elemwise{sub,no_inplace}.0), (<TensorType(float64, vector)>, Elemwise{sub,no_inplace}.0)]), '------------------------------------------------------------------------------------------------------------------------', <theano.compile.function_module.Function at 0x5ef71d0>)
# Train for 100 epochs over `training_data`.
# NOTE(review): `training_data` is never defined in this notebook (the run
# below fails with NameError) — it must be provided beforehand as an iterable
# of (input_batch, target_batch) numpy-array pairs matching input_var/target_var.
for epoch in range(100):
    # Use a distinct name for the running total: the original reused `loss`,
    # which clobbered the symbolic loss expression defined above.
    epoch_loss = 0
    for input_batch, target_batch in training_data:
        epoch_loss += train_fn(input_batch, target_batch)
    print("Epoch %d: Loss %g" % (epoch + 1, epoch_loss / len(training_data)))
# Inference path: deterministic=True disables the dropout layers so the
# network produces stable test-time predictions.
test_prediction = lasagne.layers.get_output(network, deterministic=True)
predicted_class = T.argmax(test_prediction, axis=1)
predict_fn = theano.function([input_var], predicted_class)
# NOTE(review): `test_data` must be defined elsewhere — not shown in this file.
print("Predicted class for first test input: %r" % predict_fn(test_data[0]))
--------------------------------------------------------------------------- NameError Traceback (most recent call last) <ipython-input-9-0428f5063366> in <module>() 2 for epoch in range(100): 3 loss = 0 ----> 4 for input_batch, target_batch in training_data: 5 loss += train_fn(input_batch, target_batch) 6 print("Epoch %d: Loss %g" % (epoch + 1, loss / len(training_data))) NameError: name 'training_data' is not defined