pylearn: comparison mlp_factory_approach.py @ 191:e816821c1e50
added early stopping to mlp.__call__
author   | James Bergstra <bergstrj@iro.umontreal.ca>
date     | Wed, 14 May 2008 20:04:44 -0400
parents  | aa7a3ecbcc90
children | c5a7105fa40b
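
The change described by this revision is a validation-based early-stopping loop in MultiLayerPerceptron.__call__: the training set is split into a minimization portion and a validation portion, the model is updated for as many stages as the stopper allows, and the parameter copy that scored best on the validation set is returned. Below is a minimal, framework-free sketch of that loop; train_with_early_stopping, model.update, and model.score are hypothetical stand-ins for the stopper-driven loop, _Model.update, and the 'loss_01' output in the diff, and are not part of the pylearn code.

    import copy

    def train_with_early_stopping(model, minset, valset, n_stages):
        # Keep a copy of the best model seen so far, judged on the
        # validation set; n_stages plays the role of stopper.NStages.
        best, best_score = copy.copy(model), float('inf')
        for stage in range(n_stages):
            model.update(minset)           # one minimization pass
            score = model.score(valset)    # e.g. mean 0/1 loss on the validation set
            if score < best_score:
                best_score = score
                best = copy.copy(model)
        return best
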
190:aa7a3ecbcc90 | 191:e816821c1e50
1 import copy | 1 import copy, sys |
2 import numpy | 2 import numpy |
3 | 3 |
4 import theano | 4 import theano |
5 import theano.tensor as t | 5 from theano import tensor as t |
6 | 6 |
7 import dataset | 7 from tlearn import dataset, nnet_ops, stopper |
8 import nnet_ops | |
9 | 8 |
10 def _randshape(*shape): | 9 def _randshape(*shape): |
11 return (numpy.random.rand(*shape) -0.5) * 0.001 | 10 return (numpy.random.rand(*shape) -0.5) * 0.001 |
12 | 11 |
13 class NeuralNet(object): | 12 def _cache(d, key, valfn): |
13 #valfn() is only evaluated if key isn't in dictionary d | |
14 if key not in d: | |
15 d[key] = valfn() | |
16 return d[key] | |
14 | 17 |
15 class _Model(object): | 18 class _Model(object): |
16 def __init__(self, nnet, params): | 19 def __init__(self, algo, params): |
17 self.nnet = nnet | 20 self.algo = algo |
18 self.params = params | 21 self.params = params |
22 v = algo.v | |
23 self.update_fn = algo._fn([v.input, v.target] + v.params, [v.nll] + v.new_params) | |
24 self._fn_cache = {} | |
19 | 25 |
20 def __copy__(self): | 26 def __copy__(self): |
21 return _Model(self.nnet, [copy.copy(p) for p in params]) | 27 return _Model(self.algo, [copy.copy(p) for p in params]) |
22 | 28 |
23 def update(self, trainset, stopper=None): | 29 def update(self, input_target): |
24 """Update this model from more training data.""" | 30 """Update this model from more training data.""" |
25 v = self.nnet.v | 31 params = self.params |
26 params = self.params | 32 #TODO: why should we have to unpack target like this? |
27 update_fn = self.nnet._fn([v.input, v.target] + v.params, [v.nll] + v.new_params) | 33 for input, target in input_target: |
28 if stopper is not None: | 34 self.update_fn(input, target[:,0], *params) |
29 raise NotImplementedError() | |
30 else: | |
31 for i in xrange(100): | |
32 for input, target in trainset.minibatches(['input', 'target'], | |
33 minibatch_size=min(32, len(trainset))): | |
34 dummy = update_fn(input, target[:,0], *params) | |
35 if 0: print dummy[0] #the nll | |
36 | 35 |
37 def __call__(self, testset, | 36 def __call__(self, testset, fieldnames=['output_class']): |
38 output_fieldnames=['output_class'], | 37 """Apply this model (as a function) to new data""" |
39 test_stats_collector=None, | 38 #TODO: cache fn between calls |
40 copy_inputs=False, | 39 assert 'input' == testset.fieldNames()[0] |
41 put_stats_in_output_dataset=True, | 40 assert len(testset.fieldNames()) <= 2 |
42 output_attributes=[]): | 41 v = self.algo.v |
43 """Apply this model (as a function) to new data""" | 42 outputs = [getattr(v, name) for name in fieldnames] |
44 v = self.nnet.v | 43 inputs = [v.input] + ([v.target] if 'target' in testset else []) |
45 outputs = [getattr(self.nnet.v, name) for name in output_fieldnames] | 44 inputs.extend(v.params) |
46 if 'target' in testset: | 45 theano_fn = _cache(self._fn_cache, (tuple(inputs), tuple(outputs)), |
47 fn = self.nnet._fn([v.input, v.target] + v.params, outputs) | 46 lambda: self.algo._fn(inputs, outputs)) |
48 return dataset.ApplyFunctionDataSet(testset, | 47 lambda_fn = lambda *args: theano_fn(*(list(args) + self.params)) |
49 lambda input, target: fn(input, target[:,0], *self.params), | 48 return dataset.ApplyFunctionDataSet(testset, lambda_fn, fieldnames) |
50 output_fieldnames) | |
51 else: | |
52 fn = self.nnet._fn([v.input] + v.params, outputs) | |
53 return dataset.ApplyFunctionDataSet(testset, | |
54 lambda input: fn(input, *self.params), | |
55 output_fieldnames) | |
56 def _fn(self, inputs, outputs): | |
57 #it is possible for this function to implement function caching | |
58 #... but not necessarily desirable. | |
59 #- caching ruins the possibility of multi-threaded learning | |
60 #- caching demands more efficiency in the face of resizing inputs | |
61 #- caching makes it really hard to borrow references to function outputs | |
62 return theano.function(inputs, outputs, unpack_single=False, linker=self.linker) | |
63 | 49 |
64 def __init__(self, ninputs, nhid, nclass, lr, nepochs, | 50 class AutonameVars(object): |
51 def __init__(self, dct): | |
52 for key, val in dct.items(): | |
53 if type(key) is str and hasattr(val, 'name'): | |
54 val.name = key | |
55 self.__dict__.update(dct) | |
56 | |
57 class MultiLayerPerceptron(object): | |
58 | |
59 def __init__(self, ninputs, nhid, nclass, lr, | |
65 l2coef=0.0, | 60 l2coef=0.0, |
66 linker='c&py', | 61 linker='c&py', |
67 hidden_layer=None): | 62 hidden_layer=None, |
68 class Vars: | 63 early_stopper=None, |
69 def __init__(self, lr, l2coef): | 64 validation_portion=0.2, |
65 V_extern=None): | |
66 class V_intern(AutonameVars): | |
67 def __init__(v_self, lr, l2coef, **kwargs): | |
70 lr = t.constant(lr) | 68 lr = t.constant(lr) |
71 l2coef = t.constant(l2coef) | 69 l2coef = t.constant(l2coef) |
72 input = t.matrix('input') # n_examples x n_inputs | 70 input = t.matrix() # n_examples x n_inputs |
73 target = t.ivector('target') # n_examples x 1 | 71 target = t.ivector() # len: n_examples |
74 W2 = t.matrix('W2') | 72 W2, b2 = t.matrix(), t.vector() |
75 b2 = t.vector('b2') | |
76 | 73 |
77 if hidden_layer: | 74 if hidden_layer: |
78 hid, hid_params, hid_ivals, hid_regularization = hidden_layer(input) | 75 hid, hid_params, hid_ivals, hid_regularization = hidden_layer(input) |
79 else: | 76 else: |
80 W1 = t.matrix('W1') | 77 W1, b1 = t.matrix(), t.vector() |
81 b1 = t.vector('b1') | |
82 hid = t.tanh(b1 + t.dot(input, W1)) | 78 hid = t.tanh(b1 + t.dot(input, W1)) |
83 hid_params = [W1, b1] | 79 hid_params = [W1, b1] |
84 hid_regularization = l2coef * t.sum(W1*W1) | 80 hid_regularization = l2coef * t.sum(W1*W1) |
85 hid_ivals = lambda : [_randshape(ninputs, nhid), _randshape(nhid)] | 81 hid_ivals = lambda : [_randshape(ninputs, nhid), _randshape(nhid)] |
86 | 82 |
91 output_class = t.argmax(activations,1) | 87 output_class = t.argmax(activations,1) |
92 loss_01 = t.neq(output_class, target) | 88 loss_01 = t.neq(output_class, target) |
93 g_params = t.grad(nll + regularization, params) | 89 g_params = t.grad(nll + regularization, params) |
94 new_params = [t.sub_inplace(p, lr * gp) for p,gp in zip(params, g_params)] | 90 new_params = [t.sub_inplace(p, lr * gp) for p,gp in zip(params, g_params)] |
95 self.__dict__.update(locals()); del self.self | 91 self.__dict__.update(locals()); del self.self |
92 AutonameVars.__init__(v_self, locals()) | |
96 self.nhid = nhid | 93 self.nhid = nhid |
97 self.nclass = nclass | 94 self.nclass = nclass |
98 self.nepochs = nepochs | 95 self.v = V_intern(**locals()) if V_extern is None else V_extern(**locals()) |
99 self.v = Vars(lr, l2coef) | |
100 self.params = None | |
101 self.linker = linker | 96 self.linker = linker |
97 self.early_stopper = early_stopper if early_stopper is not None else lambda: stopper.NStages(10,1) | |
98 self.validation_portion = validation_portion | |
99 | |
100 def _fn(self, inputs, outputs): | |
101 # Caching here would hamper multi-threaded apps | |
102 # prefer caching in _Model.__call__ | |
103 return theano.function(inputs, outputs, unpack_single=False, linker=self.linker) | |
102 | 104 |
103 def __call__(self, trainset=None, iparams=None): | 105 def __call__(self, trainset=None, iparams=None): |
106 """Allocate and optionally train a model""" | |
104 if iparams is None: | 107 if iparams is None: |
105 iparams = [_randshape(self.nhid, self.nclass), _randshape(self.nclass)]\ | 108 iparams = [_randshape(self.nhid, self.nclass), _randshape(self.nclass)]\ |
106 + self.v.hid_ivals() | 109 + self.v.hid_ivals() |
107 rval = NeuralNet._Model(self, iparams) | 110 rval = _Model(self, iparams) |
108 if trainset: | 111 if trainset: |
109 rval.update(trainset) | 112 if len(trainset) == sys.maxint: |
113 raise NotImplementedError('Learning from infinite streams is not supported') | |
114 nval = int(self.validation_portion * len(trainset)) | |
115 nmin = len(trainset) - nval | |
116 assert nmin >= 0 | |
117 minset = trainset[:nmin] #real training set for minimizing loss | |
118 valset = trainset[nmin:] #validation set for early stopping | |
119 best = rval | |
120 for stp in self.early_stopper(): | |
121 rval.update( | |
122 trainset.minibatches(['input', 'target'], minibatch_size=min(32, | |
123 len(trainset)))) | |
124 if stp.set_score: | |
125 stp.score = rval(valset, ['loss_01']) | |
126 if (stp.score < stp.best_score): | |
127 best = copy.copy(rval) | |
128 rval = best | |
110 return rval | 129 return rval |
111 | 130 |
112 | 131 |
132 import unittest | |
133 | |
134 class TestMLP(unittest.TestCase): | |
135 def test0(self): | |
136 | |
137 training_set1 = dataset.ArrayDataSet(numpy.array([[0, 0, 0], | |
138 [0, 1, 1], | |
139 [1, 0, 1], | |
140 [1, 1, 1]]), | |
141 {'input':slice(2),'target':2}) | |
142 training_set2 = dataset.ArrayDataSet(numpy.array([[0, 0, 0], | |
143 [0, 1, 1], | |
144 [1, 0, 0], | |
145 [1, 1, 1]]), | |
146 {'input':slice(2),'target':2}) | |
147 test_data = dataset.ArrayDataSet(numpy.array([[0, 0, 0], | |
148 [0, 1, 1], | |
149 [1, 0, 0], | |
150 [1, 1, 1]]), | |
151 {'input':slice(2)}) | |
152 | |
153 learn_algo = MultiLayerPerceptron(2, 10, 2, .1 | |
154 , linker='c&py' | |
155 , early_stopper = lambda:stopper.NStages(100,1)) | |
156 | |
157 model1 = learn_algo(training_set1) | |
158 | |
159 model2 = learn_algo(training_set2) | |
160 | |
161 n_match = 0 | |
162 for o1, o2 in zip(model1(test_data), model2(test_data)): | |
163 #print o1 | |
164 #print o2 | |
165 n_match += (o1 == o2) | |
166 | |
167 assert n_match == (numpy.sum(training_set1.fields()['target'] == | |
168 training_set2.fields()['target'])) | |
169 | |
113 if __name__ == '__main__': | 170 if __name__ == '__main__': |
114 training_set1 = dataset.ArrayDataSet(numpy.array([[0, 0, 0], | 171 unittest.main() |
115 [0, 1, 1], | |
116 [1, 0, 1], | |
117 [1, 1, 1]]), | |
118 {'input':slice(2),'target':2}) | |
119 training_set2 = dataset.ArrayDataSet(numpy.array([[0, 0, 0], | |
120 [0, 1, 1], | |
121 [1, 0, 0], | |
122 [1, 1, 1]]), | |
123 {'input':slice(2),'target':2}) | |
124 test_data = dataset.ArrayDataSet(numpy.array([[0, 0, 0], | |
125 [0, 1, 1], | |
126 [1, 0, 0], | |
127 [1, 1, 1]]), | |
128 {'input':slice(2)}) | |
129 | 172 |
130 learn_algo = NeuralNet(2, 10, 3, .1, 1000) | |
131 | |
132 model1 = learn_algo(training_set1) | |
133 | |
134 model2 = learn_algo(training_set2) | |
135 | |
136 n_match = 0 | |
137 for o1, o2 in zip(model1(test_data), model2(test_data)): | |
138 n_match += (o1 == o2) | |
139 | |
140 print n_match, numpy.sum(training_set1.fields()['target'] == | |
141 training_set2.fields()['target']) | |
142 |
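
A second, smaller change: _Model.__call__ no longer recompiles a Theano function on every application. Compiled functions are memoized in self._fn_cache, keyed on the (inputs, outputs) signature, via the _cache helper. The helper below is copied from the diff; get_compiled and its compile_fn argument are illustrative stand-ins for self.algo._fn / theano.function, not part of the pylearn code.

    def _cache(d, key, valfn):
        # valfn() is only evaluated if key isn't already in d
        if key not in d:
            d[key] = valfn()
        return d[key]

    _fn_cache = {}

    def get_compiled(inputs, outputs, compile_fn):
        # dictionary keys must be hashable, hence the tuples
        return _cache(_fn_cache, (tuple(inputs), tuple(outputs)),
                      lambda: compile_fn(inputs, outputs))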
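
The new AutonameVars base class gives each symbolic variable the name of the local variable that holds it, which is why V_intern can drop the explicit 'input', 'target', 'W1', ... name strings that the old Vars class passed to the tensor constructors. Here is a self-contained sketch of the idiom; Sym and build_vars are hypothetical stand-ins for a Theano variable and the V_intern constructor.

    class AutonameVars(object):
        def __init__(self, dct):
            for key, val in dct.items():
                if type(key) is str and hasattr(val, 'name'):
                    val.name = key
            self.__dict__.update(dct)

    class Sym(object):
        name = None            # stand-in for a Theano variable's name slot

    def build_vars():
        input, target = Sym(), Sym()
        # after this call, v.input.name == 'input' and v.target.name == 'target'
        v = AutonameVars(locals())
        return v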