comparison pylearn/gd/sgd.py @ 1474:a57f4839a9d8
merge
| field    | value                                      |
|----------|--------------------------------------------|
| author   | James Bergstra <bergstrj@iro.umontreal.ca> |
| date     | Wed, 18 May 2011 10:52:42 -0400            |
| parents  | ddda8d93c162 cac29ca79a74                  |
| children | 0e6ca7eecc72                               |
Changes from 1473:91a475ca9b6d to 1474:a57f4839a9d8, as a unified diff (indentation restored from the side-by-side view):

```diff
--- pylearn/gd/sgd.py  1473:91a475ca9b6d
+++ pylearn/gd/sgd.py  1474:a57f4839a9d8
@@ -14,26 +14,26 @@
     :param stepsizes: step by this amount times the negative gradient on each iteration
     :type stepsizes: [symbolic] scalar or list of one [symbolic] scalar per param
     """
     try:
         iter(stepsizes)
-    except:
+    except Exception:
         stepsizes = [stepsizes for p in params]
     if len(params) != len(grads):
         raise ValueError('params and grads have different lens')
     updates = [(p, p - step * gp) for (step, p, gp) in zip(stepsizes, params, grads)]
     return updates
 
 def sgd_momentum_updates(params, grads, stepsizes, momentum=0.9):
     # if stepsizes is just a scalar, expand it to match params
     try:
         iter(stepsizes)
-    except:
+    except Exception:
         stepsizes = [stepsizes for p in params]
     try:
         iter(momentum)
-    except:
+    except Exception:
         momentum = [momentum for p in params]
     if len(params) != len(grads):
         raise ValueError('params and grads have different lens')
     headings = [theano.shared(numpy.zeros_like(p.get_value(borrow=True))) for p in params]
     updates = []
```
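The three changed lines in this hunk all replace a bare `except:` with `except Exception:`. A bare except also traps `KeyboardInterrupt` and `SystemExit`, which derive from `BaseException`, so a Ctrl-C landing during the scalar-vs-iterable probe would be silently misread as "stepsizes is a scalar". A minimal, self-contained sketch of the probe (the helper name `expand_stepsizes` is ours, not the module's):

```python
# Illustrative sketch of the scalar-vs-list probe used by sgd_updates
# and sgd_momentum_updates; `expand_stepsizes` is a hypothetical name.
def expand_stepsizes(stepsizes, params):
    try:
        iter(stepsizes)              # raises TypeError for a scalar
    except Exception:                # narrowed: Ctrl-C still propagates
        stepsizes = [stepsizes for p in params]
    return stepsizes

print(expand_stepsizes(0.1, ['w', 'b']))         # [0.1, 0.1]
print(expand_stepsizes([0.1, 0.2], ['w', 'b']))  # [0.1, 0.2]
```

Catching `TypeError` alone would be narrower still, since that is what `iter()` raises on a non-iterable; this changeset settles for `Exception`.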
The second hunk, later in the same file, tightens the gradient handling in the class-based driver and adds a length check:

```diff
@@ -77,11 +77,12 @@
 
         if self.stepsize.ndim != 0:
             raise TypeError('stepsize must be a scalar', stepsize)
 
         self.params = params
-        self.gparams = theano.tensor.grad(cost, self.params) if gradients is None else gradients
+        self.gparams = [theano.tensor.grad(cost, self.params)] if gradients is None else gradients
+        assert len(self.params) == len(self.gparams)
 
         self._updates = (dict((p, p - self.stepsize * g) for p, g in zip(self.params, self.gparams)))
         if updates is not None:
             self._updates.update(updates)
 
```
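For context, a minimal end-to-end sketch (not part of the changeset) of how these update expressions are consumed: `theano.tensor.grad` over a list of parameters returns one gradient per parameter, the pairs become a `theano.function` update dict, and the new `assert` in the second hunk is exactly that one-gradient-per-parameter contract. This assumes a working install of (legacy, now-unmaintained) Theano; the toy cost and the names `w`, `b`, `train` are ours:

```python
# Self-contained sketch of the update-dict pattern in the second hunk;
# runs against the Theano API as it existed in this era.
import numpy
import theano
import theano.tensor as tt

w = theano.shared(numpy.asarray([3.0, -2.0]), name='w')
b = theano.shared(numpy.asarray(0.5), name='b')
params = [w, b]
cost = tt.sum(w ** 2) + b ** 2
stepsize = theano.shared(numpy.asarray(0.1), name='stepsize')

gparams = theano.tensor.grad(cost, params)  # one gradient per parameter
assert len(params) == len(gparams)          # the contract the new assert checks

updates = dict((p, p - stepsize * g) for p, g in zip(params, gparams))
train = theano.function([], cost, updates=updates)
for _ in range(5):
    print(train())                          # cost shrinks each call
```

Note that the constructor requires `self.stepsize` to be 0-dimensional (the `ndim != 0` check above), which is why a single shared scalar works here.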