pylearn: comparison of nnet_ops.py @ 117:3ef569b92fba
ported nnet_ops to new theano
author | James Bergstra <bergstrj@iro.umontreal.ca>
date | Wed, 07 May 2008 15:28:17 -0400
parents | 76e5c0f37165
children | 2ca8dccba270
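Note on the change (editorial summary, not part of the changeset): the port replaces the old `gof.op.Op` style, where `__init__` converted the inputs, set `self.inputs`/`self.outputs`, and `perform(self)` read `i.data`, with the new interface visible on the right-hand side of the diff: `make_node` wraps the inputs and returns a `theano.Apply` node, and `perform(self, node, input_storage, output_storage)` writes results into `output_storage`. A minimal sketch of that pattern, using a hypothetical `DoubleOp` that does not appear in nnet_ops.py:

```python
# Minimal sketch of the new-style Op interface adopted in this changeset.
# DoubleOp is a hypothetical example, not part of nnet_ops.py.
import theano
from theano import tensor
import numpy

class DoubleOp(theano.Op):
    def make_node(self, x):
        # graph construction: wrap the input and declare the output type
        x = tensor.as_tensor(x)
        return theano.Apply(self, [x], [x.type.make_result()])
    def perform(self, node, input_storage, output_storage):
        # numeric evaluation: read inputs, write the result into output storage
        x, = input_storage
        output_storage[0][0] = 2 * numpy.asarray(x)
```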
116:9330d941fa1f | 117:3ef569b92fba |
---|---|
1 import theano | 1 import theano |
2 from theano import tensor, gof, scalar | 2 from theano import tensor, scalar |
3 import numpy | 3 import numpy |
4 | 4 |
5 ############ | 5 ############ |
6 # | 6 # |
7 # SCALAR OPS | 7 # SCALAR OPS |
8 # | 8 # |
9 | 9 |
10 class ScalarSigmoid(scalar.FloatUnaryScalarOp): | 10 class ScalarSigmoid(scalar.UnaryScalarOp): |
11 @staticmethod | 11 @staticmethod |
12 def st_impl(x): | 12 def st_impl(x): |
13 if x < -30.0: | 13 if x < -30.0: |
14 return 0.0 | 14 return 0.0 |
15 if x > 30.0: | 15 if x > 30.0: |
18 def impl(self, x): | 18 def impl(self, x): |
19 return ScalarSigmoid.st_impl(x) | 19 return ScalarSigmoid.st_impl(x) |
20 def grad(self, (x,), (gz,)): | 20 def grad(self, (x,), (gz,)): |
21 y = scalar_sigmoid(x) | 21 y = scalar_sigmoid(x) |
22 return [gz * y * (1.0 - y)] | 22 return [gz * y * (1.0 - y)] |
23 def c_foreach(self, (x,), (z,), sub): | 23 def c_code(self, (x,), (z,), sub): |
24 if 'float' in self.inputs[0].dtype: | 24 if 'float' in self.inputs[0].dtype: |
25 return """%(z)s = | 25 return """%(z)s = |
26 %(x)s < -30.0 | 26 %(x)s < -30.0 |
27 ? 0.0 | 27 ? 0.0 |
28 : %(x)s > 30.0 | 28 : %(x)s > 30.0 |
29 ? 1.0 | 29 ? 1.0 |
30 : 1.0 /(1.0+exp(-%(x)s));""" % locals() | 30 : 1.0 /(1.0+exp(-%(x)s));""" % locals() |
31 raise NotImplementedError('only floatingpoint is implemented') | 31 return NotImplemented#Error('only floatingpoint is implemented') |
32 scalar_sigmoid = gof.op.constructor(ScalarSigmoid) | 32 scalar_sigmoid = ScalarSigmoid(scalar.upgrade_to_float, name='scalar_sigmoid') |
33 Sigmoid, sigmoid, SigmoidInplace, sigmoid_inplace =\ | 33 sigmoid = tensor.Elemwise(scalar_sigmoid, name='sigmoid') |
34 tensor.broadcast(ScalarSigmoid, 'Sigmoid') | 34 |
35 | 35 class ScalarSoftplus(scalar.UnaryScalarOp): |
36 class ScalarSoftplus(scalar.FloatUnaryScalarOp): | |
37 @staticmethod | 36 @staticmethod |
38 def static_impl(x): | 37 def static_impl(x): |
39 if x < -30.0: | 38 if x < -30.0: |
40 return 0.0 | 39 return 0.0 |
41 if x > 30.0: | 40 if x > 30.0: |
43 return numpy.log1p(numpy.exp(x)) | 42 return numpy.log1p(numpy.exp(x)) |
44 def impl(self, x): | 43 def impl(self, x): |
45 return ScalarSoftplus.static_impl(x) | 44 return ScalarSoftplus.static_impl(x) |
46 def grad(self, (x,), (gz,)): | 45 def grad(self, (x,), (gz,)): |
47 return [gz * scalar_sigmoid(x)] | 46 return [gz * scalar_sigmoid(x)] |
48 def c_foreach(self, (x,), (z,), sub): | 47 def c_code(self, (x,), (z,), sub): |
49 if 'float' in self.inputs[0].dtype: | 48 if 'float' in self.inputs[0].dtype: |
50 return """%(z)s = | 49 return """%(z)s = |
51 %(x)s < -30.0 | 50 %(x)s < -30.0 |
52 ? 0.0 | 51 ? 0.0 |
53 : %(x)s > 30.0 | 52 : %(x)s > 30.0 |
54 ? %(x)s | 53 ? %(x)s |
55 : log1p(exp(%(x)s));""" % locals() | 54 : log1p(exp(%(x)s));""" % locals() |
56 raise NotImplementedError('only floating point x is implemented') | 55 return NotImplemented#Error('only floating point x is implemented') |
57 scalar_softplus = gof.op.constructor(ScalarSoftplus) | 56 scalar_softplus = ScalarSoftplus(scalar.upgrade_to_float, name='scalar_softplus') |
58 Softplus, softplus, SoftplusInplace, softplus_inplace =\ | 57 softplus = tensor.Elemwise(scalar_softplus, name='softplus') |
59 tensor.broadcast(ScalarSoftplus, 'Softplus') | |
60 | 58 |
61 | 59 |
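Both scalar ops clamp their input at |x| > 30 to avoid overflow in `exp`, and `ScalarSoftplus.grad` returns `gz * scalar_sigmoid(x)`. A quick finite-difference check of that derivative (illustrative only, not part of the changeset):

```python
# Check that d/dx log1p(exp(x)) equals the logistic sigmoid, which is the
# identity ScalarSoftplus.grad relies on. Values are arbitrary examples.
import numpy

x, eps = 1.5, 1e-6
numeric = (numpy.log1p(numpy.exp(x + eps)) - numpy.log1p(numpy.exp(x - eps))) / (2 * eps)
analytic = 1.0 / (1.0 + numpy.exp(-x))   # sigmoid(x)
assert abs(numeric - analytic) < 1e-6
```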
62 ############ | 60 ############ |
63 # | 61 # |
64 # TENSOR OPS | 62 # TENSOR OPS |
65 # | 63 # |
66 | 64 |
67 | 65 class CrossentropySoftmax1HotWithBias(theano.Op): |
68 class CrossentropySoftmax1HotWithBias(gof.op.Op): | |
69 """A special compound L{Op} for the output of neural-net classifiers. | 66 """A special compound L{Op} for the output of neural-net classifiers. |
70 | 67 |
71 @type x: is a matrix of floats (32 or 64) | 68 @type x: is a matrix of floats (32 or 64) |
72 @type b: is a [row] vector of floats (32 or 64), length is number of cols in x | 69 @type b: is a [row] vector of floats (32 or 64), length is number of cols in x |
73 @type y_idx: a [column] vector of int (32 or 64), length is number of rows in x | 70 @type y_idx: a [column] vector of int (32 or 64), length is number of rows in x |
88 i'th example. | 85 i'th example. |
89 | 86 |
90 """ | 87 """ |
91 nin=3 | 88 nin=3 |
92 nout=2 | 89 nout=2 |
93 def __init__(self, x, b, y_idx, **kwargs): | 90 def __init__(self, **kwargs): |
94 x = tensor._as_tensor(x) | 91 theano.Op.__init__(self, **kwargs) |
95 b = tensor._as_tensor(b) | 92 |
96 y_idx = tensor._as_tensor(y_idx) | 93 def make_node(self, x, b, y_idx): |
97 if len(x.broadcastable) != 2 \ | 94 x = tensor.as_tensor(x) |
98 or x.dtype not in ['float32', 'float64']: | 95 b = tensor.as_tensor(b) |
| 96 y_idx = tensor.as_tensor(y_idx) |
| 97 if x.type.ndim != 2 \ |
| 98 or x.type.dtype not in ['float32', 'float64']: |
99 raise ValueError('x must be 2-d tensor of floats') | 99 raise ValueError('x must be 2-d tensor of floats') |
100 if len(b.broadcastable) != 1 \ | 100 if b.type.ndim != 1 \ |
101 or x.dtype not in ['float32', 'float64']: | 101 or x.type.dtype not in ['float32', 'float64']: |
102 raise ValueError('x must be 1-d tensor of floats') | 102 raise ValueError('x must be 1-d tensor of floats') |
103 if len(y_idx.broadcastable) != 1 \ | 103 if y_idx.type.ndim != 1 \ |
104 or y_idx.dtype not in ['int32', 'int64']: | 104 or y_idx.type.dtype not in ['int32', 'int64']: |
105 raise ValueError('x must be 1-d tensor of ints') | 105 raise ValueError('x must be 1-d tensor of ints') |
106 | 106 |
107 # TODO: Is this correct? It used to be y, not y_idx | 107 # TODO: Is this correct? It used to be y, not y_idx |
108 nll = tensor.Tensor(x.dtype, y_idx.broadcastable) | 108 nll = tensor.Tensor(x.type.dtype, |
| 109 y_idx.type.broadcastable).make_result() |
109 # nll = Tensor(x.dtype, y.broadcastable) | 110 # nll = Tensor(x.dtype, y.broadcastable) |
110 sm = tensor.Tensor(x.dtype, x.broadcastable) | 111 sm = x.type.make_result() |
111 self.inputs = [x, b, y_idx] | 112 return theano.Apply(self, [x, b, y_idx],[nll, sm]) |
112 self.outputs = [nll, sm] | 113 def perform(self, node, input_storage, output_storage): |
113 def perform(self): | 114 x, b, y_idx = input_storage |
114 x, b, y_idx = [i.data for i in self.inputs] | |
115 if b.shape[0] != x.shape[1]: | 115 if b.shape[0] != x.shape[1]: |
116 raise ValueError('b must have same number of columns as x') | 116 raise ValueError('b must have same number of columns as x') |
117 if y_idx.shape[0] != x.shape[0]: | 117 if y_idx.shape[0] != x.shape[0]: |
118 raise ValueError('y_idx must have same number of rows as x') | 118 raise ValueError('y_idx must have same number of rows as x') |
119 | 119 |
122 for i in xrange(sm.shape[0]): | 122 for i in xrange(sm.shape[0]): |
123 row = x[i] + b | 123 row = x[i] + b |
124 sm[i] = numpy.exp(row - numpy.max(row)) #softmax | 124 sm[i] = numpy.exp(row - numpy.max(row)) #softmax |
125 sm[i] *= 1.0 / numpy.sum(sm[i]) #vector scale | 125 sm[i] *= 1.0 / numpy.sum(sm[i]) #vector scale |
126 nll[i] = -numpy.log( sm[i, y_idx[i]]) #cross-entropy | 126 nll[i] = -numpy.log( sm[i, y_idx[i]]) #cross-entropy |
127 self.outputs[0].data = nll | 127 output_storage[0][0] = nll |
128 self.outputs[1].data = sm | 128 output_storage[1][0] = sm |
129 def grad(self, (x, b, y_idx), (g_nll, g_sm)): | 129 def grad(self, (x, b, y_idx), (g_nll, g_sm)): |
130 if g_sm is not None: | 130 if g_sm is not None: |
131 raise NotImplementedError() | 131 raise NotImplementedError() |
132 nll, sm = crossentropy_softmax_1hot_with_bias(x, b, y_idx) | 132 nll, sm = crossentropy_softmax_1hot_with_bias(x, b, y_idx) |
133 dx = CrossentropySoftmax1HotWithBiasDx(g_nll, sm, y_idx).outputs[0] | 133 dx = CrossentropySoftmax1HotWithBiasDx()(g_nll, sm, y_idx) |
134 db = tensor.Sum(dx, axis = [0]).outputs[0] | 134 db = tensor.sum(dx, axis = [0]) |
135 return dx, db, None | 135 return dx, db, None |
136 | 136 |
137 def c_headers(self): return ['<iostream>'] | 137 def c_headers(self): return ['<iostream>'] |
138 def c_code(self, (x, b, y_idx), (nll, sm), sub): | 138 def c_code(self, (x, b, y_idx), (nll, sm), sub): |
139 # this implementation was lifted from | 139 # this implementation was lifted from |
278 + log(sum); | 278 + log(sum); |
279 //mat_at(y,i,0) = -log( mat_at(s,i,t[i])); //less accurate? | 279 //mat_at(y,i,0) = -log( mat_at(s,i,t[i])); //less accurate? |
280 //mat_at(y,i,0) = - mat_at(x,i,t[i]) - mat_at(b,0,t[i]) + (discount_max ? maxi : 0.0) + log(sum); | 280 //mat_at(y,i,0) = - mat_at(x,i,t[i]) - mat_at(b,0,t[i]) + (discount_max ? maxi : 0.0) + log(sum); |
281 } | 281 } |
282 """ % dict(locals(), **sub) | 282 """ % dict(locals(), **sub) |
283 | 283 crossentropy_softmax_1hot_with_bias = CrossentropySoftmax1HotWithBias() |
284 crossentropy_softmax_1hot_with_bias = \ | 284 |
285 gof.op.constructor(CrossentropySoftmax1HotWithBias) | 285 class CrossentropySoftmax1HotWithBiasDx (theano.Op): |
286 | |
287 class CrossentropySoftmax1HotWithBiasDx (gof.op.Op): | |
288 nin=3 | 286 nin=3 |
289 nout=1 | 287 nout=1 |
290 """Gradient wrt x of the CrossentropySoftmax1Hot Op""" | 288 """Gradient wrt x of the CrossentropySoftmax1Hot Op""" |
291 def __init__(self, dy, sm, y_idx,**kwargs): | 289 def __init__(self, **kwargs): |
292 dy = tensor._as_tensor(dy) | 290 theano.Op.__init__(self,**kwargs) |
293 sm = tensor._as_tensor(sm) | 291 def make_node(self, dy, sm, y_idx,**kwargs): |
294 y_idx = tensor._as_tensor(y_idx) | 292 dy = tensor.as_tensor(dy) |
295 self.inputs = [dy, sm, y_idx] | 293 sm = tensor.as_tensor(sm) |
296 self.outputs = [tensor.Tensor(sm.dtype, sm.broadcastable)] | 294 y_idx = tensor.as_tensor(y_idx) |
297 def perform(self): | 295 return theano.Apply(self, [dy, sm, y_idx],[sm.type.make_result()]) |
298 dy,sm,y_idx = [i.data for i in self.inputs] | 296 def perform(self, node, input_storage, output_storage): |
| 297 dy,sm,y_idx = input_storage |
299 dx = numpy.zeros_like(sm) | 298 dx = numpy.zeros_like(sm) |
300 for i in xrange(sm.shape[0]): | 299 for i in xrange(sm.shape[0]): |
301 dx[i] = dy[i] * sm[i] #vector scale | 300 dx[i] = dy[i] * sm[i] #vector scale |
302 dx[i, y_idx[i]] -= dy[i] #scalar decrement | 301 dx[i, y_idx[i]] -= dy[i] #scalar decrement |
303 self.outputs[0].data = dx | 302 output_storage[0][0] = dx |
304 def grad(self, *args): | 303 def grad(self, *args): |
305 raise NotImplementedError() | 304 raise NotImplementedError() |
306 def c_code(self, (dnll, sm, y_idx), (dx,), sub): | 305 def c_code(self, (dnll, sm, y_idx), (dx,), sub): |
307 return """ | 306 return """ |
308 | 307 |
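The `perform` loop of CrossentropySoftmax1HotWithBiasDx, `dx[i] = dy[i] * sm[i]` followed by `dx[i, y_idx[i]] -= dy[i]`, is the usual softmax cross-entropy gradient `dy[i] * (sm[i] - onehot(y_idx[i]))`. A small check with made-up values (illustrative only, not part of the changeset):

```python
# Check that the Dx perform loop matches the closed-form gradient.
import numpy

dy = numpy.array([2.0])
sm = numpy.array([[0.2, 0.5, 0.3]])
y_idx = numpy.array([1])

dx_loop = dy[0] * sm[0]               # vector scale, as in perform
dx_loop[y_idx[0]] -= dy[0]            # scalar decrement at the target class

onehot = numpy.zeros_like(sm[0])
onehot[y_idx[0]] = 1.0
dx_closed = dy[0] * (sm[0] - onehot)

assert numpy.allclose(dx_loop, dx_closed)
```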