comparison deep/stacked_dae/v_sylvain/stacked_dae.py @ 368:d391ad815d89
Fix a bug in the log-likelihood function for use with sigmoid output non-linearities
author:    SylvainPL <sylvain.pannetier.lebeuf@umontreal.ca>
date:      Fri, 23 Apr 2010 12:12:03 -0400
parents:   14b28e43ce4e
children:  (none)
--- deep/stacked_dae/v_sylvain/stacked_dae.py@367:f24b10e43a6f
+++ deep/stacked_dae/v_sylvain/stacked_dae.py@368:d391ad815d89
                                               dtype = theano.config.floatX) )
         # initialize the baises b as a vector of n_out 0s
         self.b = theano.shared( value=numpy.zeros((n_out,),
                                             dtype = theano.config.floatX) )
         # compute vector of class-membership. This is a sigmoid instead of
-        #a softmax to be able to classify as nothing later
-##        self.p_y_given_x = T.nnet.softmax(T.dot(input, self.W)+self.b)
+        #a softmax to be able later to classify as nothing
+##        self.p_y_given_x = T.nnet.softmax(T.dot(input, self.W)+self.b) #row-wise
         self.p_y_given_x = T.nnet.sigmoid(T.dot(input, self.W)+self.b)
 
         # compute prediction as class whose probability is maximal in
         # symbolic form
         self.y_pred=T.argmax(self.p_y_given_x, axis=1)
 
         # list of parameters for this layer
         self.params = [self.W, self.b]
 
 
     def negative_log_likelihood(self, y):
-        return -T.mean(T.log(self.p_y_given_x)[T.arange(y.shape[0]),y])
+##        return -T.mean(T.log(self.p_y_given_x)[T.arange(y.shape[0]),y])
+        return -T.mean(T.log(self.p_y_given_x)[T.arange(y.shape[0]),y]+T.sum(T.log(1-self.p_y_given_x), axis=1)-T.log(1-self.p_y_given_x)[T.arange(y.shape[0]),y])
+
+
+##    def kullback_leibler(self,y):
+##        return -T.mean(T.log(1/float(self.p_y_given_x))[T.arange(y.shape[0]),y])
+
 
     def errors(self, y):
         # check if y has same dimension of y_pred
         if y.ndim != self.y_pred.ndim:
             raise TypeError('y should have the same shape as self.y_pred',
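Why the fix matters: with a softmax, the class probabilities sum to one, so maximizing log p_y implicitly pushes the other classes down. With independent sigmoid units (chosen here so an example can later be classified as "nothing" when every unit is low), the old cost -mean(log p[y]) ignores the non-target units entirely and nothing stops them from saturating at 1. The corrected cost is the full one-hot binary cross-entropy, -(log p_y + sum_{k != y} log(1 - p_k)), which the new return statement computes in vectorized form as log p[y] + sum_k log(1 - p_k) - log(1 - p)[y]. A minimal numpy sketch (not part of the changeset; sizes and names are illustrative) checking that the rearrangement equals the one-hot cross-entropy:

# Sketch only: verify the new expression against a one-hot reference.
import numpy

rng = numpy.random.RandomState(0)
p = rng.uniform(0.05, 0.95, size=(4, 10))   # sigmoid outputs, batch of 4
y = numpy.array([3, 0, 7, 7])               # integer class targets
rows = numpy.arange(y.shape[0])

# Expression from the changeset:
# log p[y] + sum_k log(1 - p_k) - log(1 - p)[y]
new_nll = -numpy.mean(numpy.log(p)[rows, y]
                      + numpy.sum(numpy.log(1 - p), axis=1)
                      - numpy.log(1 - p)[rows, y])

# Reference: full binary cross-entropy against a one-hot target.
t = numpy.zeros_like(p)
t[rows, y] = 1.0
ref = -numpy.mean(numpy.sum(t * numpy.log(p)
                            + (1 - t) * numpy.log(1 - p), axis=1))

assert numpy.allclose(new_nll, ref)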
(second hunk, in the denoising autoencoder further down the same file)
 
         #Or use a Tanh everything is always between 0 and 1, the range is
         #changed so it remain the same as when sigmoid is used
         self.y = (T.tanh(T.dot(self.tilde_x, self.W ) + self.b)+1.0)/2.0
 
-        z_a = T.dot(self.y, self.W_prime) + self.b_prime
-        self.z = (T.tanh(z_a )+1.0) / 2.0
+        self.z = (T.tanh(T.dot(self.y, self.W_prime) + self.b_prime)+1.0) / 2.0
         #To ensure to do not have a log(0) operation
         if self.z <= 0:
             self.z = 0.000001
         if self.z >= 1:
             self.z = 0.999999
 
-        self.L = - T.sum( self.x*T.log(self.z) + (1-self.x)*T.log(1-self.z), axis=1 )
+        self.L = - T.sum( self.x*T.log(self.z) + (1.0-self.x)*T.log(1.0-self.z), axis=1 )
 
         self.cost = T.mean(self.L)
 
         self.params = [ self.W, self.b, self.b_prime ]
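Two details of this reconstruction cost are worth noting. First, the rescaled tanh used for self.y and self.z is exactly a sigmoid with doubled slope, (tanh(a) + 1)/2 = sigmoid(2a), so both stay in (0, 1) and the cross-entropy in self.L remains well defined. Second, because self.z is a symbolic Theano expression, the Python `if` guards above run once at graph-construction time and cannot clip values element-wise at run time; an element-wise clip (T.clip in Theano, numpy.clip below) is the usual way to keep log() away from 0. A minimal numpy sketch of both points (not part of the changeset):

# Sketch only: the tanh-rescaling identity and an element-wise log(0) guard.
import numpy

def sigmoid(a):
    return 1.0 / (1.0 + numpy.exp(-a))

a = numpy.linspace(-5.0, 5.0, 11)

# (tanh(a) + 1) / 2 is a sigmoid with doubled slope: sigmoid(2 * a).
assert numpy.allclose((numpy.tanh(a) + 1.0) / 2.0, sigmoid(2.0 * a))

# Element-wise clipping keeps the reconstruction strictly inside (0, 1)
# before the cross-entropy is computed, so log(z) and log(1 - z) are finite.
z = sigmoid(2.0 * a)
z = numpy.clip(z, 0.000001, 0.999999)
assert (z > 0.0).all() and (z < 1.0).all()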