# HG changeset patch
# User Olivier Delalleau <delallea@iro>
# Date 1243266337 14400
# Node ID 573e3370d0fa7c415a9f62fe708e4b75b4b8de0e
# Parent  88f5b75a4afe38707c10313e9b3e0f4760e3d7ab# Parent  fb9fb142098fe2b264f17e44343cf81ca6dbf5bf
Merged

diff -r 88f5b75a4afe -r 573e3370d0fa pylearn/algorithms/sandbox/DAA_inputs_groups.py
--- a/pylearn/algorithms/sandbox/DAA_inputs_groups.py	Mon May 25 11:43:50 2009 -0400
+++ b/pylearn/algorithms/sandbox/DAA_inputs_groups.py	Mon May 25 11:45:37 2009 -0400
@@ -101,17 +101,17 @@
             self.input_missing_mask = None
         self.noisy_input = None
         self.auxinput = auxinput
-        self.idx_list = T.ivector('idx_list') if not(self.auxinput is None) else None
+        self.idx_list = T.ivector('idx_list') if self.auxinput is not None else None
         self.noisy_idx_list, self.noisy_auxinput = None, None
         
         #parameters
         self.benc = T.dvector('benc')
-        if not(self.input is None):
+        if self.input is not None:
             self.wenc = T.dmatrix('wenc')
             self.wdec = self.wenc.T if tie_weights else T.dmatrix('wdec')
             self.bdec = T.dvector('bdec')
         
-        if not(self.auxinput is None):
+        if self.auxinput is not None:
             self.wauxenc = [T.dmatrix('wauxenc%s'%i) for i in range(len(auxin_size))]
             self.wauxdec = [self.wauxenc[i].T if tie_weights else T.dmatrix('wauxdec%s'%i) for i in range(len(auxin_size))]
             self.bauxdec = [T.dvector('bauxdec%s'%i) for i in range(len(auxin_size))]
@@ -129,9 +129,9 @@
     
     ### BEHAVIOURAL MODEL
     def init_behavioural(self):
-        if not(self.input is None):
+        if self.input is not None:
             self.noisy_input = self.corrupt_input()
-        if not(self.auxinput is None):
+        if self.auxinput is not None:
             self.noisy_idx_list , self.noisy_auxinput = \
                 scannoise(self.idx_list,self.auxinput,self.noise_level,self.noise_level_group)
         
@@ -157,8 +157,7 @@
         
     def define_propup(self, container, input, idx_list, auxinput):
         if self.input is not None:
-            container.hidden_activation = self.filter_up(input, self.wenc,
-                    self.benc)
+            container.hidden_activation = self.filter_up(input, self.wenc, self.benc)
             if self.auxinput is not None:
                 container.hidden_activation += scandotenc(idx_list,auxinput,self.wauxenc)
         else:
@@ -167,16 +166,16 @@
         
     # DEPENDENCY: define_propup
     def define_propdown(self, container, idx_list, auxinput):
-        if not(self.input is None):
+        if self.input is not None:
             rec_activation1 = self.filter_down(container.hidden,self.wdec,self.bdec)
-        if not(self.auxinput is None):
+        if self.auxinput is not None:
             rec_activation2 = scandotdec(idx_list,auxinput,container.hidden,self.wauxdec) +\
                     scanbiasdec(idx_list,auxinput,self.bauxdec)
         
-        if not(self.input is None) and not(auxinput is None):
+        if (self.input is not None) and (self.auxinput is not None):
             container.rec_activation = T.join(1,rec_activation1,rec_activation2)
         else:
-            if not(self.input is None):
+            if self.input is not None:
                 container.rec_activation = rec_activation1
             else:
                 container.rec_activation = rec_activation2
@@ -189,19 +188,19 @@
     # TODO: fix regularization type (outside parameter ?)
     def define_regularization(self):
         self.reg_coef = T.scalar('reg_coef')
-        if not(self.auxinput is None):
+        if self.auxinput is not None:
             self.Maskup = scanmaskenc(self.idx_list,self.wauxenc)
             self.Maskdown = scanmaskdec(self.idx_list,self.wauxdec)
-            if not(type(self.Maskup) is list):
+            if type(self.Maskup) is not list:
                 self.Maskup = [self.Maskup]
-            if not(type(self.Maskdown) is list):
+            if type(self.Maskdown) is not list:
                 self.Maskdown = [self.Maskdown]
         listweights = []
         listweightsenc = []
-        if not(self.auxinput is None):
+        if self.auxinput is not None:
             listweights += [w*m for w,m in zip(self.Maskup,self.wauxenc)] + [w*m for w,m in zip(self.Maskdown,self.wauxdec)]
             listweightsenc += [w*m for w,m in zip(self.Maskup,self.wauxenc)]
-        if not(self.input is None):
+        if self.input is not None:
             listweights += [self.wenc,self.wdec]
             listweightsenc += [self.wenc]
         self.regularization = self.reg_coef * get_reg_cost(listweights,'l2')
@@ -222,16 +221,16 @@
             self.params = []
         self.params += [self.benc]
         self.paramsenc = copy.copy(self.params)
-        if not(self.input is None):
+        if self.input is not None:
             self.params += [self.wenc] + [self.bdec]
             self.paramsenc += [self.wenc]
-        if not(self.auxinput is None):
+        if self.auxinput is not None:
             self.params += self.wauxenc + self.bauxdec
             self.paramsenc += self.wauxenc
         if not(self.tie_weights):
-            if not(self.input is None):
+            if self.input is not None:
                 self.params += [self.wdec]
-            if not(self.auxinput is None):
+            if self.auxinput is not None:
                 self.params += self.wauxdec
     
     # DEPENDENCY: define_cost, define_gradients
@@ -248,13 +247,13 @@
             listin = [self.idx_list, self.auxinput]
         if self.auxinput is None:
             listin = [self.input]
-        if not((self.input is None) or (self.auxinput is None)):
+        if (self.input is not None) and (self.auxinput is not None):
             listin =[self.input,self.idx_list, self.auxinput]
         self.update = theano.Method(listin, self.noise.cost, self.updates)
         self.compute_cost = theano.Method(listin, self.noise.cost)
-        if not(self.input is None):
+        if self.input is not None:
             self.noisify = theano.Method(listin, self.noisy_input)
-        if not(self.auxinput is None):
+        if self.auxinput is not None:
             self.auxnoisify = theano.Method(listin, self.noisy_auxinput)
         self.reconstruction = theano.Method(listin, self.clean.rec)
         self.representation = theano.Method(listin, self.clean.hidden)
@@ -276,12 +275,12 @@
             rec = (rec * T.neq(self.input_missing_mask, zero) +
                     (zero - 1e100) * T.eq(self.input_missing_mask, zero))
             
-        if self.input is None:
+        if (self.input is not None) and (self.auxinput is not None):
+            return self.reconstruction_cost_function(T.join(1,self.input,scaninputs(self.idx_list,self.auxinput)), rec)
+        if self.input is not None:
+            return self.reconstruction_cost_function(self.input, rec)
+        if self.auxinput is not None:
             return self.reconstruction_cost_function(scaninputs(self.idx_list,self.auxinput), rec)
-        if self.auxinput is None:
-            return self.reconstruction_cost_function(self.input, rec)
-        if not((self.input is None) or (self.auxinput is None)):
-            return self.reconstruction_cost_function(T.join(1,self.input,scaninputs(self.idx_list,self.auxinput)), rec)
         # All cases should be covered above. If not, something is wrong!
         assert False
     
@@ -304,35 +303,35 @@
         
         obj.__hide__ = ['params']
         
-        if not(self.input is None):
+        if self.input is not None:
             self.inf = 1/numpy.sqrt(self.in_size)
-        if not(self.auxinput is None):
+        if self.auxinput is not None:
             self.inf = 1/numpy.sqrt(sum(self.auxin_size))
-        if not(self.auxinput is None or self.input is None):
+        if (self.auxinput is not None) and (self.input is not None):
             self.inf = 1/numpy.sqrt(sum(self.auxin_size)+self.in_size)
         self.hif = 1/numpy.sqrt(self.n_hid)
         
         
         if alloc:
-            if not(self.input is None):
+            if self.input is not None:
                 wencshp = (self.in_size, self.n_hid)
                 wdecshp = tuple(reversed(wencshp))
                 print 'wencshp = ', wencshp
                 print 'wdecshp = ', wdecshp
                 
                 obj.wenc = self.R.uniform(size=wencshp, low = -self.inf, high = self.inf)
-                if not self.tie_weights:
+                if not(self.tie_weights):
                     obj.wdec = self.R.uniform(size=wdecshp, low=-self.hif, high=self.hif)
                 obj.bdec = numpy.zeros(self.in_size)
             
-            if not(self.auxinput is None):
+            if self.auxinput is not None:
                 wauxencshp = [(i, self.n_hid) for i in self.auxin_size]
                 wauxdecshp = [tuple(reversed(i)) for i in wauxencshp]
                 print 'wauxencshp = ', wauxencshp
                 print 'wauxdecshp = ', wauxdecshp
                 
                 obj.wauxenc = [self.R.uniform(size=i, low = -self.inf, high = self.inf) for i in wauxencshp]
-                if not self.tie_weights:
+                if not(self.tie_weights):
                     obj.wauxdec = [self.R.uniform(size=i, low=-self.hif, high=self.hif) for i in wauxdecshp]
                 obj.bauxdec = [numpy.zeros(i) for i in self.auxin_size]
             
@@ -371,7 +370,7 @@
         self.hid_fn = hid_fn
         self.reconstruction_cost_function = reconstruction_cost_function
         self.n_out = n_out
-        self.target = target if not(target is None) else T.lvector('target')
+        self.target = target if target is not None else T.lvector('target')
         self.debugmethod = debugmethod
         self.totalupdatebool = totalupdatebool
         
@@ -423,7 +422,7 @@
         paramsenc = []
         self.inputs = [None] * (self.depth+1)
         
-        if not(self.input is None):
+        if self.input is not None:
             self.inputs[0] = [self.input]
         else:
             self.inputs[0] = []
@@ -445,13 +444,13 @@
             # method input, outputs and parameters update
             if i:
                 self.inputs[i] = copy.copy(self.inputs[i-1])
-            if not(auxin_size[i] is None):
+            if auxin_size[i] is not None:
                 self.inputs[i] += [self.daaig[i].idx_list,self.auxinput[i-offset]]
             
             noisyout = []
-            if not(inputprec is None):
+            if inputprec is not None:
                 noisyout += [self.daaig[i].noisy_input]
-            if not(auxin_size[i] is None):
+            if auxin_size[i] is not None:
                 noisyout += [self.daaig[i].noisy_auxinput]
             
             paramstot += self.daaig[i].params
diff -r 88f5b75a4afe -r 573e3370d0fa pylearn/sandbox/nips09stopper.py
--- a/pylearn/sandbox/nips09stopper.py	Mon May 25 11:43:50 2009 -0400
+++ b/pylearn/sandbox/nips09stopper.py	Mon May 25 11:45:37 2009 -0400
@@ -32,14 +32,17 @@
     def find_min(self, step, check, save):
         best = None
         while not self.stop:
-            self.iter++
+            self.iter += 1
             step()
             if (self.iter % self.set_score_interval == 0):
                 self.train_score, self.valid_score = check()
-                if (self.valid_score < self.best_valid) and save:
-                    self.best_valid = self.valid_score
-                    self.best_valid_iter = self.iter
-                    best = (save(), self.iter, self.valid_score)
+                if save:
+                    if (self.valid_score < self.best_valid):
+                        self.best_valid = self.valid_score
+                        self.best_valid_iter = self.iter
+                        best = [save(), self.iter, self.valid_score, self.iter]
+                    else:
+                        best[3] = self.iter
 
             if self.iter >= self.n_iter_max:
                 self.stop = True
diff -r 88f5b75a4afe -r 573e3370d0fa pylearn/sandbox/scan_inputs_groups.py
--- a/pylearn/sandbox/scan_inputs_groups.py	Mon May 25 11:43:50 2009 -0400
+++ b/pylearn/sandbox/scan_inputs_groups.py	Mon May 25 11:45:37 2009 -0400
@@ -11,16 +11,16 @@
 # (numpy array), each element will correspond to an available modality and the index list will indicate the weights
 # associated to it).
 # Exemple of index list: [1, 0, -3]
-#	*the 1 says that the first element of the input list will refer to the first element of the weights_list
-#		(auxiliary target as input)
-#								if inputslist[i]>0 it refers to Weightslist[indexlist[i]-1]
-#	*the 0 means that the second element of the input list will not be encoded neither decoded (it is remplaced by zeros)
-#		this is not efficient, so in this case it is better to give: [1,-3] and [inputslist[0],inputslist[2]]
-#		but it allows us to deal with empty lists: give indexlist = numpy.asarray([.0])
-#		and inputlist=numpy.zeros((batchsize,1))
-#	*when an index is negative it means that the input will not be used for encoding but we will still reconstruct it
-#		(auxiliary target as output)
-#								if inputslist[i]<0 it refers to Weightslist[-indexlist[i]-1]
+#    *the 1 says that the first element of the input list will refer to the first element of the weights_list
+#        (auxiliary target as input)
+#                                if inputslist[i]>0 it refers to Weightslist[indexlist[i]-1]
+#    *the 0 means that the second element of the input list will not be encoded neither decoded (it is remplaced by zeros)
+#        this is not efficient, so in this case it is better to give: [1,-3] and [inputslist[0],inputslist[2]]
+#        but it allows us to deal with empty lists: give indexlist = numpy.asarray([.0])
+#        and inputlist=numpy.zeros((batchsize,1))
+#    *when an index is negative it means that the input will not be used for encoding but we will still reconstruct it
+#        (auxiliary target as output)
+#                                if inputslist[i]<0 it refers to Weightslist[-indexlist[i]-1]
 #
 # An entire batch should have the same available inputs configuration.
 #
@@ -46,517 +46,517 @@
 
 # Checking inputs in make_node methods----------------------
 def Checkidx_list(idx_list):
-	idx_list = T.as_tensor_variable(idx_list)
-	nidx = idx_list.type.ndim
-	if nidx != 1: raise TypeError('not vector', idx_list)
-	return idx_list
+    idx_list = T.as_tensor_variable(idx_list)
+    nidx = idx_list.type.ndim
+    if nidx != 1: raise TypeError('not vector', idx_list)
+    return idx_list
 
 def Checkhidd(hidd):
-	hidd = T.as_tensor_variable(hidd)
-	nhidd = hidd.type.ndim
-	if nhidd not in (1,2): raise TypeError('not matrix or vector', hidd)
-	return hidd
+    hidd = T.as_tensor_variable(hidd)
+    nhidd = hidd.type.ndim
+    if nhidd not in (1,2): raise TypeError('not matrix or vector', hidd)
+    return hidd
 
 def Checkweights_list(weights_list):
-	weights_list = map(T.as_tensor_variable, weights_list)
-	for i in range(len(weights_list)):
-		nweights = weights_list[i].type.ndim
-		if nweights not in (1,2): raise TypeError('not matrix or vector', weights_list[i])
-	return weights_list
+    weights_list = map(T.as_tensor_variable, weights_list)
+    for i in range(len(weights_list)):
+        nweights = weights_list[i].type.ndim
+        if nweights not in (1,2): raise TypeError('not matrix or vector', weights_list[i])
+    return weights_list
 
 def Checkbias_list(bias_list):
-	bias_list = map(T.as_tensor_variable, bias_list)
-	for i in range(len(bias_list)):
-		nbias = bias_list[i].type.ndim
-		if nbias != 1: raise TypeError('not vector', bias_list[i])
-	return bias_list
+    bias_list = map(T.as_tensor_variable, bias_list)
+    for i in range(len(bias_list)):
+        nbias = bias_list[i].type.ndim
+        if nbias != 1: raise TypeError('not vector', bias_list[i])
+    return bias_list
 
 # Encoding scan dot product------------------------------------
 class ScanDotEnc(Op):
-	"""This Op takes an index list (as tensor.ivector), a list of matrices representing
-	the available inputs (as theano.generic), and all the encoding weights tensor.dmatrix of the model. It will select the
-	weights corresponding to the inputs (according to index list) and compute only the necessary dot products"""
-	def __init__(self):
-		#Create Theano methods to do the dot products with blas or at least in C.
-		self.M=theano.Module()
-		inputs = T.dmatrix('input')
-		weights = T.dmatrix('weights')
-		self.M.hid = T.dmatrix('hid')
-		self.M.resultin = self.M.hid + T.dot(inputs,weights)
-		result = T.dot(inputs,weights)
-		
-		self.M.dotin = theano.Method([inputs,weights],None,{self.M.hid : self.M.resultin})
-		self.M.dot = theano.Method([inputs,weights],result)
-		self.m = self.M.make()
-	
-	def make_node(self, idx_list, inputs_list, weights_list):
-		idx_list = Checkidx_list(idx_list)
-		weights_list = Checkweights_list(weights_list)
-		return Apply(self, [idx_list] + [inputs_list] + weights_list, [T.dmatrix()])
-	
-	def perform(self, node, args, (hid,)):
-		idx_list = args[0]
-		hidcalc = False
-		
-		batchsize = (args[1][0].shape)[0]
-		n_hid = (args[2].shape)[1]
-		if len(idx_list) != len(args[1]) :
-			raise NotImplementedError('size of index different of inputs list size',idx_list)
-		if max(idx_list) >= (len(args)-2)+1 :
-			raise NotImplementedError('index superior to weight list length',idx_list)
-		for i in range(len(args[1])):
-			if (args[1][i].shape)[0] != batchsize:
-				raise NotImplementedError('different batchsize in the inputs list',args[1][i].shape)
-		for i in range(len(args)-2):
-			if (args[2+i].shape)[1] != n_hid:
-				raise NotImplementedError('different length of hidden in the weights list',args[2+i].shape)
-		
-		for i in range(len(idx_list)):
-			if idx_list[i]>0:
-				if hidcalc:
-					self.m.dotin(args[1][i],args[2+int(idx_list[i]-1)])
-				else:
-					self.m.hid = self.m.dot(args[1][i],args[2+int(idx_list[i]-1)])
-					hidcalc = True
-		
-		if not hidcalc:
-			hid[0] = numpy.zeros([batchsize,n_hid])
-		else:
-			hid[0] = self.m.hid
-		
-	
-	def grad(self, args, gz):
-		gradi = ScanDotEncGrad()(args,gz)
-		if type(gradi) != list:
-			return [None, None] + [gradi]
-		else:
-			return [None, None] + gradi
-	
-	def __hash__(self):
-		return hash(ScanDotEnc)^58994
-	
-	def __str__(self):
-		return "ScanDotEnc"
+    """This Op takes an index list (as tensor.ivector), a list of matrices representing
+    the available inputs (as theano.generic), and all the encoding weights tensor.dmatrix of the model. It will select the
+    weights corresponding to the inputs (according to index list) and compute only the necessary dot products"""
+    def __init__(self):
+        #Create Theano methods to do the dot products with blas or at least in C.
+        self.M=theano.Module()
+        inputs = T.dmatrix('input')
+        weights = T.dmatrix('weights')
+        self.M.hid = T.dmatrix('hid')
+        self.M.resultin = self.M.hid + T.dot(inputs,weights)
+        result = T.dot(inputs,weights)
+    
+        self.M.dotin = theano.Method([inputs,weights],None,{self.M.hid : self.M.resultin})
+        self.M.dot = theano.Method([inputs,weights],result)
+        self.m = self.M.make()
+    
+    def make_node(self, idx_list, inputs_list, weights_list):
+        idx_list = Checkidx_list(idx_list)
+        weights_list = Checkweights_list(weights_list)
+        return Apply(self, [idx_list] + [inputs_list] + weights_list, [T.dmatrix()])
+    
+    def perform(self, node, args, (hid,)):
+        idx_list = args[0]
+        hidcalc = False
+    
+        batchsize = (args[1][0].shape)[0]
+        n_hid = (args[2].shape)[1]
+        if len(idx_list) != len(args[1]) :
+            raise NotImplementedError('size of index different of inputs list size',idx_list)
+        if max(idx_list) >= (len(args)-2)+1 :
+            raise NotImplementedError('index superior to weight list length',idx_list)
+        for i in range(len(args[1])):
+            if (args[1][i].shape)[0] != batchsize:
+                raise NotImplementedError('different batchsize in the inputs list',args[1][i].shape)
+        for i in range(len(args)-2):
+            if (args[2+i].shape)[1] != n_hid:
+                raise NotImplementedError('different length of hidden in the weights list',args[2+i].shape)
+    
+        for i in range(len(idx_list)):
+            if idx_list[i]>0:
+                if hidcalc:
+                    self.m.dotin(args[1][i],args[2+int(idx_list[i]-1)])
+                else:
+                    self.m.hid = self.m.dot(args[1][i],args[2+int(idx_list[i]-1)])
+                    hidcalc = True
+    
+        if not hidcalc:
+            hid[0] = numpy.zeros([batchsize,n_hid])
+        else:
+            hid[0] = self.m.hid
+    
+    
+    def grad(self, args, gz):
+        gradi = ScanDotEncGrad()(args,gz)
+        if type(gradi) != list:
+            return [None, None] + [gradi]
+        else:
+            return [None, None] + gradi
+    
+    def __hash__(self):
+        return hash(ScanDotEnc)^58994
+    
+    def __str__(self):
+        return "ScanDotEnc"
 
 scandotenc=ScanDotEnc()
 
 class ScanDotEncGrad(Op):
-	"""This Op computes the gradient wrt the weights for ScanDotEnc"""
-	def __init__(self):
-		#Create Theano methods to do the dot products with blas or at least in C.
-		self.M=theano.Module()
-		input1 = T.dmatrix('input1')
-		self.M.g_out = T.dmatrix('g_out')
-		result = T.dmatrix('result')
-		input2=T.transpose(input1)
-		self.M.resultin = result + T.dot(input2,self.M.g_out)
-		self.M.result = T.dot(input2,self.M.g_out)
-		
-		self.M.dotin = theano.Method([input1,result],self.M.resultin)
-		self.M.dot = theano.Method([input1],self.M.result)
-		self.m = self.M.make()
-	
-	def make_node(self, args, g_out):
-		idx_list = Checkidx_list(args[0])
-		weights_list = Checkweights_list(args[2:])
-		return Apply(self, args + g_out, [T.dmatrix() for i in xrange(2,len(args))])
-	
-	def perform(self, node, args, z):
-		idx_list = args[0]
-		self.m.g_out = args[-1]
-		
-		batchsize = (args[1][0].shape)[0]
-		n_hid = (args[2].shape)[1]
-		if len(idx_list) != len(args[1]) :
-			raise NotImplementedError('size of index different of inputs list size',idx_list)
-		if max(idx_list) >= (len(args)-3)+1 :
-			raise NotImplementedError('index superior to weight list length',idx_list)
-		for i in range(len(args[1])):
-			if (args[1][i].shape)[0] != batchsize:
-				raise NotImplementedError('different batchsize in the inputs list',args[1][i].shape)
-		for i in range(len(args)-3):
-			if (args[2+i].shape)[1] != n_hid:
-				raise NotImplementedError('different length of hidden in the weights list',args[2+i].shape)
-		
-		zcalc = [False for i in range(len(args)-3)]
-		
-		for i in range(len(idx_list)):
-			if idx_list[i]>0:
-				if zcalc[int(idx_list[i]-1)]:
-					z[int(idx_list[i]-1)][0] = self.m.dotin(args[1][i],z[int(idx_list[i]-1)][0])
-				else:
-					z[int(idx_list[i]-1)][0] = self.m.dot(args[1][i])
-					zcalc[int(idx_list[i]-1)] = True
-		
-		for i in range(len(args)-3):
-			if not zcalc[i]:
-				shp = args[2+i].shape
-				z[i][0] = numpy.zeros(shp)
-		
-	def __hash__(self):
-		return hash(ScanDotEncGrad)^15684
-		
-	def __str__(self):
-		return "ScanDotEncGrad"
+    """This Op computes the gradient wrt the weights for ScanDotEnc"""
+    def __init__(self):
+        #Create Theano methods to do the dot products with blas or at least in C.
+        self.M=theano.Module()
+        input1 = T.dmatrix('input1')
+        self.M.g_out = T.dmatrix('g_out')
+        result = T.dmatrix('result')
+        input2=T.transpose(input1)
+        self.M.resultin = result + T.dot(input2,self.M.g_out)
+        self.M.result = T.dot(input2,self.M.g_out)
+    
+        self.M.dotin = theano.Method([input1,result],self.M.resultin)
+        self.M.dot = theano.Method([input1],self.M.result)
+        self.m = self.M.make()
+    
+    def make_node(self, args, g_out):
+        idx_list = Checkidx_list(args[0])
+        weights_list = Checkweights_list(args[2:])
+        return Apply(self, args + g_out, [T.dmatrix() for i in xrange(2,len(args))])
+    
+    def perform(self, node, args, z):
+        idx_list = args[0]
+        self.m.g_out = args[-1]
+    
+        batchsize = (args[1][0].shape)[0]
+        n_hid = (args[2].shape)[1]
+        if len(idx_list) != len(args[1]) :
+            raise NotImplementedError('size of index different of inputs list size',idx_list)
+        if max(idx_list) >= (len(args)-3)+1 :
+            raise NotImplementedError('index superior to weight list length',idx_list)
+        for i in range(len(args[1])):
+            if (args[1][i].shape)[0] != batchsize:
+                raise NotImplementedError('different batchsize in the inputs list',args[1][i].shape)
+        for i in range(len(args)-3):
+            if (args[2+i].shape)[1] != n_hid:
+                raise NotImplementedError('different length of hidden in the weights list',args[2+i].shape)
+    
+        zcalc = [False for i in range(len(args)-3)]
+    
+        for i in range(len(idx_list)):
+            if idx_list[i]>0:
+                if zcalc[int(idx_list[i]-1)]:
+                    z[int(idx_list[i]-1)][0] = self.m.dotin(args[1][i],z[int(idx_list[i]-1)][0])
+                else:
+                    z[int(idx_list[i]-1)][0] = self.m.dot(args[1][i])
+                    zcalc[int(idx_list[i]-1)] = True
+    
+        for i in range(len(args)-3):
+            if not zcalc[i]:
+                shp = args[2+i].shape
+                z[i][0] = numpy.zeros(shp)
+    
+    def __hash__(self):
+        return hash(ScanDotEncGrad)^15684
+    
+    def __str__(self):
+        return "ScanDotEncGrad"
 
 # Decoding scan dot product------------------------------------
 class ScanDotDec(Op):
-	"""This Op takes an index list (as tensor.ivector), a list of matrices representing
-	the available inputs (as theano.generic), the hidden layer of the DAA (theano.dmatrix)
-	and all the decoding weights tensor.dmatrix of the model. It will select the
-	weights corresponding to the available inputs (according to index list) and compute
-	only the necessary dot products. The outputs will be concatenated and will represent
-	the reconstruction of the different modality in the same order than the index list"""
-	def __init__(self):
-		#Create Theano methods to do the dot products with blas or at least in C.
-		self.M=theano.Module()
-		weights = T.dmatrix('weights')
-		self.M.hid = T.dmatrix('hid')
-		oldval = T.dmatrix('oldval')
-		resultin = oldval + T.dot(self.M.hid,weights)
-		result = T.dot(self.M.hid,weights)
-		
-		self.M.dotin = theano.Method([weights,oldval],resultin)
-		self.M.dot = theano.Method([weights],result)
-		self.m = self.M.make()
-	
-	def make_node(self, idx_list, input_list, hidd, weights_list):
-		idx_list = Checkidx_list(idx_list)
-		hidd = Checkhidd(hidd)
-		weights_list = Checkweights_list(weights_list)
-		return Apply(self, [idx_list] + [input_list] +[hidd] + weights_list,[T.dmatrix()])
-	
-	def perform(self, node, args, (z,)):
-		
-		idx_list = abs(args[0])
-		self.m.hid = args[2]
-		
-		batchsize = (self.m.hid.shape)[0]
-		n_hid = self.m.hid.shape[1]
-		if max(idx_list) >= len(args)-3+1 :
-			raise NotImplementedError('index superior to weight list length',idx_list)
-		if len(idx_list) != len(args[1]) :
-			raise NotImplementedError('size of index different of inputs list size',idx_list)
-		for i in range(len(args)-3):
-			if (args[3+i].shape)[0] != n_hid:
-				raise NotImplementedError('different length of hidden in the weights list',args[3+i].shape)
-		
-		zcalc = [False for i in idx_list]
-		z[0] = [None for i in idx_list]
-		
-		for i in range(len(idx_list)):
-			if idx_list[i]>0:
-				if zcalc[i]:
-					z[0][i] = self.m.dotin(args[3+int(idx_list[i]-1)],z[0][i])
-				else:
-					z[0][i] = self.m.dot(args[3+int(idx_list[i]-1)])
-					zcalc[i] = True
-		
-		for i in range(len(idx_list)):
-			if not zcalc[i]:
-				shp = args[1][int(idx_list[i]-1)].shape
-				z[0][i] = numpy.zeros((batchsize,shp[1]))
-		
-		z[0] = numpy.concatenate(z[0],1)
-		
-	def grad(self, args, gz):
-		gradi = ScanDotDecGrad()(args,gz)
-		if type(gradi) != list:
-			return [None, None] + [gradi]
-		else:
-			return [None, None] + gradi
-	
-	def __hash__(self):
-		return hash(ScanDotDec)^73568
-	
-	def __str__(self):
-		return "ScanDotDec"
+    """This Op takes an index list (as tensor.ivector), a list of matrices representing
+    the available inputs (as theano.generic), the hidden layer of the DAA (theano.dmatrix)
+    and all the decoding weights tensor.dmatrix of the model. It will select the
+    weights corresponding to the available inputs (according to index list) and compute
+    only the necessary dot products. The outputs will be concatenated and will represent
+    the reconstruction of the different modality in the same order than the index list"""
+    def __init__(self):
+        #Create Theano methods to do the dot products with blas or at least in C.
+        self.M=theano.Module()
+        weights = T.dmatrix('weights')
+        self.M.hid = T.dmatrix('hid')
+        oldval = T.dmatrix('oldval')
+        resultin = oldval + T.dot(self.M.hid,weights)
+        result = T.dot(self.M.hid,weights)
+    
+        self.M.dotin = theano.Method([weights,oldval],resultin)
+        self.M.dot = theano.Method([weights],result)
+        self.m = self.M.make()
+    
+    def make_node(self, idx_list, input_list, hidd, weights_list):
+        idx_list = Checkidx_list(idx_list)
+        hidd = Checkhidd(hidd)
+        weights_list = Checkweights_list(weights_list)
+        return Apply(self, [idx_list] + [input_list] +[hidd] + weights_list,[T.dmatrix()])
+    
+    def perform(self, node, args, (z,)):
+    
+        idx_list = abs(args[0])
+        self.m.hid = args[2]
+    
+        batchsize = (self.m.hid.shape)[0]
+        n_hid = self.m.hid.shape[1]
+        if max(idx_list) >= len(args)-3+1 :
+            raise NotImplementedError('index superior to weight list length',idx_list)
+        if len(idx_list) != len(args[1]) :
+            raise NotImplementedError('size of index different of inputs list size',idx_list)
+        for i in range(len(args)-3):
+            if (args[3+i].shape)[0] != n_hid:
+                raise NotImplementedError('different length of hidden in the weights list',args[3+i].shape)
+    
+        zcalc = [False for i in idx_list]
+        z[0] = [None for i in idx_list]
+    
+        for i in range(len(idx_list)):
+            if idx_list[i]>0:
+                if zcalc[i]:
+                    z[0][i] = self.m.dotin(args[3+int(idx_list[i]-1)],z[0][i])
+                else:
+                    z[0][i] = self.m.dot(args[3+int(idx_list[i]-1)])
+                    zcalc[i] = True
+    
+        for i in range(len(idx_list)):
+            if not zcalc[i]:
+                shp = args[1][int(idx_list[i]-1)].shape
+                z[0][i] = numpy.zeros((batchsize,shp[1]))
+    
+        z[0] = numpy.concatenate(z[0],1)
+    
+    def grad(self, args, gz):
+        gradi = ScanDotDecGrad()(args,gz)
+        if type(gradi) != list:
+            return [None, None] + [gradi]
+        else:
+            return [None, None] + gradi
+    
+    def __hash__(self):
+        return hash(ScanDotDec)^73568
+    
+    def __str__(self):
+        return "ScanDotDec"
 
 scandotdec=ScanDotDec()
 
 class ScanDotDecGrad(Op):
-	"""This Op computes the gradient wrt the weights for ScanDotDec"""
-	def __init__(self):
-		self.M=theano.Module()
-		gout = T.dmatrix('gout')
-		self.M.hidt = T.dmatrix('hid')
-		oldval = T.dmatrix('oldval')
-		resultin1 = oldval + T.dot(self.M.hidt,gout)
-		result1 = T.dot(self.M.hidt,gout)
-		weights = T.dmatrix('weights')
-		weights2 = T.transpose(weights)
-		resultin2 = oldval + T.dot(gout,weights2)
-		result2 = T.dot(gout,weights2)
-		
-		self.M.dotin1 = theano.Method([gout,oldval],resultin1)
-		self.M.dot1 = theano.Method([gout],result1)
-		self.M.dotin2 = theano.Method([gout,weights,oldval],resultin2)
-		self.M.dot2 = theano.Method([gout,weights],result2)
-		self.m = self.M.make()
-	
-	
-	def make_node(self, args, g_out):
-		idx_list = Checkidx_list(args[0])
-		hidd = Checkhidd(args[2])
-		weights_list = Checkweights_list(args[3:])
-		return Apply(self, args + g_out, [T.dmatrix() for i in xrange(2,len(args))])
-	
-	def perform(self, node, args, z):
-		idx_list = abs(args[0])
-		self.m.hidt = args[2].T
-		
-		batchsize = (self.m.hidt.shape)[1]
-		n_hid = self.m.hidt.shape[0]
-		if max(idx_list) >= len(args)-4+1 :
-			raise NotImplementedError('index superior to weight list length',idx_list)
-		if len(idx_list) != len(args[1]) :
-			raise NotImplementedError('size of index different of inputs list size',idx_list)
-		for i in range(len(args)-4):
-			if (args[3+i].shape)[0] != n_hid:
-				raise NotImplementedError('different length of hidden in the weights list',args[3+i].shape)
-		
-		zidx=numpy.zeros((len(idx_list)+1))
-		
-		for i in range(len(idx_list)):
-			if idx_list[i] == 0:
-				zidx[i+1] = (args[1][i].shape)[1]
-			else:
-				zidx[i+1] = (args[3+idx_list[i]-1].shape)[1]
-		
-		zidx=zidx.cumsum()
-		hidcalc = False
-		zcalc = [False for i in range((len(args)-4))]
-		
-		for i in range(len(idx_list)):
-			if idx_list[i]>0:
-				if zcalc[int(idx_list[i])-1]:
-					z[int(idx_list[i])][0] = self.m.dotin1(args[-1][:,zidx[i]:zidx[i+1]],z[int(idx_list[i])][0])
-				else:
-					z[int(idx_list[i])][0] = self.m.dot1(args[-1][:,zidx[i]:zidx[i+1]])
-					zcalc[int(idx_list[i])-1] = True
-				if hidcalc:
-					z[0][0] = self.m.dotin2(args[-1][:,zidx[i]:zidx[i+1]],args[3+int(idx_list[i]-1)],z[0][0])
-				else:
-					z[0][0] = self.m.dot2(args[-1][:,zidx[i]:zidx[i+1]],args[3+int(idx_list[i]-1)])
-					hidcalc = True
-		
-		if not hidcalc:
-			z[0][0] = numpy.zeros((self.m.hidt.shape[1],self.m.hidt.shape[0]))
-		
-		for i in range((len(args)-4)):
-			if not zcalc[i]:
-				shp = args[3+i].shape
-				z[i+1][0] = numpy.zeros(shp)
-		
-		
-	def __hash__(self):
-		return hash(ScanDotDecGrad)^87445
-	
-	def __str__(self):
-		return "ScanDotDecGrad"
+    """This Op computes the gradient wrt the weights for ScanDotDec"""
+    def __init__(self):
+        self.M=theano.Module()
+        gout = T.dmatrix('gout')
+        self.M.hidt = T.dmatrix('hid')
+        oldval = T.dmatrix('oldval')
+        resultin1 = oldval + T.dot(self.M.hidt,gout)
+        result1 = T.dot(self.M.hidt,gout)
+        weights = T.dmatrix('weights')
+        weights2 = T.transpose(weights)
+        resultin2 = oldval + T.dot(gout,weights2)
+        result2 = T.dot(gout,weights2)
+    
+        self.M.dotin1 = theano.Method([gout,oldval],resultin1)
+        self.M.dot1 = theano.Method([gout],result1)
+        self.M.dotin2 = theano.Method([gout,weights,oldval],resultin2)
+        self.M.dot2 = theano.Method([gout,weights],result2)
+        self.m = self.M.make()
+    
+    
+    def make_node(self, args, g_out):
+        idx_list = Checkidx_list(args[0])
+        hidd = Checkhidd(args[2])
+        weights_list = Checkweights_list(args[3:])
+        return Apply(self, args + g_out, [T.dmatrix() for i in xrange(2,len(args))])
+    
+    def perform(self, node, args, z):
+        idx_list = abs(args[0])
+        self.m.hidt = args[2].T
+    
+        batchsize = (self.m.hidt.shape)[1]
+        n_hid = self.m.hidt.shape[0]
+        if max(idx_list) >= len(args)-4+1 :
+            raise NotImplementedError('index superior to weight list length',idx_list)
+        if len(idx_list) != len(args[1]) :
+            raise NotImplementedError('size of index different of inputs list size',idx_list)
+        for i in range(len(args)-4):
+            if (args[3+i].shape)[0] != n_hid:
+                raise NotImplementedError('different length of hidden in the weights list',args[3+i].shape)
+    
+        zidx=numpy.zeros((len(idx_list)+1))
+    
+        for i in range(len(idx_list)):
+            if idx_list[i] == 0:
+                zidx[i+1] = (args[1][i].shape)[1]
+            else:
+                zidx[i+1] = (args[3+idx_list[i]-1].shape)[1]
+    
+        zidx=zidx.cumsum()
+        hidcalc = False
+        zcalc = [False for i in range((len(args)-4))]
+    
+        for i in range(len(idx_list)):
+            if idx_list[i]>0:
+                if zcalc[int(idx_list[i])-1]:
+                    z[int(idx_list[i])][0] = self.m.dotin1(args[-1][:,zidx[i]:zidx[i+1]],z[int(idx_list[i])][0])
+                else:
+                    z[int(idx_list[i])][0] = self.m.dot1(args[-1][:,zidx[i]:zidx[i+1]])
+                    zcalc[int(idx_list[i])-1] = True
+                if hidcalc:
+                    z[0][0] = self.m.dotin2(args[-1][:,zidx[i]:zidx[i+1]],args[3+int(idx_list[i]-1)],z[0][0])
+                else:
+                    z[0][0] = self.m.dot2(args[-1][:,zidx[i]:zidx[i+1]],args[3+int(idx_list[i]-1)])
+                    hidcalc = True
+    
+        if not hidcalc:
+            z[0][0] = numpy.zeros((self.m.hidt.shape[1],self.m.hidt.shape[0]))
+    
+        for i in range((len(args)-4)):
+            if not zcalc[i]:
+                shp = args[3+i].shape
+                z[i+1][0] = numpy.zeros(shp)
+    
+    
+    def __hash__(self):
+        return hash(ScanDotDecGrad)^87445
+    
+    def __str__(self):
+        return "ScanDotDecGrad"
 
 # DAA input noise------------------------------------
 class ScanNoise(Op):
-	"""This Op takes an index list (as tensor.ivector), a list of matrices representing
-	the available inputs (as theano.generic), a probability of individual bit masking and
-	a probability of modality masking. It will return the inputs list with randoms zeros entry
-	and the index list with some positive values changed to negative values (groups masking)"""
-	def __init__(self, seed = 1):
-		self.M=theano.Module()
-		self.M.rand = T.RandomStreams(seed)
-		self.seed = seed
-		mat = T.matrix('mat')
-		noise_level_bit = T.dscalar('noise_level_bit')
-		noise_level_group = T.dscalar('noise_level_group')
-		self.M.out1 = self.M.rand.binomial(T.shape(mat), 1, 1 - noise_level_bit) * mat
-		self.M.out2 = self.M.rand.binomial((1,1), 1, 1 - noise_level_group)
-		
-		self.M.noisify_bit = theano.Method([mat,noise_level_bit],self.M.out1)
-		self.M.noisify_group_bool = theano.Method([noise_level_group],self.M.out2)
-		self.R = self.M.make()
-		self.R.rand.initialize()
-	
-	def make_node(self, idx_list, inputs_list, noise_level_bit, noise_level_group):
-		idx_list = Checkidx_list(idx_list)
-		return Apply(self, [idx_list] + [inputs_list] + [noise_level_bit] + [noise_level_group],\
-				[T.ivector(), theano.generic()])
-	
-	def perform(self, node, (idx_list,inputs_list,noise_level_bit,noise_level_group), (y,z)):
-		
-		if len(idx_list) != len(inputs_list) :
-			raise NotImplementedError('size of index different of inputs list size',idx_list)
-		
-		y[0] = numpy.asarray([-i if (i>0 and not(self.R.noisify_group_bool(noise_level_group))) else i for i in idx_list])
-		z[0] = [(self.R.noisify_bit(inputs_list[i],noise_level_bit) if y[0][i]>0 else numpy.zeros((inputs_list[i].shape)))\
-				for i in range(len(inputs_list))]
-	
-	def grad(self,args,gz):
-		return [None,None,None,None]
-	
-	
-	def __hash__(self):
-		return hash(ScanNoise)^hash(self.seed)^hash(self.R.rand)^12254
-	
-	def __str__(self):
-		return "ScanNoise"
+    """This Op takes an index list (as tensor.ivector), a list of matrices representing
+    the available inputs (as theano.generic), a probability of individual bit masking and
+    a probability of modality masking. It will return the inputs list with randoms zeros entry
+    and the index list with some positive values changed to negative values (groups masking)"""
+    def __init__(self, seed = 1):
+        self.M=theano.Module()
+        self.M.rand = T.RandomStreams(seed)
+        self.seed = seed
+        mat = T.matrix('mat')
+        noise_level_bit = T.dscalar('noise_level_bit')
+        noise_level_group = T.dscalar('noise_level_group')
+        self.M.out1 = self.M.rand.binomial(T.shape(mat), 1, 1 - noise_level_bit) * mat
+        self.M.out2 = self.M.rand.binomial((1,1), 1, 1 - noise_level_group)
+    
+        self.M.noisify_bit = theano.Method([mat,noise_level_bit],self.M.out1)
+        self.M.noisify_group_bool = theano.Method([noise_level_group],self.M.out2)
+        self.R = self.M.make()
+        self.R.rand.initialize()
+    
+    def make_node(self, idx_list, inputs_list, noise_level_bit, noise_level_group):
+        idx_list = Checkidx_list(idx_list)
+        return Apply(self, [idx_list] + [inputs_list] + [noise_level_bit] + [noise_level_group],\
+                [T.ivector(), theano.generic()])
+    
+    def perform(self, node, (idx_list,inputs_list,noise_level_bit,noise_level_group), (y,z)):
+    
+        if len(idx_list) != len(inputs_list) :
+            raise NotImplementedError('size of index different of inputs list size',idx_list)
+    
+        y[0] = numpy.asarray([-i if (i>0 and not(self.R.noisify_group_bool(noise_level_group))) else i for i in idx_list])
+        z[0] = [(self.R.noisify_bit(inputs_list[i],noise_level_bit) if y[0][i]>0 else numpy.zeros((inputs_list[i].shape)))\
+                for i in range(len(inputs_list))]
+    
+    def grad(self,args,gz):
+        return [None,None,None,None]
+    
+    
+    def __hash__(self):
+        return hash(ScanNoise)^hash(self.seed)^hash(self.R.rand)^12254
+    
+    def __str__(self):
+        return "ScanNoise"
 
 scannoise=ScanNoise()
 
 # Total input matrix construction------------------------------------
 class ScanInputs(Op):
-	"""This Op takes an index list (as tensor.ivector) and a list of matrices representing
-	the available inputs (as theano.generic). It will construct the appropriate tensor.dmatrix
-	to compare to the reconstruction obtained with ScanDotDec"""
-	def make_node(self, idx_list, inputs_list):
-		idx_list = Checkidx_list(idx_list)
-		return Apply(self, [idx_list] + [inputs_list],[T.dmatrix()])
-	
-	def perform(self, node, (idx_list, inputs_list), (z,)):
-		
-		if len(idx_list) != len(inputs_list):
-			raise NotImplementedError('size of index different of inputs list size',idx_list)
-		
-		for i in range(len(idx_list)):
-			if idx_list[i] == 0:
-				inputs_list[i] = 0 * inputs_list[i]
-		
-		z[0] = numpy.concatenate(inputs_list,1)
-	
-	def grad(self,args,gz):
-		return [None,None]
-	
-	def __hash__(self):
-		return hash(ScanInputs)^75902
-	
-	def __str__(self):
-		return "ScanInputs"
+    """This Op takes an index list (as tensor.ivector) and a list of matrices representing
+    the available inputs (as theano.generic). It will construct the appropriate tensor.dmatrix
+    to compare to the reconstruction obtained with ScanDotDec"""
+    def make_node(self, idx_list, inputs_list):
+        idx_list = Checkidx_list(idx_list)
+        return Apply(self, [idx_list] + [inputs_list],[T.dmatrix()])
+    
+    def perform(self, node, (idx_list, inputs_list), (z,)):
+    
+        if len(idx_list) != len(inputs_list):
+            raise NotImplementedError('size of index different of inputs list size',idx_list)
+    
+        for i in range(len(idx_list)):
+            if idx_list[i] == 0:
+                inputs_list[i] = 0 * inputs_list[i]
+    
+        z[0] = numpy.concatenate(inputs_list,1)
+    
+    def grad(self,args,gz):
+        return [None,None]
+    
+    def __hash__(self):
+        return hash(ScanInputs)^75902
+    
+    def __str__(self):
+        return "ScanInputs"
 
 scaninputs=ScanInputs()
 
 # Decoding bias vector construction------------------------------------
 class ScanBiasDec(Op):
-	"""This Op takes an index list (as tensor.ivector), a list of matrices representing
-	the available inputs (as theano.generic) and the decoding bias tensor.dvector.
-	It will construct the appropriate bias tensor.dvector
-	to add to the reconstruction obtained with ScanDotDec"""
-	def make_node(self, idx_list, input_list, bias_list):
-		idx_list = Checkidx_list(idx_list)
-		bias_list = Checkbias_list(bias_list)
-		return Apply(self, [idx_list] + [input_list] + bias_list, [T.dvector()])
-	
-	def perform(self, node, args, (z,)):
-		idx_list = abs(args[0])
-		
-		if max(idx_list) >= (len(args)-2)+1 :
-			raise NotImplementedError('index superior to bias list length',idx_list)
-		if len(idx_list) != len(args[1]) :
-			raise NotImplementedError('size of index different of inputs list size',idx_list)
-		z[0] = [args[idx_list[i]+1] if idx_list[i] != 0 else numpy.zeros(args[1][i].shape[1]) \
-				for i in range(len(idx_list))]
-		z[0] = numpy.concatenate(z[0],1)
-	
-	def __hash__(self):
-		return hash(ScanBiasDec)^60056
-	
-	def grad(self,args,gz):
-		gradi = ScanBiasDecGrad()(args,gz)
-		if type(gradi) != list:
-			return [None, None] + [gradi]
-		else:
-			return [None, None] + gradi
-	
-	def __str__(self):
-		return "ScanBiasDec"
+    """This Op takes an index list (as tensor.ivector), a list of matrices representing
+    the available inputs (as theano.generic) and the decoding bias tensor.dvector.
+    It will construct the appropriate bias tensor.dvector
+    to add to the reconstruction obtained with ScanDotDec"""
+    def make_node(self, idx_list, input_list, bias_list):
+        idx_list = Checkidx_list(idx_list)
+        bias_list = Checkbias_list(bias_list)
+        return Apply(self, [idx_list] + [input_list] + bias_list, [T.dvector()])
+    
+    def perform(self, node, args, (z,)):
+        idx_list = abs(args[0])
+    
+        if max(idx_list) >= (len(args)-2)+1 :
+            raise NotImplementedError('index superior to bias list length',idx_list)
+        if len(idx_list) != len(args[1]) :
+            raise NotImplementedError('size of index different of inputs list size',idx_list)
+        z[0] = [args[idx_list[i]+1] if idx_list[i] != 0 else numpy.zeros(args[1][i].shape[1]) \
+                for i in range(len(idx_list))]
+        z[0] = numpy.concatenate(z[0],1)
+    
+    def __hash__(self):
+        return hash(ScanBiasDec)^60056
+    
+    def grad(self,args,gz):
+        gradi = ScanBiasDecGrad()(args,gz)
+        if type(gradi) != list:
+            return [None, None] + [gradi]
+        else:
+            return [None, None] + gradi
+    
+    def __str__(self):
+        return "ScanBiasDec"
 
 scanbiasdec=ScanBiasDec()
 
 class ScanBiasDecGrad(Op):
-	"""This Op computes the gradient wrt the bias for ScanBiasDec"""
-	def make_node(self, args, g_out):
-		idx_list = Checkidx_list(args[0])
-		bias_list = Checkbias_list(args[2:])
-		return Apply(self, args + g_out, [T.dvector() for i in range(len(args)-2)])
-	
-	def perform(self, node, args, z):
-		idx_list = abs(args[0])
-		
-		if max(idx_list) >= (len(args)-3)+1 :
-			raise NotImplementedError('index superior to bias list length',idx_list)
-		if len(idx_list) != len(args[1]) :
-			raise NotImplementedError('size of index different of inputs list size',idx_list)
-		
-		zidx=numpy.zeros((len(idx_list)+1))
-		for i in range(len(idx_list)):
-			if idx_list[i] == 0:
-				zidx[i+1] = (args[1][i].shape)[1]
-			else:
-				zidx[i+1] = (args[2+idx_list[i]-1].size)
-		zidx=zidx.cumsum()
-		zcalc = [False for i in range((len(args)-3))]
-		
-		for i in range(len(idx_list)):
-			if idx_list[i]>0:
-				if zcalc[int(idx_list[i])-1]:
-					z[int(idx_list[i])-1][0] += args[-1][zidx[i]:zidx[i+1]]
-				else:
-					z[int(idx_list[i])-1][0] = args[-1][zidx[i]:zidx[i+1]]
-					zcalc[int(idx_list[i])-1] = True
-		
-		for i in range((len(args)-3)):
-			if not zcalc[i]:
-				shp = args[2+i].size
-				z[i][0] = numpy.zeros(shp)
-		
-	
-	def __hash__(self):
-		return hash(ScanBiasDecGrad)^41256
-	
-	def __str__(self):
-		return "ScanBiasDecGrad"
+    """This Op computes the gradient wrt the bias for ScanBiasDec"""
+    def make_node(self, args, g_out):
+        idx_list = Checkidx_list(args[0])
+        bias_list = Checkbias_list(args[2:])
+        return Apply(self, args + g_out, [T.dvector() for i in range(len(args)-2)])
+    
+    def perform(self, node, args, z):
+        idx_list = abs(args[0])
+    
+        if max(idx_list) >= (len(args)-3)+1 :
+            raise NotImplementedError('index superior to bias list length',idx_list)
+        if len(idx_list) != len(args[1]) :
+            raise NotImplementedError('size of index different of inputs list size',idx_list)
+    
+        zidx=numpy.zeros((len(idx_list)+1))
+        for i in range(len(idx_list)):
+            if idx_list[i] == 0:
+                zidx[i+1] = (args[1][i].shape)[1]
+            else:
+                zidx[i+1] = (args[2+idx_list[i]-1].size)
+        zidx=zidx.cumsum()
+        zcalc = [False for i in range((len(args)-3))]
+    
+        for i in range(len(idx_list)):
+            if idx_list[i]>0:
+                if zcalc[int(idx_list[i])-1]:
+                    z[int(idx_list[i])-1][0] += args[-1][zidx[i]:zidx[i+1]]
+                else:
+                    z[int(idx_list[i])-1][0] = args[-1][zidx[i]:zidx[i+1]]
+                    zcalc[int(idx_list[i])-1] = True
+    
+        for i in range((len(args)-3)):
+            if not zcalc[i]:
+                shp = args[2+i].size
+                z[i][0] = numpy.zeros(shp)
+    
+    
+    def __hash__(self):
+        return hash(ScanBiasDecGrad)^41256
+    
+    def __str__(self):
+        return "ScanBiasDecGrad"
 
 # Mask construction------------------------------------
 class ScanMask(Op):
-	"""This Op takes an index list (as tensor.ivector) and a list of weigths.
-	It will construct a list of T.iscalar representing the Mask
-	to do the correct regularisation on the weigths"""
-	def __init__(self,encbool=True):
-		self.encbool = encbool
-	
-	def make_node(self, idx_list, weights_list):
-		idx_list = Checkidx_list(idx_list)
-		weights_list = Checkweights_list(weights_list)
-		return Apply(self, [idx_list] + weights_list, [T.iscalar() for i in range(len(weights_list))])
-	
-	def perform(self, node, args, z):
-		if self.encbool:
-			idx_list = args[0]
-			dim = 1
-		else:
-			idx_list = abs(args[0])
-			dim = 0
-		n_hid = args[1].shape[dim]
+    """This Op takes an index list (as tensor.ivector) and a list of weigths.
+    It will construct a list of T.iscalar representing the Mask
+    to do the correct regularisation on the weigths"""
+    def __init__(self,encbool=True):
+        self.encbool = encbool
+    
+    def make_node(self, idx_list, weights_list):
+        idx_list = Checkidx_list(idx_list)
+        weights_list = Checkweights_list(weights_list)
+        return Apply(self, [idx_list] + weights_list, [T.iscalar() for i in range(len(weights_list))])
+    
+    def perform(self, node, args, z):
+        if self.encbool:
+            idx_list = args[0]
+            dim = 1
+        else:
+            idx_list = abs(args[0])
+            dim = 0
+        n_hid = args[1].shape[dim]
 
-		if max(idx_list) >= (len(args)-1)+1 :
-			raise NotImplementedError('index superior to weights list length',idx_listdec)
-		for i in range(len(args)-1):
-			if args[1+i].shape[dim] != n_hid:
-				raise NotImplementedError('different length of hidden in the encoding weights list',args[1+i].shape)
-		
-		for i in range(len(args[1:])):
-			z[i][0] = numpy.asarray((idx_list == i+1).sum(),dtype='int32')
-	
-	def __hash__(self):
-		return hash(ScanMask)^hash(self.encbool)^11447
-	
-	def grad(self,args,gz):
-		return [None] * len(args)
-	
-	def __str__(self):
-		if self.encbool:
-			string = "Enc"
-		else:
-			string = "Dec"
-		return "ScanMask" + string
+        if max(idx_list) >= (len(args)-1)+1 :
+            raise NotImplementedError('index superior to weights list length',idx_listdec)
+        for i in range(len(args)-1):
+            if args[1+i].shape[dim] != n_hid:
+                raise NotImplementedError('different length of hidden in the encoding weights list',args[1+i].shape)
+    
+        for i in range(len(args[1:])):
+            z[i][0] = numpy.asarray((idx_list == i+1).sum(),dtype='int32')
+    
+    def __hash__(self):
+        return hash(ScanMask)^hash(self.encbool)^11447
+    
+    def grad(self,args,gz):
+        return [None] * len(args)
+    
+    def __str__(self):
+        if self.encbool:
+            string = "Enc"
+        else:
+            string = "Dec"
+        return "ScanMask" + string
 
 scanmaskenc=ScanMask(True)
 scanmaskdec=ScanMask(False)