Mercurial > ift6266
comparison deep/stacked_dae/v2/stacked_dae.py @ 239:42005ec87747
Mergé (manuellement) les changements de Sylvain pour utiliser le code de dataset d'Arnaud, à cette différence près que je n'utilise pas les givens. J'ai probablement une approche différente pour limiter la taille du dataset dans mon débuggage, aussi.
author | fsavard |
---|---|
date | Mon, 15 Mar 2010 18:30:21 -0400 |
parents | 02eb98d051fe |
children |
comparison
equal
deleted
inserted
replaced
238:9fc641d7adda | 239:42005ec87747 |
---|---|
163 | 163 |
164 self.params = [ self.W, self.b, self.b_prime ] | 164 self.params = [ self.W, self.b, self.b_prime ] |
165 | 165 |
166 | 166 |
167 class SdA(object): | 167 class SdA(object): |
168 def __init__(self, train_set_x, train_set_y, batch_size, n_ins, | 168 def __init__(self, batch_size, n_ins, |
169 hidden_layers_sizes, n_outs, | 169 hidden_layers_sizes, n_outs, |
170 corruption_levels, rng, pretrain_lr, finetune_lr, input_divider=1.0): | 170 corruption_levels, rng, pretrain_lr, finetune_lr): |
171 # Just to make sure those are not modified somewhere else afterwards | 171 # Just to make sure those are not modified somewhere else afterwards |
172 hidden_layers_sizes = copy.deepcopy(hidden_layers_sizes) | 172 hidden_layers_sizes = copy.deepcopy(hidden_layers_sizes) |
173 corruption_levels = copy.deepcopy(corruption_levels) | 173 corruption_levels = copy.deepcopy(corruption_levels) |
174 | 174 |
175 update_locals(self, locals()) | 175 update_locals(self, locals()) |
188 print "corruption_levels", corruption_levels | 188 print "corruption_levels", corruption_levels |
189 print "n_ins", n_ins | 189 print "n_ins", n_ins |
190 print "n_outs", n_outs | 190 print "n_outs", n_outs |
191 print "pretrain_lr", pretrain_lr | 191 print "pretrain_lr", pretrain_lr |
192 print "finetune_lr", finetune_lr | 192 print "finetune_lr", finetune_lr |
193 print "input_divider", input_divider | |
194 print "----" | 193 print "----" |
195 | |
196 self.shared_divider = theano.shared(numpy.asarray(input_divider, dtype=theano.config.floatX)) | |
197 | 194 |
198 if len(hidden_layers_sizes) < 1 : | 195 if len(hidden_layers_sizes) < 1 : |
199 raiseException (' You must have at least one hidden layer ') | 196 raiseException (' You must have at least one hidden layer ') |
200 | 197 |
201 | 198 |
202 # allocate symbolic variables for the data | 199 # allocate symbolic variables for the data |
203 index = T.lscalar() # index to a [mini]batch | 200 #index = T.lscalar() # index to a [mini]batch |
204 self.x = T.matrix('x') # the data is presented as rasterized images | 201 self.x = T.matrix('x') # the data is presented as rasterized images |
205 self.y = T.ivector('y') # the labels are presented as 1D vector of | 202 self.y = T.ivector('y') # the labels are presented as 1D vector of |
206 # [int] labels | 203 # [int] labels |
207 | 204 |
208 for i in xrange( self.n_layers ): | 205 for i in xrange( self.n_layers ): |
245 updates = {} | 242 updates = {} |
246 for param, gparam in zip(dA_layer.params, gparams): | 243 for param, gparam in zip(dA_layer.params, gparams): |
247 updates[param] = param - gparam * pretrain_lr | 244 updates[param] = param - gparam * pretrain_lr |
248 | 245 |
249 # create a function that trains the dA | 246 # create a function that trains the dA |
250 update_fn = theano.function([index], dA_layer.cost, \ | 247 update_fn = theano.function([self.x], dA_layer.cost, \ |
251 updates = updates, | 248 updates = updates)#, |
252 givens = { | 249 # givens = { |
253 self.x : train_set_x[index*batch_size:(index+1)*batch_size] / self.shared_divider}) | 250 # self.x : ensemble}) |
251 # collect this function into a list | |
252 #update_fn = theano.function([index], dA_layer.cost, \ | |
253 # updates = updates, | |
254 # givens = { | |
255 # self.x : train_set_x[index*batch_size:(index+1)*batch_size] / self.shared_divider}) | |
254 # collect this function into a list | 256 # collect this function into a list |
255 self.pretrain_functions += [update_fn] | 257 self.pretrain_functions += [update_fn] |
256 | 258 |
257 | 259 |
258 # We now need to add a logistic layer on top of the MLP | 260 # We now need to add a logistic layer on top of the MLP |
271 # compute list of updates | 273 # compute list of updates |
272 updates = {} | 274 updates = {} |
273 for param,gparam in zip(self.params, gparams): | 275 for param,gparam in zip(self.params, gparams): |
274 updates[param] = param - gparam*finetune_lr | 276 updates[param] = param - gparam*finetune_lr |
275 | 277 |
276 self.finetune = theano.function([index], cost, | 278 self.finetune = theano.function([self.x,self.y], cost, |
277 updates = updates, | 279 updates = updates)#, |
278 givens = { | 280 # givens = { |
279 self.x : train_set_x[index*batch_size:(index+1)*batch_size]/self.shared_divider, | 281 # self.x : train_set_x[index*batch_size:(index+1)*batch_size]/self.shared_divider, |
280 self.y : train_set_y[index*batch_size:(index+1)*batch_size]} ) | 282 # self.y : train_set_y[index*batch_size:(index+1)*batch_size]} ) |
281 | 283 |
282 # symbolic variable that points to the number of errors made on the | 284 # symbolic variable that points to the number of errors made on the |
283 # minibatch given by self.x and self.y | 285 # minibatch given by self.x and self.y |
284 | 286 |
285 self.errors = self.logLayer.errors(self.y) | 287 self.errors = self.logLayer.errors(self.y) |