ift6266: comparison deep/stacked_dae/v_sylvain/sgd_optimization.py @ 238:9fc641d7adda
Allow restricting the size of the training, validation, and test sets so the code can be tested quickly (a standalone sketch of the pattern follows the diff).
| author | SylvainPL <sylvain.pannetier.lebeuf@umontreal.ca> |
|---|---|
| date | Mon, 15 Mar 2010 13:22:20 -0400 |
| parents | ecb69e17950b |
| children | 7dd43ef66d15 |
| 237:9b6e0af062af | 238:9fc641d7adda |
|---|---|
106 | 106 |
107 def train(self): | 107 def train(self): |
108 self.pretrain(self.dataset) | 108 self.pretrain(self.dataset) |
109 self.finetune(self.dataset) | 109 self.finetune(self.dataset) |
110 | 110 |
111 def pretrain(self,dataset): | 111 def pretrain(self,dataset,reduce): |
112 print "STARTING PRETRAINING, time = ", datetime.datetime.now() | 112 print "STARTING PRETRAINING, time = ", datetime.datetime.now() |
113 sys.stdout.flush() | 113 sys.stdout.flush() |
114 | 114 |
115 start_time = time.clock() | 115 start_time = time.clock() |
116 ## Pre-train layer-wise | 116 ## Pre-train layer-wise |
118 # go through pretraining epochs | 118 # go through pretraining epochs |
119 for epoch in xrange(self.hp.pretraining_epochs_per_layer): | 119 for epoch in xrange(self.hp.pretraining_epochs_per_layer): |
120 # go through the training set | 120 # go through the training set |
121 batch_index=int(0) | 121 batch_index=int(0) |
122 for x,y in dataset.train(self.hp.minibatch_size): | 122 for x,y in dataset.train(self.hp.minibatch_size): |
| 123 batch_index+=1 |
| 124 if batch_index > reduce: # If the maximum number of mini-batches is reached |
| 125 break |
123 c = self.classifier.pretrain_functions[i](x) | 126 c = self.classifier.pretrain_functions[i](x) |
124 batch_index+=1 | 127 |
125 | 128 |
126 self.series["reconstruction_error"].append((epoch, batch_index), c) | 129 self.series["reconstruction_error"].append((epoch, batch_index), c) |
127 | 130 |
128 print 'Pre-training layer %i, epoch %d, cost '%(i,epoch),c | 131 print 'Pre-training layer %i, epoch %d, cost '%(i,epoch),c |
129 sys.stdout.flush() | 132 sys.stdout.flush() |
135 print ('Pretraining took %f minutes' %((end_time-start_time)/60.)) | 138 print ('Pretraining took %f minutes' %((end_time-start_time)/60.)) |
136 self.hp.update({'pretraining_time': end_time-start_time}) | 139 self.hp.update({'pretraining_time': end_time-start_time}) |
137 | 140 |
138 sys.stdout.flush() | 141 sys.stdout.flush() |
139 | 142 |
140 def finetune(self,dataset): | 143 def finetune(self,dataset,reduce): |
141 print "STARTING FINETUNING, time = ", datetime.datetime.now() | 144 print "STARTING FINETUNING, time = ", datetime.datetime.now() |
142 | 145 |
143 #index = T.lscalar() # index to a [mini]batch | 146 #index = T.lscalar() # index to a [mini]batch |
144 minibatch_size = self.hp.minibatch_size | 147 minibatch_size = self.hp.minibatch_size |
145 ensemble_x = T.matrix('ensemble_x') | 148 ensemble_x = T.matrix('ensemble_x') |
183 done_looping = False | 186 done_looping = False |
184 epoch = 0 | 187 epoch = 0 |
185 | 188 |
186 while (epoch < self.hp.max_finetuning_epochs) and (not done_looping): | 189 while (epoch < self.hp.max_finetuning_epochs) and (not done_looping): |
187 epoch = epoch + 1 | 190 epoch = epoch + 1 |
188 minibatch_index=int(-1) | 191 minibatch_index=int(0) |
189 for x,y in dataset.train(minibatch_size): | 192 for x,y in dataset.train(minibatch_size): |
| 193 minibatch_index +=1 |
190 | 194 |
191 minibatch_index+=1 | 195 if minibatch_index > reduce: # If the maximum number of mini-batches is reached |
| 196 break |
| 197 |
192 cost_ij = self.classifier.finetune(x,y) | 198 cost_ij = self.classifier.finetune(x,y) |
193 iter = epoch * self.n_train_batches + minibatch_index | 199 iter = epoch * self.n_train_batches + minibatch_index |
194 | 200 |
195 self.series["training_error"].append((epoch, minibatch_index), cost_ij) | 201 self.series["training_error"].append((epoch, minibatch_index), cost_ij) |
196 | 202 |
197 if (iter+1) % validation_frequency == 0: | 203 if (iter+1) % validation_frequency == 0: |
198 | 204 |
199 validation_losses = [validate_model(x,y) for x,y in dataset.valid(minibatch_size)] | 205 #validation_losses = [validate_model(x,y) for x,y in dataset.valid(minibatch_size)] |
| 206 test_index=int(0) |
| 207 validation_losses=[] |
| 208 for x,y in dataset.valid(minibatch_size): |
| 209 test_index+=1 |
| 210 if test_index > reduce: |
| 211 break |
| 212 validation_losses.append(validate_model(x,y)) |
200 this_validation_loss = numpy.mean(validation_losses) | 213 this_validation_loss = numpy.mean(validation_losses) |
201 | 214 |
202 self.series["validation_error"].\ | 215 self.series["validation_error"].\ |
203 append((epoch, minibatch_index), this_validation_loss*100.) | 216 append((epoch, minibatch_index), this_validation_loss*100.) |
204 | 217 |
205 print('epoch %i, minibatch %i/%i, validation error %f %%' % \ | 218 print('epoch %i, minibatch %i, validation error %f %%' % \ |
206 (epoch, minibatch_index+1, self.n_train_batches, \ | 219 (epoch, minibatch_index, \ |
207 this_validation_loss*100.)) | 220 this_validation_loss*100.)) |
208 | 221 |
209 | 222 |
210 # if we got the best validation score until now | 223 # if we got the best validation score until now |
211 if this_validation_loss < best_validation_loss: | 224 if this_validation_loss < best_validation_loss: |
218 # save best validation score and iteration number | 231 # save best validation score and iteration number |
219 best_validation_loss = this_validation_loss | 232 best_validation_loss = this_validation_loss |
220 best_iter = iter | 233 best_iter = iter |
221 | 234 |
222 # test it on the test set | 235 # test it on the test set |
223 test_losses = [test_model(x,y) for x,y in dataset.test(minibatch_size)] | 236 #test_losses = [test_model(x,y) for x,y in dataset.test(minibatch_size)] |
| 237 test_losses=[] |
| 238 i=0 |
| 239 for x,y in dataset.test(minibatch_size): |
| 240 i+=1 |
| 241 if i > reduce: |
| 242 break |
| 243 test_losses.append(test_model(x,y)) |
224 test_score = numpy.mean(test_losses) | 244 test_score = numpy.mean(test_losses) |
225 | 245 |
226 self.series["test_error"].\ | 246 self.series["test_error"].\ |
227 append((epoch, minibatch_index), test_score*100.) | 247 append((epoch, minibatch_index), test_score*100.) |
228 | 248 |
229 print((' epoch %i, minibatch %i/%i, test error of best ' | 249 print((' epoch %i, minibatch %i, test error of best ' |
230 'model %f %%') % | 250 'model %f %%') % |
231 (epoch, minibatch_index+1, self.n_train_batches, | 251 (epoch, minibatch_index, |
232 test_score*100.)) | 252 test_score*100.)) |
233 | 253 |
234 sys.stdout.flush() | 254 sys.stdout.flush() |
235 | 255 |
236 self.series['params'].append((epoch,), self.classifier.all_params) | 256 self.series['params'].append((epoch,), self.classifier.all_params) |
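The changeset caps every data loop at `reduce` mini-batches by incrementing a counter and breaking, which makes quick smoke tests of the pipeline possible without touching the dataset itself. Below is a minimal standalone sketch of that pattern; the `capped` helper and the `max_minibatches` name are illustrative only (they are not in the repository), and note that the changeset's parameter name `reduce` shadows Python's builtin of the same name.

```python
import itertools

def capped(minibatches, max_minibatches):
    """Yield at most max_minibatches items from a minibatch iterator.

    Same effect as the counter-and-break pattern added in this
    changeset, expressed with itertools.islice.
    """
    return itertools.islice(minibatches, max_minibatches)

# Hypothetical usage, assuming dataset.train/valid/test iterators
# like those in sgd_optimization.py:
#
# for x, y in capped(dataset.train(minibatch_size), max_minibatches):
#     cost_ij = classifier.finetune(x, y)
#
# validation_losses = [validate_model(x, y) for x, y in
#                      capped(dataset.valid(minibatch_size), max_minibatches)]
```

Because the new code increments the counter before the `> reduce` test, each loop processes exactly `reduce` mini-batches per epoch; `islice` yields the same count with `max_minibatches = reduce`.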