# HG changeset patch # User Xavier Glorot # Date 1265759135 18000 # Node ID bf83682c827be33a9ce4a71cd8106aa597b5488d # Parent ab70fbca513c76d3a2447f0a7f96183e553dd7cd# Parent 1afa95285b9c3cd6071de35e4ddf3f1143bd24b8 merge diff -r ab70fbca513c -r bf83682c827b transformations/pipeline.py --- a/transformations/pipeline.py Tue Feb 09 18:31:24 2010 -0500 +++ b/transformations/pipeline.py Tue Feb 09 18:45:35 2010 -0500 @@ -192,12 +192,16 @@ self.train_data = open(nist_path, 'rb') self.train_labels = open(label_path, 'rb') self.dim = tuple(ft._read_header(self.train_data)[3]) + # in order to seek to the beginning of the file + self.train_data.close() + self.train_data = open(nist_path, 'rb') + def nist_supp_iterator(nist, prob_font, prob_captcha, num_img): subtensor = slice(0, num_img) img = ft.read(nist.train_data, subtensor).astype(numpy.float32)/255 labels = ft.read(nist.train_labels, subtensor) - + for i in xrange(num_img): r = numpy.random.rand() if r<= prob_font: