ift6266: transformations/pipeline.py comparison

comparison transformations/pipeline.py @ 108:a7cd8dd3221c

pipeline.py: placé les modules dans le bon ordre + store NIST en bytes plutôt qu'en float32 dans la RAM

author	boulanni <nicolas_boulanger@hotmail.com>
date	Mon, 15 Feb 2010 16:17:48 -0500
parents	95c491bb5662
children	9c45e0071b52

comparison

equal deleted inserted replaced

-:a9b87b68101d
+:a7cd8dd3221c
 if DEBUG_X:
 import pylab
 pylab.ion()
-#from add_background_image import AddBackground
-from affine_transform import AffineTransformation
 from PoivreSel import PoivreSel
 from thick import Thick
 from BruitGauss import BruitGauss
+from DistorsionGauss import DistorsionGauss
+from PermutPixel import PermutPixel
 from gimp_script import GIMP1
 from Rature import Rature
 from contrast import Contrast
-from Occlusion import Occlusion
 from local_elastic_distortions import LocalElasticDistorter
 from slant import Slant
+from Occlusion import Occlusion
+from add_background_image import AddBackground
+from affine_transform import AffineTransformation
 if DEBUG:
 from visualizer import Visualizer
 # Either put the visualizer in the MODULE_INSTANCES list
 # after each module you want to visualize, or in the
 # AFTER_EACH_MODULE_HOOK list (but not both, it's redundant)
 VISUALIZER = Visualizer(to_dir=DEBUG_OUTPUT_DIR,  on_screen=False)
-MODULE_INSTANCES = [Thick(),Slant(),GIMP1(),AffineTransformation(),LocalElasticDistorter(),Occlusion(),Rature(),Contrast()]
+###---------------------order of transformation module
+MODULE_INSTANCES = [Slant(),Thick(),AffineTransformation(),LocalElasticDistorter(),GIMP1(),Rature(),Occlusion(), PermutPixel(),DistorsionGauss(),AddBackground(), PoivreSel(), BruitGauss(), Contrast()]
 # These should have an "after_transform_callback(self, image)" method
 # (called after each call to transform_image in a module)
 AFTER_EACH_MODULE_HOOK = []
 if DEBUG:
 self.train_data.close()
 self.train_data = open(nist_path, 'rb')
 self.ocr_data = open(ocr_path, 'rb')
 self.ocr_labels = open(ocrlabel_path, 'rb')
+# this iterator loads everything into RAM
 def nist_supp_iterator(nist, prob_font, prob_captcha, prob_ocr, num_img):
-img = ft.read(nist.train_data).astype(numpy.float32)/255
+img = ft.read(nist.train_data)
 labels = ft.read(nist.train_labels)
 if prob_ocr:
-ocr_img = ft.read(nist.ocr_data).astype(numpy.float32)/255
+ocr_img = ft.read(nist.ocr_data)
 ocr_labels = ft.read(nist.ocr_labels)
 for i in xrange(num_img):
 r = numpy.random.rand()
 if r <= prob_font:
 pass #get font
 elif r <= prob_font + prob_captcha:
 pass #get captcha
 elif r <= prob_font + prob_captcha + prob_ocr:
 j = numpy.random.randint(len(ocr_labels))
-yield ocr_img[j], ocr_labels[j]
+yield ocr_img[j].astype(numpy.float32)/255, ocr_labels[j]
 else:
 j = numpy.random.randint(len(labels))
-yield img[j], labels[j]
+yield img[j].astype(numpy.float32)/255, labels[j]
 # Mostly for debugging, for the moment, just to see if we can
 # reload the images and parameters.
 def reload(output_file_path, params_output_file_path):

Mercurial > ift6266

comparison transformations/pipeline.py @ 108:a7cd8dd3221c