ift6266: transformations/pipeline.py comparison

comparison transformations/pipeline.py @ 156:6f3b866c0182

On peut maintenant launcher le pipeline avec un seed donné, résultats déterministes

author	boulanni <nicolas_boulanger@hotmail.com>
date	Wed, 24 Feb 2010 19:12:01 -0500
parents	4981c729149c
children

comparison

equal deleted inserted replaced

-:7640cb31cf1f
+:6f3b866c0182
 DEFAULT_NIST_PATH = '/data/lisa/data/ift6266h10/train_data.ft'
 DEFAULT_LABEL_PATH = '/data/lisa/data/ift6266h10/train_labels.ft'
 DEFAULT_OCR_PATH = '/data/lisa/data/ocr_breuel/filetensor/unlv-corrected-2010-02-01-shuffled.ft'
 DEFAULT_OCRLABEL_PATH = '/data/lisa/data/ocr_breuel/filetensor/unlv-corrected-2010-02-01-labels-shuffled.ft'
 ARGS_FILE = os.environ['PIPELINE_ARGS_TMPFILE']
+# PARSE COMMAND LINE ARGUMENTS
+def get_argv():
+with open(ARGS_FILE) as f:
+args = [l.rstrip() for l in f.readlines()]
+return args
+def usage():
+print '''
+Usage: run_pipeline.sh [-m ...] [-z ...] [-o ...] [-p ...]
+-m, --max-complexity: max complexity to generate for an image
+-z, --probability-zero: probability of using complexity=0 for an image
+-o, --output-file: full path to file to use for output of images
+-p, --params-output-file: path to file to output params to
+-x, --labels-output-file: path to file to output labels to
+-f, --data-file: path to filetensor (.ft) data file (NIST)
+-l, --label-file: path to filetensor (.ft) labels file (NIST labels)
+-c, --ocr-file: path to filetensor (.ft) data file (OCR)
+-d, --ocrlabel-file: path to filetensor (.ft) labels file (OCR labels)
+-a, --prob-font: probability of using a raw font image
+-b, --prob-captcha: probability of using a captcha image
+-g, --prob-ocr: probability of using an ocr image
+-y, --seed: the job seed
+'''
+try:
+opts, args = getopt.getopt(get_argv(), "rm:z:o:p:x:s:f:l:c:d:a:b:g:y:", ["reload","max-complexity=", "probability-zero=", "output-file=", "params-output-file=", "labels-output-file=",
+"stop-after=", "data-file=", "label-file=", "ocr-file=", "ocrlabel-file=", "prob-font=", "prob-captcha=", "prob-ocr=", "seed="])
+except getopt.GetoptError, err:
+# print help information and exit:
+print str(err) # will print something like "option -a not recognized"
+usage()
+pdb.gimp_quit(0)
+sys.exit(2)
+for o, a in opts:
+if o in ('-y','--seed'):
+random.seed(int(a))
+numpy.random.seed(int(a))
 if DEBUG_X:
 import pylab
 pylab.ion()
 from slant import Slant
 from Occlusion import Occlusion
 from add_background_image import AddBackground
 from affine_transform import AffineTransformation
 from ttf2jpg import ttf2jpg
-from pycaptcha.Facade import generateCaptcha
+from Facade import generateCaptcha
 if DEBUG:
 from visualizer import Visualizer
 # Either put the visualizer as in the MODULES_INSTANCES list
 # after each module you want to visualize, or in the
 ##############################################################################
 # MAIN
-def usage():
-print '''
-Usage: run_pipeline.sh [-m ...] [-z ...] [-o ...] [-p ...]
--m, --max-complexity: max complexity to generate for an image
--z, --probability-zero: probability of using complexity=0 for an image
--o, --output-file: full path to file to use for output of images
--p, --params-output-file: path to file to output params to
--x, --labels-output-file: path to file to output labels to
--f, --data-file: path to filetensor (.ft) data file (NIST)
--l, --label-file: path to filetensor (.ft) labels file (NIST labels)
--c, --ocr-file: path to filetensor (.ft) data file (OCR)
--d, --ocrlabel-file: path to filetensor (.ft) labels file (OCR labels)
--a, --prob-font: probability of using a raw font image
--b, --prob-captcha: probability of using a captcha image
--g, --prob-ocr: probability of using an ocr image
-'''
-# See run_pipeline.py
-def get_argv():
-with open(ARGS_FILE) as f:
-args = [l.rstrip() for l in f.readlines()]
-return args
 # Might be called locally or through dbidispatch. In all cases it should be
 # passed to the GIMP executable to be able to use GIMP filters.
 # Ex:
 def _main():
 prob_font = 0.0
 prob_captcha = 0.0
 prob_ocr = 0.0
 stop_after = None
 reload_mode = False
-try:
-opts, args = getopt.getopt(get_argv(), "rm:z:o:p:x:s:f:l:c:d:a:b:g:", ["reload","max-complexity=", "probability-zero=", "output-file=", "params-output-file=", "labels-output-file=",
-"stop-after=", "data-file=", "label-file=", "ocr-file=", "ocrlabel-file=", "prob-font=", "prob-captcha=", "prob-ocr="])
-except getopt.GetoptError, err:
-# print help information and exit:
-print str(err) # will print something like "option -a not recognized"
-usage()
-pdb.gimp_quit(0)
-sys.exit(2)
 for o, a in opts:
 if o in ('-m', '--max-complexity'):
 max_complexity = float(a)
 assert max_complexity >= 0.0 and max_complexity <= 1.0
 prob_font = float(a)
 elif o in ('-b', "--prob-captcha"):
 prob_captcha = float(a)
 elif o in ('-g', "--prob-ocr"):
 prob_ocr = float(a)
+elif o in ('-y', "--seed"):
+pass
 else:
 assert False, "unhandled option"
 if output_file_path == None or params_output_file_path == None or labels_output_file_path == None:
 print "Must specify the three output files."

Mercurial > ift6266

comparison transformations/pipeline.py @ 156:6f3b866c0182