Mercurial > pylearn
annotate pylearn/algorithms/tests/test_mcRBM.py @ 1507:2a6a6f16416c
fix import.
author | Frederic Bastien <nouiz@nouiz.org> |
---|---|
date | Mon, 12 Sep 2011 11:45:41 -0400 |
parents | 7c51c0355d86 |
children | b28e8730c948 |
rev | line source |
---|---|
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
1 import sys |
1507 | 2 |
3 import numpy | |
4 import theano | |
5 from theano import tensor | |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
6 |
1507 | 7 from pylearn.algorithms.mcRBM import mcRBM, mcRBMTrainer, mcRBM_withP, l2 |
8 #import pylearn.datasets.cifar10 | |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
9 import pylearn.dataset_ops.cifar10 |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
10 from pylearn.shared.layers.logreg import LogisticRegression |
1507 | 11 from pylearn.io import image_tiling |
12 import pylearn.dataset_ops.image_patches | |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
13 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
14 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
15 def _default_rbm_alloc(n_I, n_K=256, n_J=100): |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
16 return mcRBM.alloc(n_I, n_K, n_J) |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
17 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
18 def _default_trainer_alloc(rbm, train_batch, batchsize, l1_penalty, l1_penalty_start): |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
19 return mcRBMTrainer.alloc(rbm, train_batch, batchsize, l1_penalty=l1_penalty, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
20 l1_penalty_start=l1_penalty_start,persistent_chains=persistent_chains) |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
21 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
22 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
23 def test_reproduce_ranzato_hinton_2010(dataset='MAR', as_unittest=True, n_train_iters=5000, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
24 rbm_alloc=_default_rbm_alloc, trainer_alloc=_default_trainer_alloc, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
25 lr_per_example=.075, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
26 l1_penalty=1e-3, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
27 l1_penalty_start=1000, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
28 persistent_chains=True, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
29 ): |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
30 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
31 batchsize = 128 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
32 |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
33 if dataset == 'MAR': |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
34 n_vis=105 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
35 n_patches=10240 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
36 epoch_size=n_patches |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
37 elif dataset=='cifar10patches8x8': |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
38 R,C= 8,8 # the size of image patches |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
39 n_vis=96 # pca components |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
40 epoch_size=batchsize*500 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
41 n_patches=epoch_size*20 |
1286
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
42 elif dataset=='tinyimages_patches': |
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
43 R,C=8,8 |
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
44 n_vis=81 |
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
45 epoch_size=batchsize*500 |
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
46 n_patches=epoch_size*20 |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
47 else: |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
48 R,C= 16,16 # the size of image patches |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
49 n_vis=R*C |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
50 n_patches=100000 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
51 epoch_size=n_patches |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
52 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
53 def l2(X): |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
54 return numpy.sqrt((X**2).sum()) |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
55 |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
56 if dataset == 'MAR': |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
57 tile = pylearn.dataset_ops.image_patches.save_filters_of_ranzato_hinton_2010 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
58 elif dataset == 'cifar10patches8x8': |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
59 def tile(X, fname): |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
60 _img = pylearn.datasets.cifar10.tile_rasterized_examples( |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
61 pylearn.preprocessing.pca.pca_whiten_inverse( |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
62 pylearn.dataset_ops.cifar10.random_cifar_patches_pca( |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
63 n_vis, None, 'float32', n_patches, R, C,), |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
64 X), |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
65 img_shape=(R,C)) |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
66 image_tiling.save_tiled_raster_images(_img, fname) |
1286
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
67 elif dataset == 'tinyimages_patches': |
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
68 tile = pylearn.dataset_ops.tinyimages.save_filters |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
69 else: |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
70 def tile(X, fname): |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
71 _img = image_tiling.tile_raster_images(X, |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
72 img_shape=(R,C), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
73 min_dynamic_range=1e-2) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
74 image_tiling.save_tiled_raster_images(_img, fname) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
75 |
1507 | 76 batch_idx = tensor.iscalar() |
77 batch_range =batch_idx * batchsize + numpy.arange(batchsize) | |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
78 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
79 if dataset == 'MAR': |
1286
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
80 train_batch = pylearn.dataset_ops.image_patches.ranzato_hinton_2010_op(batch_range) |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
81 elif dataset == 'cifar10patches8x8': |
1286
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
82 train_batch = pylearn.dataset_ops.cifar10.cifar10_patches( |
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
83 batch_range, 'train', n_patches=n_patches, patch_size=(R,C), |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
84 pca_components=n_vis) |
1286
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
85 elif dataset == 'tinyimages_patches': |
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
86 train_batch = pylearn.dataset_ops.tinyimages.tinydataset_op(batch_range) |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
87 else: |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
88 train_batch = pylearn.dataset_ops.image_patches.image_patches( |
1507 | 89 s_idx = (batch_idx * batchsize + numpy.arange(batchsize)), |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
90 dims = (n_patches,R,C), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
91 center=True, |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
92 unitvar=True, |
1507 | 93 dtype=theano.config.floatX, |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
94 rasterized=True) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
95 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
96 if not as_unittest: |
1507 | 97 imgs_fn = theano.function([batch_idx], outputs=train_batch) |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
98 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
99 trainer = trainer_alloc( |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
100 rbm_alloc(n_I=n_vis), |
1267
075c193afd1b
refactoring mcRBM
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1000
diff
changeset
|
101 train_batch, |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
102 batchsize, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
103 initial_lr_per_example=lr_per_example, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
104 l1_penalty=l1_penalty, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
105 l1_penalty_start=l1_penalty_start, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
106 persistent_chains=persistent_chains) |
1267
075c193afd1b
refactoring mcRBM
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1000
diff
changeset
|
107 rbm=trainer.rbm |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
108 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
109 if persistent_chains: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
110 grads = trainer.contrastive_grads() |
1507 | 111 learn_fn = theano.function([batch_idx], |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
112 outputs=[grads[0].norm(2), grads[0].norm(2), grads[1].norm(2)], |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
113 updates=trainer.cd_updates()) |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
114 else: |
1507 | 115 learn_fn = theano.function([batch_idx], outputs=[], updates=trainer.cd_updates()) |
1267
075c193afd1b
refactoring mcRBM
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1000
diff
changeset
|
116 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
117 if persistent_chains: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
118 smplr = trainer.sampler |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
119 else: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
120 smplr = trainer._last_cd1_sampler |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
121 |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
122 if dataset == 'cifar10patches8x8': |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
123 cPickle.dump( |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
124 pylearn.dataset_ops.cifar10.random_cifar_patches_pca( |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
125 n_vis, None, 'float32', n_patches, R, C,), |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
126 open('test_mcRBM.pca.pkl','w')) |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
127 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
128 print "Learning..." |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
129 last_epoch = -1 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
130 for jj in xrange(n_train_iters): |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
131 epoch = jj*batchsize / epoch_size |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
132 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
133 print_jj = epoch != last_epoch |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
134 last_epoch = epoch |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
135 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
136 if as_unittest and epoch == 5: |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
137 U = rbm.U.value |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
138 W = rbm.W.value |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
139 def allclose(a,b): |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
140 return numpy.allclose(a,b,rtol=1.01,atol=1e-3) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
141 print "" |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
142 print "--------------" |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
143 print "assert allclose(l2(U), %f)"%l2(U) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
144 print "assert allclose(l2(W), %f)"%l2(W) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
145 print "assert allclose(U.min(), %f)"%U.min() |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
146 print "assert allclose(U.max(), %f)"%U.max() |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
147 print "assert allclose(W.min(),%f)"%W.min() |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
148 print "assert allclose(W.max(), %f)"%W.max() |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
149 print "--------------" |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
150 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
151 assert allclose(l2(U), 21.351664) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
152 assert allclose(l2(W), 6.275828) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
153 assert allclose(U.min(), -1.176703) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
154 assert allclose(U.max(), 0.859802) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
155 assert allclose(W.min(),-0.223128) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
156 assert allclose(W.max(), 0.227558 ) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
157 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
158 break |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
159 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
160 if print_jj: |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
161 if not as_unittest: |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
162 tile(imgs_fn(jj), "imgs_%06i.png"%jj) |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
163 if persistent_chains: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
164 tile(smplr.positions.value, "sample_%06i.png"%jj) |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
165 tile(rbm.U.value.T, "U_%06i.png"%jj) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
166 tile(rbm.W.value.T, "W_%06i.png"%jj) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
167 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
168 print 'saving samples', jj, 'epoch', jj/(epoch_size/batchsize) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
169 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
170 print 'l2(U)', l2(rbm.U.value), |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
171 print 'l2(W)', l2(rbm.W.value), |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
172 print 'l1_penalty', |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
173 try: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
174 print trainer.effective_l1_penalty.value |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
175 except: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
176 print trainer.effective_l1_penalty |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
177 |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
178 print 'U min max', rbm.U.value.min(), rbm.U.value.max(), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
179 print 'W min max', rbm.W.value.min(), rbm.W.value.max(), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
180 print 'a min max', rbm.a.value.min(), rbm.a.value.max(), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
181 print 'b min max', rbm.b.value.min(), rbm.b.value.max(), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
182 print 'c min max', rbm.c.value.min(), rbm.c.value.max() |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
183 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
184 if persistent_chains: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
185 print 'parts min', smplr.positions.value.min(), |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
186 print 'max',smplr.positions.value.max(), |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
187 print 'HMC step', smplr.stepsize.value, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
188 print 'arate', smplr.avg_acceptance_rate.value |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
189 |
1267
075c193afd1b
refactoring mcRBM
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1000
diff
changeset
|
190 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
191 l2_of_Ugrad = learn_fn(jj) |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
192 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
193 if persistent_chains and print_jj: |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
194 print 'l2(U_grad)', float(l2_of_Ugrad[0]), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
195 print 'l2(U_inc)', float(l2_of_Ugrad[1]), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
196 print 'l2(W_inc)', float(l2_of_Ugrad[2]), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
197 #print 'FE+', float(l2_of_Ugrad[2]), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
198 #print 'FE+[0]', float(l2_of_Ugrad[3]), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
199 #print 'FE+[1]', float(l2_of_Ugrad[4]), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
200 #print 'FE+[2]', float(l2_of_Ugrad[5]), |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
201 #print 'FE+[3]', float(l2_of_Ugrad[6]) |
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
202 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
203 if not as_unittest: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
204 if jj % 2000 == 0: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
205 print '' |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
206 print 'Saving rbm...' |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
207 cPickle.dump(rbm, open('mcRBM.rbm.%06i.pkl'%jj, 'w'), -1) |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
208 if persistent_chains: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
209 print 'Saving sampler...' |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
210 cPickle.dump(smplr, open('mcRBM.smplr.%06i.pkl'%jj, 'w'), -1) |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
211 |
1000
d4a14c6c36e0
mcRBM - post code-review #1 with Guillaume
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff
changeset
|
212 |
1273
7bb5dd98e671
mcRBM - added hack to main script to pickle final model and sampler
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1272
diff
changeset
|
213 if not as_unittest: |
7bb5dd98e671
mcRBM - added hack to main script to pickle final model and sampler
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1272
diff
changeset
|
214 return rbm, smplr |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
215 |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
216 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
217 def run_classif_experiment(checkpoint): |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
218 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
219 R,C=8,8 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
220 n_vis=74 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
221 # PRETRAIN |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
222 # |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
223 # extract 1 million 8x8 patches from TinyImages |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
224 # pre-process them the right way |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
225 # find 74 dims of PCA |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
226 # filter patches through PCA |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
227 whitened_patches, pca_dct = pylearn.dataset_ops.tinyimages.main(n_imgs=100000, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
228 max_components=n_vis, seed=234) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
229 # |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
230 # Set up mcRBM Trainer |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
231 # Initialize P using topological 3x3 overlapping patches thing |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
232 # start learning P matrix after 2 passes through dataset |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
233 # |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
234 rbm_filename = 'mcRBM.rbm.%06i.pkl'%46000 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
235 try: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
236 open(rbm_filename).close() |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
237 load_mcrbm = True |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
238 except: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
239 load_mcrbm = False |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
240 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
241 if load_mcrbm: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
242 print 'loading mcRBM from file', rbm_filename |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
243 rbm = cPickle.load(open(rbm_filename)) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
244 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
245 else: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
246 print "Training mcRBM" |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
247 batchsize=128 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
248 epoch_size=len(whitened_patches) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
249 tile = pylearn.dataset_ops.tinyimages.save_filters |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
250 train_batch = theano.tensor.matrix() |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
251 trainer = mcRBMTrainer.alloc_for_P( |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
252 rbm=mcRBM_withP.alloc_topo_P(n_I=n_vis, n_J=81), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
253 visible_batch=train_batch, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
254 batchsize=batchsize, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
255 initial_lr_per_example=0.05, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
256 l1_penalty=1e-3, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
257 l1_penalty_start=sys.maxint, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
258 p_training_start=2*epoch_size//batchsize, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
259 persistent_chains=False) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
260 rbm=trainer.rbm |
1507 | 261 learn_fn = theano.function([train_batch], outputs=[], updates=trainer.cd_updates()) |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
262 smplr = trainer._last_cd1_sampler |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
263 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
264 ii = 0 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
265 for i_epoch in range(6): |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
266 for i_batch in xrange(epoch_size // batchsize): |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
267 batch_vals = whitened_patches[i_batch*batchsize:(i_batch+1)*batchsize] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
268 learn_fn(batch_vals) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
269 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
270 if (ii % 1000) == 0: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
271 #tile(imgs_fn(ii), "imgs_%06i.png"%ii) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
272 tile(rbm.U.value.T, "U_%06i.png"%ii) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
273 tile(rbm.W.value.T, "W_%06i.png"%ii) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
274 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
275 print 'saving samples', ii, 'epoch', i_epoch, i_batch |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
276 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
277 print 'l2(U)', l2(rbm.U.value), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
278 print 'l2(W)', l2(rbm.W.value), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
279 print 'l1_penalty', |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
280 try: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
281 print trainer.effective_l1_penalty.value |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
282 except: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
283 print trainer.effective_l1_penalty |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
284 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
285 print 'U min max', rbm.U.value.min(), rbm.U.value.max(), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
286 print 'W min max', rbm.W.value.min(), rbm.W.value.max(), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
287 print 'a min max', rbm.a.value.min(), rbm.a.value.max(), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
288 print 'b min max', rbm.b.value.min(), rbm.b.value.max(), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
289 print 'c min max', rbm.c.value.min(), rbm.c.value.max() |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
290 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
291 print 'HMC step', smplr.stepsize.value, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
292 print 'arate', smplr.avg_acceptance_rate.value |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
293 print 'P min max', rbm.P.value.min(), rbm.P.value.max(), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
294 print 'P_lr', trainer.p_lr.value |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
295 print '' |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
296 print 'Saving rbm...' |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
297 cPickle.dump(rbm, open('mcRBM.rbm.%06i.pkl'%ii, 'w'), -1) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
298 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
299 ii += 1 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
300 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
301 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
302 # extract convolutional features from the CIFAR10 data |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
303 feat_filename = 'mcrbm_features.npy' |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
304 feat_filename = 'cifar10.features.46000.npy' |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
305 try: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
306 open(feat_filename).close() |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
307 load_features = True |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
308 except: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
309 load_features = False |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
310 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
311 if load_features: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
312 print 'Loading features from', feat_filename |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
313 all_features = numpy.load(feat_filename, mmap_mode='r') |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
314 else: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
315 batchsize=100 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
316 feat_idx = tensor.lscalar() |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
317 feat_idx_range = feat_idx * batchsize + tensor.arange(batchsize) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
318 train_batch_x, train_batch_y = pylearn.dataset_ops.cifar10.cifar10( |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
319 feat_idx_range, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
320 split='all', |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
321 dtype='uint8', |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
322 rasterized=False, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
323 color='rgb') |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
324 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
325 WINDOW_SIZE=8 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
326 WINDOW_STRIDE=4 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
327 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
328 # put these into shared vars because support for big matrix constants is bad, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
329 # (comparing them is slow) |
1507 | 330 pca_eigvecs = theano.shared(pca_dct['eig_vecs'].astype('float32')) |
331 pca_eigvals = theano.shared(pca_dct['eig_vals'].astype('float32')) | |
332 pca_mean = theano.shared(pca_dct['mean'].astype('float32')) | |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
333 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
334 def theano_pca_whiten(X): |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
335 #copying preprepcessing.pca.pca_whiten |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
336 return tensor.true_div( |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
337 tensor.dot(X-pca_mean, pca_eigvecs), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
338 tensor.sqrt(pca_eigvals)+1e-8) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
339 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
340 h_list = [] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
341 g_list = [] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
342 for r_offset in range(0, 32-WINDOW_SIZE+1, WINDOW_STRIDE): |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
343 for c_offset in range(0, 32-WINDOW_SIZE+1, WINDOW_STRIDE): |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
344 window = train_batch_x[:, r_offset:r_offset+WINDOW_SIZE, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
345 c_offset:c_offset+WINDOW_SIZE, :] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
346 assert window.dtype=='uint8' |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
347 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
348 #rasterize the patches |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
349 raster_window = tensor.flatten(tensor.cast(window, 'float32'),2) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
350 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
351 #subtract off the mean of each image |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
352 raster_window = raster_window - raster_window.mean(axis=1).reshape((batchsize,1)) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
353 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
354 h,g = rbm.expected_h_g_given_v(theano_pca_whiten(raster_window)) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
355 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
356 h_list.append(h) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
357 g_list.append(g) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
358 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
359 hg = tensor.concatenate(h_list + g_list, axis=1) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
360 |
1507 | 361 feat_fn = theano.function([feat_idx], hg) |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
362 features = numpy.empty((60000, 11025), dtype='float32') |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
363 for i in xrange(60000//batchsize): |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
364 if i % 100 == 0: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
365 print("feature batch %i"%i) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
366 features[i*batchsize:(i+1)*batchsize] = feat_fn(i) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
367 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
368 print("saving features to %s"%feat_filename) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
369 numpy.save(feat_filename, features) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
370 all_features = features |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
371 del features |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
372 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
373 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
374 # CLASSIFY FEATURES |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
375 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
376 if 0: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
377 # nothing to load |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
378 pass |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
379 else: |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
380 batchsize=100 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
381 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
382 if feat_filename.startswith('cifar'): |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
383 learnrate = 0.002 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
384 l1_regularization = 0.004 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
385 anneal_epoch=100 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
386 n_epochs = 500 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
387 else: |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
388 learnrate = 0.005 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
389 l1_regularization = 0.004 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
390 n_epochs = 100 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
391 anneal_epoch=20 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
392 |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
393 x_i = tensor.matrix() |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
394 y_i = tensor.ivector() |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
395 lr = tensor.scalar() |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
396 #l1_regularization = float(sys.argv[1]) #1.e-3 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
397 #l2_regularization = float(sys.argv[2]) #1.e-3*0 |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
398 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
399 feature_logreg = LogisticRegression.new(x_i, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
400 n_in = 11025, n_out=10, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
401 dtype=x_i.dtype) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
402 |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
403 # marc'aurelio does this... |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
404 feature_logreg.w.value = numpy.random.RandomState(44).randn(11025,10)*.02 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
405 |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
406 traincost = feature_logreg.nll(y_i).sum() |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
407 traincost = traincost + abs(feature_logreg.w).sum() * l1_regularization |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
408 #traincost = traincost + (feature_logreg.w**2).sum() * l2_regularization |
1507 | 409 train_logreg_fn = theano.function([x_i, y_i, lr], |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
410 [feature_logreg.nll(y_i).mean(), |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
411 feature_logreg.errors(y_i).mean()], |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
412 updates=pylearn.gd.sgd.sgd_updates( |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
413 params=feature_logreg.params, |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
414 grads=tensor.grad(traincost, feature_logreg.params), |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
415 stepsizes=[lr,lr/10.])) |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
416 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
417 all_labels = pylearn.dataset_ops.cifar10.all_data_labels('uint8')[1] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
418 pylearn.dataset_ops.cifar10.all_data_labels.forget() # clear memo cache |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
419 assert len(all_labels)==60000 |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
420 if 0: |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
421 print "Using validation set" |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
422 train_labels = all_labels[:40000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
423 valid_labels = all_labels[40000:50000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
424 test_labels = all_labels[50000:60000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
425 train_features = all_features[:40000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
426 valid_features = all_features[40000:50000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
427 test_features = all_features[50000:60000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
428 else: |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
429 print "NOT USING validation set" |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
430 train_labels = all_labels[:50000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
431 valid_labels = None |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
432 test_labels = all_labels[50000:60000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
433 train_features = all_features[:50000] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
434 valid_features = None |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
435 test_features = all_features[50000:60000] |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
436 |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
437 if 1: |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
438 print "Computing mean and std.dev" |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
439 train_mean = train_features.mean(axis=0) |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
440 train_std = train_features.std(axis=0)+1e-4 |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
441 preproc = lambda x: (x-train_mean)/(0.1+train_std) |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
442 else: |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
443 print "Not centering data" |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
444 preproc = lambda x:x |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
445 |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
446 for epoch in xrange(n_epochs): |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
447 print 'epoch', epoch |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
448 # validate |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
449 # Marc'Aurelio, you crazy!! |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
450 # the division by batchsize is done in the cost function |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
451 e_lr = learnrate / (batchsize*max(1.0, numpy.floor(max(1., epoch/float(anneal_epoch))-2))) |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
452 |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
453 if valid_features is not None: |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
454 l01s = [] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
455 nlls = [] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
456 for i in xrange(10000/batchsize): |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
457 x_i = valid_features[i*batchsize:(i+1)*batchsize] |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
458 y_i = valid_labels[i*batchsize:(i+1)*batchsize] |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
459 |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
460 #lr=0.0 -> no learning, safe for validation set |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
461 nll, l01 = train_logreg_fn(preproc(x_i), y_i, 0.0) |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
462 nlls.append(nll) |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
463 l01s.append(l01) |
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
464 print 'validate log_reg', numpy.mean(nlls), numpy.mean(l01s) |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
465 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
466 # test |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
467 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
468 l01s = [] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
469 nlls = [] |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
470 for i in xrange(len(test_features)//batchsize): |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
471 x_i = test_features[i*batchsize:(i+1)*batchsize] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
472 y_i = test_labels[i*batchsize:(i+1)*batchsize] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
473 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
474 #lr=0.0 -> no learning, safe for validation set |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
475 nll, l01 = train_logreg_fn(preproc(x_i), y_i, 0.0) |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
476 nlls.append(nll) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
477 l01s.append(l01) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
478 print 'test log_reg', numpy.mean(nlls), numpy.mean(l01s) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
479 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
480 #train |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
481 l01s = [] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
482 nlls = [] |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
483 for i in xrange(len(train_features)//batchsize): |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
484 x_i = train_features[i*batchsize:(i+1)*batchsize] |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
485 y_i = train_labels[i*batchsize:(i+1)*batchsize] |
1333
c7b2da4e2df6
modifs to test_mcRBM to reproduce mcRBM classif results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
486 nll, l01 = train_logreg_fn(preproc(x_i), y_i, e_lr) |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
487 nlls.append(nll) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
488 l01s.append(l01) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
489 print 'train log_reg', numpy.mean(nlls), numpy.mean(l01s) |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
490 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
491 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
492 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
493 |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
494 import pickle as cPickle |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
495 #import cPickle |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
496 if __name__ == '__main__': |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
497 if 0: |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
498 #learning 16 x 16 pinwheel filters from official cifar patches (MAR) |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
499 rbm,smplr = test_reproduce_ranzato_hinton_2010( |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
500 as_unittest=False, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
501 n_train_iters=5000, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
502 rbm_alloc=lambda n_I : mcRBM_withP.alloc_topo_P(n_I, n_J=81), |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
503 trainer_alloc=mcRBMTrainer.alloc_for_P, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
504 dataset='MAR' |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
505 ) |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
506 |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
507 if 0: |
1286
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
508 # pretraining settings |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
509 rbm,smplr = test_reproduce_ranzato_hinton_2010( |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
510 as_unittest=False, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
511 n_train_iters=60000, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
512 rbm_alloc=lambda n_I : mcRBM_withP.alloc_topo_P(n_I, n_J=81), |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
513 trainer_alloc=mcRBMTrainer.alloc_for_P, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
514 lr_per_example=0.05, |
1286
8905186b176c
test_mcRBM - added code to iterate over tinyimages
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1284
diff
changeset
|
515 dataset='tinyimages_patches', |
1284
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
516 l1_penalty=1e-3, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
517 l1_penalty_start=30000, |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
518 #l1_penalty_start=350, #DEBUG |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
519 persistent_chains=False |
1817485d586d
mcRBM - many changes incl. adding support for pooling matrix
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1273
diff
changeset
|
520 ) |
1323
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
521 |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
522 if 1: |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
523 def checkpoint(): |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
524 return checkpoint |
d6726417cf57
adding training script for test_mcRBM to reproduce classification results
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1286
diff
changeset
|
525 run_classif_experiment(checkpoint=checkpoint) |
1332
837768915081
added test idea to test_mcRBM
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
1323
diff
changeset
|
526 |