annotate pylearn/datasets/flickr.py @ 602:28f7dc848efc

fixed flickr relpath mistake
author James Bergstra <bergstrj@iro.umontreal.ca>
date Wed, 14 Jan 2009 17:22:23 -0500
parents fd95ff96dd47
children f6c74f34cd35
rev   line source
600
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
1 """
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
2 Routines to load variations on the Flickr image dataset.
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
3 """
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
4 from __future__ import absolute_import
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
5
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
6 import os
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
7 import numpy
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
8
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
9 from ..io import filetensor
602
28f7dc848efc fixed flickr relpath mistake
James Bergstra <bergstrj@iro.umontreal.ca>
parents: 601
diff changeset
# The import of ``data_root`` from the package config is switched off with
# ``if 0``; the locally defined fallback in the ``else`` branch is the
# definition that is actually bound at import time.
if 0:
    from .config import data_root
else:
    def data_root():
        """Return the hard-coded directory that holds the Flickr filetensor files."""
        return '/u/lisa/db/flickr/filetensor'
600
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
15 from .dataset import Dataset
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
16
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
17
602
28f7dc848efc fixed flickr relpath mistake
James Bergstra <bergstrj@iro.umontreal.ca>
parents: 601
diff changeset
# File names of the three 10-class splits. They are relative names:
# basic_10class() joins each one onto the dataset root directory.
path_train_10class = 'flickr_10classes_train.ft'
path_valid_10class = 'flickr_10classes_valid.ft'
path_test_10class = 'flickr_10classes_test.ft'
600
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
23
602
28f7dc848efc fixed flickr relpath mistake
James Bergstra <bergstrj@iro.umontreal.ca>
parents: 601
diff changeset
def _read_filetensor(path):
    """Read one filetensor file and return whatever ``filetensor.read`` yields.

    The file is opened in binary mode and is always closed, even when
    ``filetensor.read`` raises.
    """
    # try/finally rather than ``with``: this module only opts in to
    # ``absolute_import``, so it may still have to run on interpreters where
    # the ``with`` statement needs its own __future__ import.
    stream = open(path, 'rb')
    try:
        return filetensor.read(stream)
    finally:
        stream.close()


def _as_split(table):
    """Wrap a 2-d table as a ``Dataset.Obj``.

    All columns but the last become ``x``; the last column is cast to int64
    and becomes ``y``.
    """
    return Dataset.Obj(
        x=table[:, 0:-1],
        y=numpy.asarray(table[:, -1], dtype='int64'))


def basic_10class(folder = None):
    """Return the basic flickr image classification problem.

    The images are 75x75, and there are 7500 training examples.

    :param folder: directory containing the three ``flickr_10classes_*.ft``
        files.  When None, the directory returned by ``data_root()`` is used.

    :returns: a ``Dataset`` whose ``train``, ``valid`` and ``test`` attributes
        are ``Dataset.Obj`` instances with fields ``x`` and ``y``, and whose
        ``n_classes`` is 10 and ``img_shape`` is (75, 75).

    Any error raised by ``open`` (e.g. a missing file) or by
    ``filetensor.read`` propagates to the caller.
    """
    root = data_root() if folder is None else folder

    rval = Dataset()

    # Files are read in the same order as before: train, valid, test.
    rval.train = _as_split(
        _read_filetensor(os.path.join(root, path_train_10class)))
    rval.valid = _as_split(
        _read_filetensor(os.path.join(root, path_valid_10class)))
    rval.test = _as_split(
        _read_filetensor(os.path.join(root, path_test_10class)))

    rval.n_classes = 10
    rval.img_shape = (75, 75)

    return rval
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
49
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
def translations_10class():
    """Placeholder for a 10-class variant that is not implemented yet.

    Always raises NotImplementedError.
    """
    not_done = NotImplementedError('TODO')
    raise not_done
e56303df3c77 initial flickr
James Bergstra <bergstrj@iro.umontreal.ca>
parents:
diff changeset
52