# HG changeset patch
# User James Bergstra
# Date 1231966479 18000
# Node ID e56303df3c773583a2a3afc7c03545f112b9da5a
# Parent bd777e960c7c3c693a903b5fb7a760b5b0123def
initial flickr

diff -r bd777e960c7c -r e56303df3c77 pylearn/datasets/flickr.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/pylearn/datasets/flickr.py Wed Jan 14 15:54:39 2009 -0500
@@ -0,0 +1,78 @@
+"""
+Routines to load variations on the Flickr image dataset.
+"""
+from __future__ import absolute_import
+
+import os
+import numpy
+
+from ..io import filetensor
+from .config import data_root
+from .dataset import Dataset
+
+
+def _load_examples(path):
+    """Read the filetensor stored at `path`, one example per row.
+
+    The file is opened in binary mode and is closed even if reading fails.
+    The returned array is a transposed copy of what `filetensor.read`
+    yields, so the result is stored row major.
+    """
+    f = open(path, 'rb')
+    try:
+        data = filetensor.read(f)
+    finally:
+        f.close()
+    return data.T.copy() #put in to one example per row, row major
+
+
+def test_10class():
+    """Return the 10-class test set, one example per row."""
+    #TODO: make path an option,
+    #TODO: make default path relative to data_root()
+    return _load_examples('flickr_10classes_test.ft')
+
+def train_10class():
+    """Return the 10-class training set, one example per row."""
+    #TODO: make path an option,
+    #TODO: make default path relative to data_root()
+    return _load_examples('flickr_10classes_train.ft')
+
+def valid_10class():
+    """Return the 10-class validation set, one example per row."""
+    #TODO: make path an option,
+    #TODO: make default path relative to data_root()
+    return _load_examples('flickr_10classes_valid.ft')
+
+def basic_10class():
+    """Return the basic flickr image classification problem.
+
+    The images are 75x75, and there are 7500 training examples.
+
+    In every split the last column becomes the int64 target `y` and all
+    other columns become the input `x`.
+    """
+    train = train_10class()
+    valid = valid_10class()
+    test = test_10class()
+
+    rval = Dataset()
+
+    rval.train = Dataset.Obj(
+            x=train[:, 0:-1],
+            y=numpy.asarray(train[:, -1], dtype='int64'))
+    rval.valid = Dataset.Obj(
+            x=valid[:, 0:-1],
+            y=numpy.asarray(valid[:, -1], dtype='int64'))
+    rval.test = Dataset.Obj(
+            x=test[:, 0:-1],
+            y=numpy.asarray(test[:, -1], dtype='int64'))
+
+    rval.n_classes = 10
+    rval.img_shape = (75,75)
+    return rval
+
+def translations_10class():
+    """Not implemented yet; always raises NotImplementedError."""
+    raise NotImplementedError('TODO')
+