view pylearn/datasets/caltech.py @ 1476:8c10bda4bb5f

Configured default train/valid/test split for icml07.MNIST_rotated_background dataset. Defaults are the ones used by Hugo in the ICML07 paper and in all contracting auto-encoder papers.
author gdesjardins
date Fri, 20 May 2011 16:53:00 -0400
parents 124b939d997f
children 4727a7e4d506
line wrap: on
line source

"""
Routines to load/access the Caltech silhouettes dataset.
"""

import os
import numpy

from pylearn.io.pmat import PMat
from pylearn.datasets.config import data_root # config
from pylearn.datasets.dataset import Dataset

def caltech_silhouette():
    """
    Load the Caltech silhouettes train/valid/test splits from disk.

    The arrays are read with `numpy.load` from the 'caltech_silhouettes'
    directory located under `data_root()`.

    :returns: a `Dataset` whose `train`, `valid` and `test` attributes are
        `Dataset.Obj` instances holding the loaded data array as `x` and the
        loaded label array as `y`. The returned object also carries
        `n_classes` (101) and `img_shape` ((28, 28)).
    """
    dataset = Dataset()

    base_dir = os.path.join(data_root(), 'caltech_silhouettes')

    # (attribute on the returned dataset, data file, label file).
    # Note that the validation files on disk use the 'val' prefix while the
    # attribute is named 'valid'.
    split_files = (
        ('train', 'train_data.npy', 'train_labels.npy'),
        ('valid', 'val_data.npy', 'val_labels.npy'),
        ('test', 'test_data.npy', 'test_labels.npy'),
    )

    for split_name, data_file, labels_file in split_files:
        split = Dataset.Obj(
            x=numpy.load(os.path.join(base_dir, data_file)),
            y=numpy.load(os.path.join(base_dir, labels_file)))
        setattr(dataset, split_name, split)

    # Dataset-level metadata; presumably each row of `x` is a flattened
    # 28x28 image -- TODO confirm against the stored arrays.
    dataset.img_shape = (28, 28)
    dataset.n_classes = 101

    return dataset