pylearn: pmat.py comparison

comparison pmat.py @ 380:c2f17f231960

added function to load amat file

author	Frederic Bastien <bastienf@iro.umontreal.ca>
date	Wed, 09 Jul 2008 16:55:27 -0400
parents	9330d941fa1f
children

comparison

equal deleted inserted replaced

-:74b402b5a81b
+:c2f17f231960
 # Author: Pascal Vincent
 #import numarray, sys, os, os.path
 import numpy.numarray, sys, os, os.path
+import fpconst
 def array_columns( a, cols ):
 indices = None
 if isinstance( cols, int ):
 indices = [ cols ]
 row = row.split()
 if len(row)>0:
 fieldnames.append(row[0])
 f.close()
 else:
+self.fieldnames = [ "field_"+str(i) for i in range(a.shape[1]) ]
+return dataset.ArrayDataSet(a,lookup_list.LookupList(fieldnames,[x for x in range(a.shape[1])]))
def load_amat_as_array_dataset(fname):
    """Load a PLearn .amat file and wrap it in a ``dataset.ArrayDataSet``.

    Args:
        fname: Path of the .amat file, passed unchanged to ``readAMat``.

    Returns:
        ``dataset.ArrayDataSet`` built from the loaded array and a
        ``lookup_list.LookupList`` that pairs each field name with its
        column index.
    """
    # Project-local modules are imported lazily, as in the original code.
    import dataset
    import lookup_list

    # Load the amat as an array together with its declared field names.
    a, fieldnames = readAMat(fname)

    # The file declared no field names: synthesize "field_<i>" per column.
    # This must rebind the local ``fieldnames``; the previous code assigned
    # to ``self.fieldnames``, but there is no ``self`` in a plain function,
    # so that branch raised NameError.
    if len(fieldnames) == 0:
        fieldnames = ["field_" + str(i) for i in range(a.shape[1])]

    column_indices = list(range(a.shape[1]))
    return dataset.ArrayDataSet(
        a, lookup_list.LookupList(fieldnames, column_indices))
 def save_array_dataset_as_pmat(fname,ds):
 self.putRow(i,row)
 # Support len(obj) by returning the value stored in self.length.
 def __len__(self):
 return self.length
+#copied from PLEARNDIR:python_modules/plearn/vmat/readAMat.py
def safefloat(str):
    """Convert the given string to its float value.

    It is 'safe' in the sense that missing values ('nan', in any letter
    case) are converted to a real NaN float, contrary to what a bare
    ``float(str)`` did on some platforms with old interpreters.

    Args:
        str: Text of a single numeric field. The name shadows the builtin
            but is kept so that existing keyword callers keep working.

    Returns:
        The parsed float, or NaN when the text is 'nan'.

    Raises:
        ValueError: If the text is not a valid float literal.
    """
    if str.lower() == 'nan':
        # float('nan') is portable since Python 2.6, so the third-party
        # fpconst module is no longer needed just to obtain a NaN.
        return float('nan')
    return float(str)
+#copied from PLEARNDIR:python_modules/plearn/vmat/readAMat.py
def readAMat(amatname):
    """Read a PLearn .amat file and return its data and field names.

    A line starting with '#:' lists the whitespace-separated field names.
    Every other line starting with '#' (including the '#size:' and
    '#sizes:' headers) is ignored. Each remaining non-blank line is parsed
    as one row of floats with ``safefloat``.

    Args:
        amatname: Path of the .amat file to read.

    Returns:
        A tuple ``(array, fieldnames)``: the rows converted with
        ``numpy.numarray.array``, and the field names as a list of strings
        (empty when the file has no '#:' line).

    Raises:
        ValueError: If a data field is not a valid float literal.
    """
    ### NOTE: collecting the rows in a list and converting once is much
    ### faster than first creating the array and updating each row as it
    ### is read.
    rows = []
    fieldnames = []
    # 'with' closes the file even when a row fails to parse; the previous
    # explicit f.close() was skipped on any exception.
    with open(amatname) as f:
        for line in f:
            if line.startswith("#:"):
                fieldnames = line[2:].strip().split()
            elif not line.startswith('#'):
                # Add all non-comment, non-blank lines.
                row = [safefloat(x) for x in line.split()]
                if row:
                    rows.append(row)
            # Other '#' lines are comments. The '#size:' values were
            # unpacked but never used, so they are no longer parsed.
    return numpy.numarray.array(rows), fieldnames
 if __name__ == '__main__':
 pmat = PMat( 'tmp.pmat', 'w', fieldnames=['F1', 'F2'] )
 pmat.append( [1, 2] )
 pmat.append( [3, 4] )

Mercurial > pylearn

comparison pmat.py @ 380:c2f17f231960