Mercurial > pylearn
view sandbox/embeddings/one-per-line.py @ 467:f3711bcc467e
Fixed a bug in how embeddings are read
author | Joseph Turian <turian@iro.umontreal.ca> |
---|---|
date | Mon, 20 Oct 2008 19:14:06 -0400 |
parents | 131e19dfe793 |
children |
line wrap: on
line source
#!/usr/bin/python
"""Print the embedding weights stored in ``weightsfile``, one vector per line.

The first line of the weights file is read and discarded; the second line
must contain exactly ``size * dimensions`` whitespace-separated floats.
Each output line holds ``dimensions`` tab-separated values written with
``repr``.

Ordering: the flat value list is reversed and then walked in chunks from the
last chunk to the first.  The net effect is that vectors are emitted in the
order they appear in the file, with the components of each vector reversed.
"""

import math
import string
import sys

import numpy
#import psyco

from common.str import percent

weightsfile = "lm-weights.txt"
vocabfile = "words.asc"
size = 30000
dimensions = 50

word_to_vector = {}

# Use a context manager so the handle is closed even if parsing fails.
with open(weightsfile) as f:
    f.readline()  # first line is skipped (presumably a header -- confirm)
    vals = [float(v) for v in f.readline().split()]

# Explicit check instead of ``assert`` so it still runs under ``python -O``
# and reports what was actually found.
if len(vals) != size * dimensions:
    raise ValueError(
        "expected %d values (%d x %d) in %s, found %d"
        % (size * dimensions, size, dimensions, weightsfile, len(vals))
    )

vals.reverse()

# Walk the chunks of the reversed list back to front (see module docstring
# for the resulting order).
for i in reversed(range(size)):
    row = vals[dimensions * i:dimensions * (i + 1)]
    # print(...) with a single argument behaves the same on Python 2 and 3.
    print("\t".join(repr(value) for value in row))