view sandbox/embeddings/files.py @ 459:f400f62e7f9e

Fixed embedding preprocessing
author Joseph Turian <turian@iro.umontreal.ca>
date Tue, 07 Oct 2008 23:00:10 -0400
parents ed6b0b3be8d2
children
line wrap: on
line source

"""
Locations and basic parameters of the embedding data files.

Everything here is a plain module-level constant; importing this module
performs no I/O and does not check that the paths exist.
"""

# Absolute paths to the two data files (both live in the same directory).
# NOTE(review): judging by the names, the first holds the embedding weights
# and the second the vocabulary list -- confirm against the code that reads
# them.
WEIGHTSFILE = "/u/turian/data/word_embeddings.collobert-and-weston/lm-weights.txt"
VOCABFILE = "/u/turian/data/word_embeddings.collobert-and-weston/words.asc"

# NOTE(review): presumably the vocabulary size and the length of each
# embedding vector -- verify against the data files above.
NUMBER_OF_WORDS, DIMENSIONS = 30000, 50

# NOTE(review): presumably the vocabulary entry used for out-of-vocabulary
# words -- confirm against the consumer of this constant.
UNKNOWN = "UNKNOWN"