#!/usr/bin/env bash
#
# Demo: train word vectors on the text8 corpus and evaluate them on the
# word-analogy question set.
#
# Steps:
#   1. Build the tools with `make`.
#   2. Download and unpack the text8 corpus, unless ./text8 already exists.
#   3. Train vectors with ./word2vec into vectors.bin (wall time is reported).
#   4. Score the vectors with ./compute-accuracy against questions-words.txt.
#
# Run from the directory that holds the Makefile and questions-words.txt.
# Requires: make, wget, gzip.

# Stop at the first failing step so later steps never run against missing or
# stale files (e.g. evaluating an old vectors.bin after a failed training run).
set -euo pipefail

readonly CORPUS=text8
readonly CORPUS_URL=http://mattmahoney.net/dc/text8.zip
# The download is a zip archive, but it is stored under a .gz name on purpose:
# gzip only accepts suffixes it knows, and `gzip -d text8.gz` then unpacks to
# "text8". This relies on gzip's ability to decompress single-member zip files.
readonly ARCHIVE=text8.gz
readonly VECTORS=vectors.bin
readonly QUESTIONS=questions-words.txt

make

if [[ ! -e "$CORPUS" ]]; then
  if ! wget "$CORPUS_URL" -O "$ARCHIVE"; then
    # wget -O creates the output file even when the transfer fails; remove the
    # empty/partial archive so it cannot be mistaken for a good download.
    rm -f -- "$ARCHIVE"
    printf 'error: failed to download %s\n' "$CORPUS_URL" >&2
    exit 1
  fi
  # -f overwrites any leftover output from an earlier interrupted run.
  gzip -d -f -- "$ARCHIVE"
fi

time ./word2vec -train "$CORPUS" -output "$VECTORS" -cbow 1 -size 200 -window 8 -negative 25 -hs 0 -sample 1e-4 -threads 20 -binary 1 -iter 15

./compute-accuracy "$VECTORS" 30000 < "$QUESTIONS"
# to compute accuracy with the full vocabulary, use: ./compute-accuracy vectors.bin < questions-words.txt