File tree Expand file tree Collapse file tree
# Demo: learn phrase vectors from the text8 corpus and measure their accuracy.
#
# Run from the directory that holds the Makefile and questions-phrases.txt;
# every path below is relative to the current directory.
#
# Steps:
#   1. run make (expected to provide ./word2phrase, ./word2vec and
#      ./compute-accuracy)
#   2. download the text8 corpus unless a file named text8 already exists
#   3. word2phrase: text8        -> text8-phrase
#   4. word2vec:    text8-phrase -> vectors-phrase.bin
#   5. compute-accuracy reads questions-phrases.txt on stdin

# Stop at the first failing step so later steps never run on missing or
# stale inputs (e.g. training after a failed build or download).
set -e

make

if [ ! -e text8 ]; then
  # The archive is a .zip, saved under a .gz name on purpose: gzip can unpack
  # a zip file that has a single deflate-compressed member, and "gzip -d"
  # then writes the result to "text8" (the name minus ".gz").
  wget http://mattmahoney.net/dc/text8.zip -O text8.gz
  gzip -d -f text8.gz
fi

# Horizontal rule framing the notice below.
rule='----------------------------------------------------------------------------------------------------------------'
printf '%s\n' "$rule"
printf '%s\n' 'Note that the accuracy and coverage of the test set questions is going to be low with this small training corpus'
printf '%s\n' 'To achieve better accuracy, larger training set is needed'
printf '%s\n' "$rule"

# Build the phrase corpus from the raw text.
time ./word2phrase -train text8 -output text8-phrase -threshold 500 -debug 2 -min-count 3

# Train vectors on the phrase corpus and write them to vectors-phrase.bin.
time ./word2vec -train text8-phrase -output vectors-phrase.bin -cbow 0 -size 300 -window 10 -negative 0 -hs 1 -sample 1e-3 -threads 12 -binary 1 -min-count 3

# Evaluate the trained vectors against the phrase question set.
./compute-accuracy vectors-phrase.bin < questions-phrases.txt
You can’t perform that action at this time.
0 commit comments