#include "gflags/gflags.h"
#include "constants.h"
#include "tbb/task_scheduler_init.h"
Go to the source code of this file.
Functions | |
DEFINE_int32 (iter, 1000,"Number of iterations the topic modeller should be run") | |
DEFINE_int32 (burnin, 299,"Number of iterations after which alpha optimization should be to be run after every <optimizestats> iterations") | |
DEFINE_int32 (optimizestats, 25,"Optimize hyper parameters every these many iterations") | |
DEFINE_int32 (printloglikelihood, 25,"Print log likelihood after every <printlogLikelihood> iterations after burn-in") | |
DEFINE_int32 (topics, 100,"The number of topics to be used by LDA.") | |
DEFINE_string (inputprefix,"lda","The output prefix used for the FormatData routine") | |
DEFINE_string (dumpprefix,"","The word-topic counts are initialized from this file which is generated by the preprocessing step or at the end of an iteration") | |
DEFINE_bool (restart, false,"Indicates use of failure recovery mode. The iteration to start with should also be specified") | |
DEFINE_bool (online, false,"Uses online initialization instead of random") | |
DEFINE_int32 (startiter, 1,"This the iteration at which failure recovery should start") | |
DEFINE_bool (test, false,"Run the test pipeline. No updates are done & requires an earlier dump of the word-topic counts table") | |
DEFINE_bool (teststream, false,"Run the test pipeline in streaming mode. Formatting is a part of the pipeline. No updates are done & requires an earlier dump of the word-topic counts table & dictionary") | |
DEFINE_double (alpha, ALPHA_SUM,"Weight of the Dirichlet conjugate for topics") | |
DEFINE_double (beta, BETA,"Weight of the Dirichlet conjugate for words") | |
DEFINE_int32 (chkptinterval, 25,"The topic assignments are saved every these many iterations") | |
DEFINE_string (chkptdir,"","The directory to which the checkpoints need to written") | |
DEFINE_string (servers,"specify","The set of all memcached servers that are storing the state. E.g. 192.168.0.1, 192.168.0.3:44, 200.132.12.34") | |
DEFINE_int32 (numdumps, 1,"Number of word-topic count dumps in the training data") | |
DEFINE_int32 (maxmemory, 2048,"The max memory that can be used") | |
DEFINE_string (dictionary,"specify","The dump of the global dictionary produced in the training run. To be use for teststream") | |
DEFINE_int32 (livetokens, 500,"Max Live Tokens in pipeline") | |
DEFINE_int32 (model, 1,"Unigram-1") | |
DEFINE_int32 (samplerthreads, tbb::task_scheduler_init::automatic,"The number of foreground threads that run actual LDA pipeline. Default is to figure out automatically") |
DEFINE_bool | ( | teststream | , | |
false | , | |||
"Run the test pipeline in streaming mode. Formatting is a part of the pipeline. No updates are done & requires an earlier dump of the word-topic counts table & dictionary" | ||||
) |
DEFINE_bool | ( | test | , | |
false | , | |||
"Run the test pipeline. No updates are done & requires an earlier dump of the word-topic counts table" | ||||
) |
DEFINE_bool | ( | online | , | |
false | , | |||
"Uses online initialization instead of random" | ||||
) |
DEFINE_bool | ( | restart | , | |
false | , | |||
"Indicates use of failure recovery mode. The iteration to start with should also be specified" | ||||
) |
DEFINE_double | ( | beta | , | |
BETA | , | |||
"Weight of the Dirichlet conjugate for words" | ||||
) |
DEFINE_double | ( | alpha | , | |
ALPHA_SUM | , | |||
"Weight of the Dirichlet conjugate for topics" | ||||
) |
DEFINE_int32 | ( | samplerthreads | , | |
tbb::task_scheduler_init::automatic | , | |||
"The number of foreground threads that run actual LDA pipeline. Default is to figure out automatically" | ||||
) |
DEFINE_int32 | ( | model | , | |
1 | , | |||
"Unigram-1" | ||||
) |
DEFINE_int32 | ( | livetokens | , | |
500 | , | |||
"Max Live Tokens in pipeline" | ||||
) |
DEFINE_int32 | ( | maxmemory | , | |
2048 | , | |||
"The max memory that can be used" | ||||
) |
DEFINE_int32 | ( | numdumps | , | |
1 | , | |||
"Number of word-topic count dumps in the training data" | ||||
) |
DEFINE_int32 | ( | chkptinterval | , | |
25 | , | |||
"The topic assignments are saved every these many iterations" | ||||
) |
DEFINE_int32 | ( | startiter | , | |
1 | , | |||
"This the iteration at which failure recovery should start" | ||||
) |
DEFINE_int32 | ( | topics | , | |
100 | , | |||
"The number of topics to be used by LDA." | ||||
) |
DEFINE_int32 | ( | printloglikelihood | , | |
25 | , | |||
"Print log likelihood after every <printlogLikelihood> iterations after burn-in" | ||||
) |
DEFINE_int32 | ( | optimizestats | , | |
25 | , | |||
"Optimize hyper parameters every these many iterations" | ||||
) |
DEFINE_int32 | ( | burnin | , | |
299 | , | |||
"Number of iterations after which alpha optimization should be to be run after every <optimizestats> iterations" | ||||
) |
DEFINE_int32 | ( | iter | , | |
1000 | , | |||
"Number of iterations the topic modeller should be run" | ||||
) |
DEFINE_string | ( | dictionary | , | |
"specify" | , | |||
"The dump of the global dictionary produced in the training run. To be use for teststream" | ||||
) |
DEFINE_string | ( | servers | , | |
"specify" | , | |||
"The set of all memcached servers that are storing the state. E.g. 192.168.0.1, 192.168.0.3:44, 200.132.12.34" | ||||
) |
DEFINE_string | ( | chkptdir | , | |
"" | , | |||
"The directory to which the checkpoints need to written" | ||||
) |
DEFINE_string | ( | dumpprefix | , | |
"" | , | |||
"The word-topic counts are initialized from this file which is generated by the preprocessing step or at the end of an iteration" | ||||
) |
DEFINE_string | ( | inputprefix | , | |
"lda" | , | |||
"The output prefix used for the FormatData routine" | ||||
) |