crawlserv++  [under development]
Application for crawling and analyzing textual content of websites.
crawlservpp::Data::TopicModel Member List

This is the complete list of members for crawlservpp::Data::TopicModel, including all inherited members.

addDocument(const std::string &name, const std::vector< std::string > &tokens, std::size_t firstToken, std::size_t numTokens) | crawlservpp::Data::TopicModel | inline
clear(bool labelingOptions) | crawlservpp::Data::TopicModel | inline
getBurnInIterations() const | crawlservpp::Data::TopicModel | inline
getDocumentId(const std::string &name) const | crawlservpp::Data::TopicModel | inline
getDocuments() const | crawlservpp::Data::TopicModel | inline
getDocumentsTopics(std::unordered_set< std::string > &done) const | crawlservpp::Data::TopicModel | inline
getDocumentsTopics(const std::vector< std::vector< std::string >> &documents, std::size_t maxIterations, std::size_t numberOfWorkers) const | crawlservpp::Data::TopicModel | inline
getIterations() const | crawlservpp::Data::TopicModel | inline
getLogLikelihoodPerToken() const | crawlservpp::Data::TopicModel | inline
getModelInfo() const | crawlservpp::Data::TopicModel | inline
getModelName() const | crawlservpp::Data::TopicModel | inline
getNumberOfDocuments() const | crawlservpp::Data::TopicModel | inline
getNumberOfTokens() const | crawlservpp::Data::TopicModel | inline
getNumberOfTopics() const | crawlservpp::Data::TopicModel | inline
getOriginalVocabularySize() const | crawlservpp::Data::TopicModel | inline
getParameterOptimizationInterval() const | crawlservpp::Data::TopicModel | inline
getRandomNumberGenerationSeed() const | crawlservpp::Data::TopicModel | inline
getRemovedTokens() const | crawlservpp::Data::TopicModel | inline
getTermWeighting() const | crawlservpp::Data::TopicModel | inline
getTokenEntropy() const | crawlservpp::Data::TopicModel | inline
getTopics() const | crawlservpp::Data::TopicModel | inline
getTopicsSorted() const | crawlservpp::Data::TopicModel | inline
getTopicTopNLabels(std::size_t topic, std::size_t n) const | crawlservpp::Data::TopicModel | inline
getTopicTopNTokens(std::size_t topic, std::size_t n) const | crawlservpp::Data::TopicModel | inline
getVocabulary() const | crawlservpp::Data::TopicModel | inline
getVocabularySize() const | crawlservpp::Data::TopicModel | inline
label(std::size_t threads) | crawlservpp::Data::TopicModel | inline
load(const std::string &fileName) | crawlservpp::Data::TopicModel | inline
save(const std::string &fileName, bool full) const | crawlservpp::Data::TopicModel | inline
setBurnInIteration(std::size_t skipIterations) | crawlservpp::Data::TopicModel | inline
setFixedNumberOfTopics(std::size_t k) | crawlservpp::Data::TopicModel | inline
setInitialParameters(std::size_t initialTopics, float alpha, float eta, float gamma) | crawlservpp::Data::TopicModel | inline
setLabelingOptions(bool activate, std::size_t minCf, std::size_t minDf, std::size_t minLength, std::size_t maxLength, std::size_t maxCandidates, float smoothing, float mu, std::size_t windowSize) | crawlservpp::Data::TopicModel | inline
setParameterOptimizationInterval(std::size_t interval) | crawlservpp::Data::TopicModel | inline
setRandomNumberGenerationSeed(std::size_t newSeed) | crawlservpp::Data::TopicModel | inline
setTokenRemoval(std::size_t collectionFrequency, std::size_t documentFrequency, std::size_t fixedNumberOfTopTokens) | crawlservpp::Data::TopicModel | inline
setUseIdf(bool idf) | crawlservpp::Data::TopicModel | inline
startTraining() | crawlservpp::Data::TopicModel | inline
train(std::size_t iterations, std::size_t threads) | crawlservpp::Data::TopicModel | inline