Class Vocab

Class Documentation

class Vocab

Public Functions

Vocab(Ptr<Options> options, size_t batchIndex)
size_t loadOrCreate(const std::string &vocabPath, const std::vector<std::string> &trainPaths, size_t maxSize = 0)
size_t load(const std::string &vocabPath, size_t maxSize = 0)
void create(const std::string &vocabPath, const std::vector<std::string> &trainPaths, size_t maxSize)
void create(const std::string &vocabPath, const std::string &trainPath, size_t maxSize)
Word operator[](const std::string &word) const
const std::string &operator[](Word word) const
Words encode(const std::string &line, bool addEOS = true, bool inference = false) const
std::string decode(const Words &sentence, bool ignoreEOS = true) const
std::string surfaceForm(const Words &sentence) const
size_t size() const
size_t lemmaSize() const
std::string type() const
Word getEosId() const
Word getUnkId() const
std::vector<Word> suppressedIds(bool suppressUnk = true, bool suppressSpecial = true) const
std::vector<WordIndex> suppressedIndices(bool suppressUnk = true, bool suppressSpecial = true) const
std::string toUpper(const std::string &line) const
std::string toEnglishTitleCase(const std::string &line) const
void transcodeToShortlistInPlace(WordIndex *ptr, size_t num) const
void createFake()
Word randWord()
template<class VocabType> Ptr<VocabType> tryAs() const