|
Joshua
open source statistical hierarchical phrase-based machine translation system
|
#include <vocab.hh>
Public Member Functions | |
| SortedVocabulary () | |
| WordIndex | Index (const StringPiece &str) const |
| WordIndex | Bound () const |
| void | SetupMemory (void *start, std::size_t allocated, std::size_t entries, const Config &config) |
| void | ConfigureEnumerate (EnumerateVocab *to, std::size_t max_entries) |
| WordIndex | Insert (const StringPiece &str) |
| void | FinishedLoading (ProbBackoff *reorder_vocab) |
| std::size_t | UnkCountChangePadding () const |
| bool | SawUnk () const |
| void | LoadedBinary (int fd, EnumerateVocab *to) |
Static Public Member Functions | |
| static size_t | Size (std::size_t entries, const Config &config) |
Private Attributes | |
| uint64_t * | begin_ |
| uint64_t * | end_ |
| WordIndex | bound_ |
| WordIndex | highest_value_ |
| bool | saw_unk_ |
| EnumerateVocab * | enumerate_ |
| std::vector< std::string > | strings_to_enumerate_ |
WordIndex lm::ngram::SortedVocabulary::Bound() const
void lm::ngram::SortedVocabulary::ConfigureEnumerate(EnumerateVocab *to, std::size_t max_entries)
void lm::ngram::SortedVocabulary::FinishedLoading(ProbBackoff *reorder_vocab)
WordIndex lm::ngram::SortedVocabulary::Index(const StringPiece &str) const [virtual]
Implements lm::base::Vocabulary.
WordIndex lm::ngram::SortedVocabulary::Insert(const StringPiece &str)
void lm::ngram::SortedVocabulary::LoadedBinary(int fd, EnumerateVocab *to)
bool lm::ngram::SortedVocabulary::SawUnk() const
void lm::ngram::SortedVocabulary::SetupMemory(void *start, std::size_t allocated, std::size_t entries, const Config &config)
std::size_t lm::ngram::SortedVocabulary::Size(std::size_t entries, const Config &config) [static]
std::size_t lm::ngram::SortedVocabulary::UnkCountChangePadding() const
uint64_t * lm::ngram::SortedVocabulary::begin_ [private]
WordIndex lm::ngram::SortedVocabulary::bound_ [private]
uint64_t * lm::ngram::SortedVocabulary::end_ [private]
bool lm::ngram::SortedVocabulary::saw_unk_ [private]
std::vector<std::string> lm::ngram::SortedVocabulary::strings_to_enumerate_ [private]