mosesdecoder/mert/Vocabulary.cpp
Tetsuo Kiso 8fdec9bf30 Use boost::unordered_map instead of std::map.
For storing the word vocabulary used in computation of
BLEU scores. This change will reduce the running time
of extractor about 2-3 seconds (9% reduction).
2012-12-07 05:12:24 +09:00

44 lines
908 B
C++

#include "Vocabulary.h"
#include "Singleton.h"
namespace mert {
namespace {
Vocabulary* g_vocab = NULL;
} // namespace
int Vocabulary::Encode(const std::string& token) {
iterator it = m_vocab.find(token);
int encoded_token;
if (it == m_vocab.end()) {
// Add an new entry to the vocaburary.
encoded_token = static_cast<int>(m_vocab.size());
m_vocab[token] = encoded_token;
} else {
encoded_token = it->second;
}
return encoded_token;
}
bool Vocabulary::Lookup(const std::string&str , int* v) const {
const_iterator it = m_vocab.find(str);
if (it == m_vocab.end()) return false;
*v = it->second;
return true;
}
Vocabulary* VocabularyFactory::GetVocabulary() {
if (g_vocab == NULL) {
return MosesTuning::Singleton<Vocabulary>::GetInstance();
} else {
return g_vocab;
}
}
void VocabularyFactory::SetVocabulary(Vocabulary* vocab) {
g_vocab = vocab;
}
} // namespace mert