mirror of
https://github.com/moses-smt/mosesdecoder.git
synced 2024-12-26 05:14:36 +03:00
27 lines
631 B
C++
27 lines
631 B
C++
#include "hash.hh"
|
|
|
|
// Hashes the bytes referenced by `text` with util::MurmurHashNative and
// returns the resulting 64-bit key. The length passed to the hash is
// text.size(), so the view does not need to be null-terminated.
uint64_t getHash(StringPiece text) {
  return util::MurmurHashNative(text.data(), text.size());
}
|
|
|
|
// Walks `textin` with a util::TokenIter delimited by a single space character
// and returns the getHash() value of every token, in the order the iterator
// yields them.
std::vector<uint64_t> getVocabIDs(StringPiece textin){
  std::vector<uint64_t> ids;

  // The iterator converts to false once the input is exhausted.
  for (util::TokenIter<util::SingleCharacter> token(textin, util::SingleCharacter(' '));
       token;
       ++token) {
    ids.push_back(getHash(*token));
  }

  return ids;
}
|
|
|
|
uint64_t getVocabID(std::string candidate) {
|
|
std::size_t len = candidate.length();
|
|
uint64_t key = util::MurmurHashNative(candidate.c_str(), len);
|
|
return key;
|
|
} |