mosesdecoder/probingpt/querying.h
2017-02-16 19:30:07 +00:00

80 lines
1.8 KiB
C++

#pragma once
#include <boost/iostreams/device/mapped_file.hpp>
#include <boost/unordered_map.hpp>
#include <sys/stat.h> //For finding size of file
#include <algorithm> //toLower
#include <deque>
#include "vocabid.h"
#include "probing_hash_utils.h"
#include "hash.h" //Includes line splitter
#include "line_splitter.h"
#include "util.h"
#include "moses2/legacy/Util2.h"
namespace probingpt
{
class QueryEngine
{
std::map<uint64_t, std::string> source_vocabids;
typedef std::vector<unsigned char> Alignments;
std::vector<Alignments> alignColl;
Table table;
char *mem; //Memory for the table, necessary so that we can correctly destroy the object
size_t table_filesize;
bool is_reordering;
util::scoped_fd file_;
util::scoped_memory memory_;
// target phrases
boost::iostreams::mapped_file_source file;
util::scoped_fd fileTPS_;
util::scoped_memory memoryTPS_;
void read_alignments(const std::string &alignPath);
void file_exits(const std::string &basePath);
public:
int num_scores;
int num_lex_scores;
bool logProb;
const char *memTPS;
QueryEngine(const char *, util::LoadMethod load_method);
~QueryEngine();
std::pair<bool, uint64_t> query(uint64_t key);
const std::map<uint64_t, std::string> &getSourceVocab() const {
return source_vocabids;
}
const std::vector<Alignments> &getAlignments() const {
return alignColl;
}
uint64_t getKey(uint64_t source_phrase[], size_t size) const;
template<typename T>
inline bool Get(const boost::unordered_map<std::string, std::string> &keyValue, const std::string &sought, T &found) const {
boost::unordered_map<std::string, std::string>::const_iterator iter = keyValue.find(sought);
if (iter == keyValue.end()) {
return false;
}
const std::string &foundStr = iter->second;
found = Scan<T>(foundStr);
return true;
}
};
}