mirror of
https://github.com/moses-smt/mosesdecoder.git
synced 2025-01-08 12:36:35 +03:00
54 lines
1.4 KiB
C++
54 lines
1.4 KiB
C++
#pragma once
|
|
|
|
#include <string>
|
|
#include <vector>
|
|
#include "moses/Factor.h"
|
|
#include "moses/Util.h"
|
|
#include "SingleFactor.h"
|
|
#include "moses/TranslationModel/DynSAInclude/onlineRLM.h"
|
|
//#include "multiOnlineRLM.h"
|
|
#include "moses/TranslationModel/DynSAInclude/FileHandler.h"
|
|
#include "moses/TranslationModel/DynSAInclude/vocab.h"
|
|
|
|
namespace Moses
|
|
{
|
|
class Factor;
|
|
class Phrase;
|
|
|
|
/** @todo ask ollie
|
|
*/
|
|
class LanguageModelORLM : public LanguageModelSingleFactor
|
|
{
|
|
public:
|
|
typedef count_t T; // type for ORLM filter
|
|
LanguageModelORLM(const std::string &line)
|
|
:LanguageModelSingleFactor(line)
|
|
,m_lm(0) {
|
|
}
|
|
bool Load(const std::string &filePath, FactorType factorType, size_t nGramOrder);
|
|
virtual LMResult GetValue(const std::vector<const Word*> &contextFactor, State* finalState = NULL) const;
|
|
~LanguageModelORLM() {
|
|
//save LM with markings
|
|
Utils::rtrim(m_filePath, ".gz");
|
|
FileHandler fout(m_filePath + ".marked.gz", std::ios::out|std::ios::binary, false);
|
|
m_lm->save(&fout);
|
|
fout.close();
|
|
delete m_lm;
|
|
}
|
|
void CleanUpAfterSentenceProcessing() {
|
|
m_lm->clearCache(); // clear caches
|
|
}
|
|
|
|
bool UpdateORLM(const std::vector<string>& ngram, const int value);
|
|
protected:
|
|
OnlineRLM<T>* m_lm;
|
|
//MultiOnlineRLM<T>* m_lm;
|
|
wordID_t m_oov_id;
|
|
std::vector<wordID_t> lm_ids_vec_;
|
|
void CreateFactors();
|
|
wordID_t GetLmID(const std::string &str) const;
|
|
wordID_t GetLmID(const Factor *factor) const;
|
|
};
|
|
} // end namespace
|
|
|