mirror of
https://github.com/moses-smt/mosesdecoder.git
synced 2025-01-04 09:56:33 +03:00
import OnDisk pt
This commit is contained in:
parent
29d6824942
commit
9a089b5baa
@ -12,21 +12,11 @@
|
|||||||
#include "../Scores.h"
|
#include "../Scores.h"
|
||||||
#include "../MemPool.h"
|
#include "../MemPool.h"
|
||||||
|
|
||||||
#include "SkeletonStatelessFF.h"
|
#include "../TranslationModel/PhraseTable.h"
|
||||||
#include "SkeletonStatefulFF.h"
|
|
||||||
#include "WordPenalty.h"
|
|
||||||
#include "PhrasePenalty.h"
|
|
||||||
#include "Distortion.h"
|
|
||||||
#include "LexicalReordering/LexicalReordering.h"
|
|
||||||
#include "../TranslationModel/Memory/PhraseTableMemory.h"
|
|
||||||
#include "../TranslationModel/ProbingPT.h"
|
|
||||||
#include "../TranslationModel/UnknownWordPenalty.h"
|
#include "../TranslationModel/UnknownWordPenalty.h"
|
||||||
#include "../LM/LanguageModel.h"
|
|
||||||
//#include "../LM/LanguageModelDALM.h"
|
|
||||||
#include "../LM/KENLM.h"
|
|
||||||
#include "../SCFG/TargetPhraseImpl.h"
|
#include "../SCFG/TargetPhraseImpl.h"
|
||||||
#include "util/exception.hh"
|
|
||||||
#include "../SCFG/Word.h"
|
#include "../SCFG/Word.h"
|
||||||
|
#include "util/exception.hh"
|
||||||
|
|
||||||
using namespace std;
|
using namespace std;
|
||||||
|
|
||||||
|
@ -1,6 +1,7 @@
|
|||||||
#include "FeatureRegistry.h"
|
#include "FeatureRegistry.h"
|
||||||
|
|
||||||
#include "../TranslationModel/Memory/PhraseTableMemory.h"
|
#include "../TranslationModel/Memory/PhraseTableMemory.h"
|
||||||
|
#include "../TranslationModel/PhraseTableOnDisk.h"
|
||||||
#include "../TranslationModel/ProbingPT.h"
|
#include "../TranslationModel/ProbingPT.h"
|
||||||
#include "../TranslationModel/UnknownWordPenalty.h"
|
#include "../TranslationModel/UnknownWordPenalty.h"
|
||||||
|
|
||||||
@ -50,6 +51,7 @@ FeatureRegistry::FeatureRegistry()
|
|||||||
#define MOSES_FNAME2(name, type) Add(name, new DefaultFeatureFactory< type >());
|
#define MOSES_FNAME2(name, type) Add(name, new DefaultFeatureFactory< type >());
|
||||||
|
|
||||||
MOSES_FNAME2("PhraseDictionaryMemory", PhraseTableMemory);
|
MOSES_FNAME2("PhraseDictionaryMemory", PhraseTableMemory);
|
||||||
|
MOSES_FNAME2("PhraseDictionaryOnDisk", PhraseTableOnDisk);
|
||||||
MOSES_FNAME(ProbingPT);
|
MOSES_FNAME(ProbingPT);
|
||||||
MOSES_FNAME(UnknownWordPenalty);
|
MOSES_FNAME(UnknownWordPenalty);
|
||||||
|
|
||||||
|
@ -50,6 +50,7 @@ alias deps : ../../..//z ../../..//boost_iostreams ../../..//boost_filesystem .
|
|||||||
LM/GPULM.cpp
|
LM/GPULM.cpp
|
||||||
|
|
||||||
TranslationModel/PhraseTable.cpp
|
TranslationModel/PhraseTable.cpp
|
||||||
|
TranslationModel/PhraseTableOnDisk.cpp
|
||||||
TranslationModel/ProbingPT.cpp
|
TranslationModel/ProbingPT.cpp
|
||||||
TranslationModel/UnknownWordPenalty.cpp
|
TranslationModel/UnknownWordPenalty.cpp
|
||||||
TranslationModel/Memory/PhraseTableMemory.cpp
|
TranslationModel/Memory/PhraseTableMemory.cpp
|
||||||
|
@ -0,0 +1,239 @@
|
|||||||
|
/*
|
||||||
|
* PhraseTableOnDisk.cpp
|
||||||
|
*
|
||||||
|
* Created on: 28 Oct 2015
|
||||||
|
* Author: hieu
|
||||||
|
*/
|
||||||
|
#include <boost/foreach.hpp>
|
||||||
|
#include "PhraseTableOnDisk.h"
|
||||||
|
#include "../System.h"
|
||||||
|
#include "../Scores.h"
|
||||||
|
#include "../InputType.h"
|
||||||
|
#include "../PhraseBased/Manager.h"
|
||||||
|
#include "../PhraseBased/TargetPhraseImpl.h"
|
||||||
|
#include "../PhraseBased/InputPath.h"
|
||||||
|
#include "../PhraseBased/TargetPhrases.h"
|
||||||
|
#include "../PhraseBased/Sentence.h"
|
||||||
|
#include "../SCFG/InputPath.h"
|
||||||
|
#include "../SCFG/TargetPhraseImpl.h"
|
||||||
|
#include "../SCFG/Manager.h"
|
||||||
|
#include "../SCFG/Sentence.h"
|
||||||
|
|
||||||
|
using namespace std;
|
||||||
|
|
||||||
|
namespace Moses2
|
||||||
|
{
|
||||||
|
|
||||||
|
PhraseTableOnDisk::PhraseTableOnDisk(size_t startInd, const std::string &line) :
|
||||||
|
PhraseTable(startInd, line)
|
||||||
|
{
|
||||||
|
ReadParameters();
|
||||||
|
}
|
||||||
|
|
||||||
|
PhraseTableOnDisk::~PhraseTableOnDisk()
|
||||||
|
{
|
||||||
|
// TODO Auto-generated destructor stub
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::ProcessXML(
|
||||||
|
const Manager &mgr,
|
||||||
|
MemPool &pool,
|
||||||
|
const Sentence &sentence,
|
||||||
|
InputPaths &inputPaths) const
|
||||||
|
{
|
||||||
|
const Vector<const InputType::XMLOption*> &xmlOptions = sentence.GetXMLOptions();
|
||||||
|
BOOST_FOREACH(const InputType::XMLOption *xmlOption, xmlOptions) {
|
||||||
|
TargetPhraseImpl *target = TargetPhraseImpl::CreateFromString(pool, *this, mgr.system, xmlOption->GetTranslation());
|
||||||
|
|
||||||
|
if (xmlOption->prob) {
|
||||||
|
Scores &scores = target->GetScores();
|
||||||
|
scores.PlusEquals(mgr.system, *this, Moses2::TransformScore(xmlOption->prob));
|
||||||
|
}
|
||||||
|
|
||||||
|
InputPath *path = inputPaths.GetMatrix().GetValue(xmlOption->startPos, xmlOption->phraseSize - 1);
|
||||||
|
const SubPhrase<Moses2::Word> &source = path->subPhrase;
|
||||||
|
|
||||||
|
mgr.system.featureFunctions.EvaluateInIsolation(pool, mgr.system, source, *target);
|
||||||
|
|
||||||
|
TargetPhrases *tps = new (pool.Allocate<TargetPhrases>()) TargetPhrases(pool, 1);
|
||||||
|
|
||||||
|
tps->AddTargetPhrase(*target);
|
||||||
|
mgr.system.featureFunctions.EvaluateAfterTablePruning(pool, *tps, source);
|
||||||
|
|
||||||
|
path->AddTargetPhrases(*this, tps);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::Lookup(const Manager &mgr,
|
||||||
|
InputPathsBase &inputPaths) const
|
||||||
|
{
|
||||||
|
BOOST_FOREACH(InputPathBase *pathBase, inputPaths){
|
||||||
|
InputPath *path = static_cast<InputPath*>(pathBase);
|
||||||
|
|
||||||
|
if (SatisfyBackoff(mgr, *path)) {
|
||||||
|
const SubPhrase<Moses2::Word> &phrase = path->subPhrase;
|
||||||
|
|
||||||
|
TargetPhrases *tps = Lookup(mgr, mgr.GetPool(), *path);
|
||||||
|
path->AddTargetPhrases(*this, tps);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
TargetPhrases *PhraseTableOnDisk::Lookup(const Manager &mgr, MemPool &pool,
|
||||||
|
InputPath &inputPath) const
|
||||||
|
{
|
||||||
|
const System &system = mgr.system;
|
||||||
|
TargetPhrases *tps = NULL;
|
||||||
|
|
||||||
|
// any other pt translate this?
|
||||||
|
size_t numPt = mgr.system.mappings.size();
|
||||||
|
const TargetPhrases **allTPS =
|
||||||
|
static_cast<InputPath&>(inputPath).targetPhrases;
|
||||||
|
for (size_t i = 0; i < numPt; ++i) {
|
||||||
|
const TargetPhrases *otherTps = allTPS[i];
|
||||||
|
|
||||||
|
if (otherTps && otherTps->GetSize()) {
|
||||||
|
return tps;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
const SubPhrase<Moses2::Word> &source = inputPath.subPhrase;
|
||||||
|
const Moses2::Word &sourceWord = source[0];
|
||||||
|
const Factor *factor = sourceWord[0];
|
||||||
|
|
||||||
|
tps = new (pool.Allocate<TargetPhrases>()) TargetPhrases(pool, 1);
|
||||||
|
|
||||||
|
TargetPhraseImpl *target =
|
||||||
|
new (pool.Allocate<TargetPhraseImpl>()) TargetPhraseImpl(pool, *this,
|
||||||
|
system, 1);
|
||||||
|
Moses2::Word &word = (*target)[0];
|
||||||
|
|
||||||
|
//FactorCollection &fc = system.vocab;
|
||||||
|
//const Factor *factor = fc.AddFactor("SSS", false);
|
||||||
|
word[0] = factor;
|
||||||
|
|
||||||
|
Scores &scores = target->GetScores();
|
||||||
|
scores.PlusEquals(mgr.system, *this, -100);
|
||||||
|
|
||||||
|
MemPool &memPool = mgr.GetPool();
|
||||||
|
system.featureFunctions.EvaluateInIsolation(memPool, system, source, *target);
|
||||||
|
|
||||||
|
tps->AddTargetPhrase(*target);
|
||||||
|
system.featureFunctions.EvaluateAfterTablePruning(memPool, *tps, source);
|
||||||
|
|
||||||
|
return tps;
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::EvaluateInIsolation(const System &system,
|
||||||
|
const Phrase<Moses2::Word> &source, const TargetPhrase<Moses2::Word> &targetPhrase, Scores &scores,
|
||||||
|
SCORE *estimatedScore) const
|
||||||
|
{
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::InitActiveChart(
|
||||||
|
MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
SCFG::InputPath &path) const
|
||||||
|
{
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::Lookup(MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
size_t maxChartSpan,
|
||||||
|
const SCFG::Stacks &stacks,
|
||||||
|
SCFG::InputPath &path) const
|
||||||
|
{
|
||||||
|
const System &system = mgr.system;
|
||||||
|
|
||||||
|
size_t numWords = path.range.GetNumWordsCovered();
|
||||||
|
if (numWords > 1) {
|
||||||
|
// only create 1 word phrases
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (path.GetNumRules()) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
// don't do 1st of last word
|
||||||
|
if (path.range.GetStartPos() == 0) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
const SCFG::Sentence &sentence = static_cast<const SCFG::Sentence&>(mgr.GetInput());
|
||||||
|
if (path.range.GetStartPos() + 1 == sentence.GetSize()) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
// terminal
|
||||||
|
const SCFG::Word &lastWord = path.subPhrase.Back();
|
||||||
|
//cerr << "PhraseTableOnDisk lastWord=" << lastWord << endl;
|
||||||
|
|
||||||
|
const Factor *factor = lastWord[0];
|
||||||
|
SCFG::TargetPhraseImpl *tp = new (pool.Allocate<SCFG::TargetPhraseImpl>()) SCFG::TargetPhraseImpl(pool, *this, system, 1);
|
||||||
|
SCFG::Word &word = (*tp)[0];
|
||||||
|
word.CreateFromString(system.GetVocab(), system, factor->GetString().as_string());
|
||||||
|
|
||||||
|
tp->lhs.CreateFromString(system.GetVocab(), system, "[X]");
|
||||||
|
|
||||||
|
size_t endPos = path.range.GetEndPos();
|
||||||
|
const SCFG::InputPath &subPhrasePath = *mgr.GetInputPaths().GetMatrix().GetValue(endPos, 1);
|
||||||
|
|
||||||
|
SCFG::SymbolBind symbolBind(pool);
|
||||||
|
symbolBind.Add(subPhrasePath.range, lastWord, NULL);
|
||||||
|
|
||||||
|
Scores &scores = tp->GetScores();
|
||||||
|
scores.PlusEquals(mgr.system, *this, -100);
|
||||||
|
|
||||||
|
MemPool &memPool = mgr.GetPool();
|
||||||
|
const SubPhrase<SCFG::Word> &source = path.subPhrase;
|
||||||
|
system.featureFunctions.EvaluateInIsolation(memPool, system, source, *tp);
|
||||||
|
|
||||||
|
path.AddTargetPhrase(pool, *this, symbolBind, tp);
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::LookupUnary(MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
const SCFG::Stacks &stacks,
|
||||||
|
SCFG::InputPath &path) const
|
||||||
|
{
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::LookupNT(
|
||||||
|
MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
const Moses2::Range &subPhraseRange,
|
||||||
|
const SCFG::InputPath &prevPath,
|
||||||
|
const SCFG::Stacks &stacks,
|
||||||
|
SCFG::InputPath &outPath) const
|
||||||
|
{
|
||||||
|
UTIL_THROW2("Not implemented");
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::LookupGivenWord(
|
||||||
|
MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
const SCFG::InputPath &prevPath,
|
||||||
|
const SCFG::Word &wordSought,
|
||||||
|
const Moses2::Hypotheses *hypos,
|
||||||
|
const Moses2::Range &subPhraseRange,
|
||||||
|
SCFG::InputPath &outPath) const
|
||||||
|
{
|
||||||
|
UTIL_THROW2("Not implemented");
|
||||||
|
}
|
||||||
|
|
||||||
|
void PhraseTableOnDisk::LookupGivenNode(
|
||||||
|
MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
const SCFG::ActiveChartEntry &prevEntry,
|
||||||
|
const SCFG::Word &wordSought,
|
||||||
|
const Moses2::Hypotheses *hypos,
|
||||||
|
const Moses2::Range &subPhraseRange,
|
||||||
|
SCFG::InputPath &outPath) const
|
||||||
|
{
|
||||||
|
UTIL_THROW2("Not implemented");
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
@ -0,0 +1,84 @@
|
|||||||
|
/*
|
||||||
|
* UnknownWordPenalty.h
|
||||||
|
*
|
||||||
|
* Created on: 28 Oct 2015
|
||||||
|
* Author: hieu
|
||||||
|
*/
|
||||||
|
|
||||||
|
#pragma once
|
||||||
|
|
||||||
|
#include "PhraseTable.h"
|
||||||
|
|
||||||
|
namespace Moses2
|
||||||
|
{
|
||||||
|
class Sentence;
|
||||||
|
class InputPaths;
|
||||||
|
class Range;
|
||||||
|
|
||||||
|
class PhraseTableOnDisk : public PhraseTable
|
||||||
|
{
|
||||||
|
public:
|
||||||
|
PhraseTableOnDisk(size_t startInd, const std::string &line);
|
||||||
|
virtual ~PhraseTableOnDisk();
|
||||||
|
|
||||||
|
void Lookup(const Manager &mgr, InputPathsBase &inputPaths) const;
|
||||||
|
virtual TargetPhrases *Lookup(const Manager &mgr, MemPool &pool,
|
||||||
|
InputPath &inputPath) const;
|
||||||
|
|
||||||
|
void ProcessXML(
|
||||||
|
const Manager &mgr,
|
||||||
|
MemPool &pool,
|
||||||
|
const Sentence &sentence,
|
||||||
|
InputPaths &inputPaths) const;
|
||||||
|
|
||||||
|
virtual void
|
||||||
|
EvaluateInIsolation(const System &system, const Phrase<Moses2::Word> &source,
|
||||||
|
const TargetPhrase<Moses2::Word> &targetPhrase, Scores &scores,
|
||||||
|
SCORE *estimatedScore) const;
|
||||||
|
|
||||||
|
virtual void InitActiveChart(
|
||||||
|
MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
SCFG::InputPath &path) const;
|
||||||
|
|
||||||
|
void Lookup(MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
size_t maxChartSpan,
|
||||||
|
const SCFG::Stacks &stacks,
|
||||||
|
SCFG::InputPath &path) const;
|
||||||
|
|
||||||
|
void LookupUnary(MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
const SCFG::Stacks &stacks,
|
||||||
|
SCFG::InputPath &path) const;
|
||||||
|
|
||||||
|
protected:
|
||||||
|
virtual void LookupNT(
|
||||||
|
MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
const Moses2::Range &subPhraseRange,
|
||||||
|
const SCFG::InputPath &prevPath,
|
||||||
|
const SCFG::Stacks &stacks,
|
||||||
|
SCFG::InputPath &outPath) const;
|
||||||
|
|
||||||
|
virtual void LookupGivenWord(
|
||||||
|
MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
const SCFG::InputPath &prevPath,
|
||||||
|
const SCFG::Word &wordSought,
|
||||||
|
const Moses2::Hypotheses *hypos,
|
||||||
|
const Moses2::Range &subPhraseRange,
|
||||||
|
SCFG::InputPath &outPath) const;
|
||||||
|
|
||||||
|
virtual void LookupGivenNode(
|
||||||
|
MemPool &pool,
|
||||||
|
const SCFG::Manager &mgr,
|
||||||
|
const SCFG::ActiveChartEntry &prevEntry,
|
||||||
|
const SCFG::Word &wordSought,
|
||||||
|
const Moses2::Hypotheses *hypos,
|
||||||
|
const Moses2::Range &subPhraseRange,
|
||||||
|
SCFG::InputPath &outPath) const;
|
||||||
|
};
|
||||||
|
|
||||||
|
}
|
||||||
|
|
Loading…
Reference in New Issue
Block a user