2010-04-12 14:15:49 +04:00
|
|
|
/***********************************************************************
|
|
|
|
Moses - factored phrase-based language decoder
|
|
|
|
Copyright (C) 2010 Hieu Hoang
|
2011-02-24 16:14:42 +03:00
|
|
|
|
2010-04-12 14:15:49 +04:00
|
|
|
This library is free software; you can redistribute it and/or
|
|
|
|
modify it under the terms of the GNU Lesser General Public
|
|
|
|
License as published by the Free Software Foundation; either
|
|
|
|
version 2.1 of the License, or (at your option) any later version.
|
2011-02-24 16:14:42 +03:00
|
|
|
|
2010-04-12 14:15:49 +04:00
|
|
|
This library is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
Lesser General Public License for more details.
|
2011-02-24 16:14:42 +03:00
|
|
|
|
2010-04-12 14:15:49 +04:00
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
|
|
License along with this library; if not, write to the Free Software
|
|
|
|
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
|
|
***********************************************************************/
|
2010-04-08 21:16:10 +04:00
|
|
|
|
2012-09-25 20:34:43 +04:00
|
|
|
#include "ChartTranslationOptions.h"
|
2012-01-25 16:26:28 +04:00
|
|
|
#include "ChartHypothesis.h"
|
2012-09-27 20:33:31 +04:00
|
|
|
#include "ChartCellLabel.h"
|
2013-08-12 22:01:06 +04:00
|
|
|
#include "ChartTranslationOption.h"
|
2013-09-22 17:09:49 +04:00
|
|
|
#include "InputPath.h"
|
|
|
|
#include "StaticData.h"
|
|
|
|
|
|
|
|
using namespace std;
|
2012-09-25 16:17:52 +04:00
|
|
|
|
2010-04-08 21:16:10 +04:00
|
|
|
namespace Moses
|
|
|
|
{
|
|
|
|
|
2013-08-09 13:27:46 +04:00
|
|
|
/** Build the set of translation options for one rule application.
 *
 * \param targetPhraseColl target phrases; one ChartTranslationOption is
 *                         constructed from each entry, in iteration order
 * \param stackVec         used to initialise m_stackVec
 * \param wordsRange       source span; only its ADDRESS is stored, so the
 *                         referenced object must outlive this instance
 * \param score            stored as the estimate of the best score
 */
ChartTranslationOptions::ChartTranslationOptions(const TargetPhraseCollection &targetPhraseColl,
    const StackVec &stackVec,
    const WordsRange &wordsRange,
    float score)
  : m_stackVec(stackVec)
  , m_wordsRange(&wordsRange)
  , m_estimateOfBestScore(score)
{
  for (TargetPhraseCollection::const_iterator it = targetPhraseColl.begin();
       it != targetPhraseColl.end(); ++it) {
    const TargetPhrase *const sourceTP = *it;

    // each option is held through a shared_ptr stored in m_collection
    m_collection.push_back(
      boost::shared_ptr<ChartTranslationOption>(new ChartTranslationOption(*sourceTP)));
  }
}
|
|
|
|
|
|
|
|
/** Nothing to release by hand: the destructor body is intentionally empty.
 *  The options in m_collection are held through boost::shared_ptr (see the
 *  constructor), so no explicit delete is performed here.
 */
ChartTranslationOptions::~ChartTranslationOptions() {}
|
|
|
|
|
2012-09-25 20:34:43 +04:00
|
|
|
float ChartTranslationOptions::CalcEstimateOfBestScore(
|
2013-05-29 21:16:15 +04:00
|
|
|
const TargetPhraseCollection &tpc,
|
|
|
|
const StackVec &stackVec)
|
2011-04-05 00:43:02 +04:00
|
|
|
{
|
2012-02-07 03:54:01 +04:00
|
|
|
const TargetPhrase &targetPhrase = **(tpc.begin());
|
|
|
|
float estimateOfBestScore = targetPhrase.GetFutureScore();
|
|
|
|
for (StackVec::const_iterator p = stackVec.begin(); p != stackVec.end();
|
2012-01-25 16:26:28 +04:00
|
|
|
++p) {
|
2012-10-08 00:48:15 +04:00
|
|
|
const HypoList *stack = (*p)->GetStack().cube;
|
2012-01-25 16:26:28 +04:00
|
|
|
assert(stack);
|
|
|
|
assert(!stack->empty());
|
|
|
|
const ChartHypothesis &bestHypo = **(stack->begin());
|
2012-02-07 03:54:01 +04:00
|
|
|
estimateOfBestScore += bestHypo.GetTotalScore();
|
2011-04-05 00:43:02 +04:00
|
|
|
}
|
2012-02-07 03:54:01 +04:00
|
|
|
return estimateOfBestScore;
|
2011-04-05 00:43:02 +04:00
|
|
|
}
|
|
|
|
|
2013-08-13 15:16:55 +04:00
|
|
|
void ChartTranslationOptions::Evaluate(const InputType &input, const InputPath &inputPath)
|
2013-08-13 15:12:58 +04:00
|
|
|
{
|
2013-09-22 18:15:00 +04:00
|
|
|
SetInputPath(&inputPath);
|
|
|
|
if (StaticData::Instance().GetPlaceholderFactor() != NOT_FOUND) {
|
2013-09-27 12:35:24 +04:00
|
|
|
CreateSourceRuleFromInputPath();
|
2013-09-22 18:15:00 +04:00
|
|
|
}
|
|
|
|
|
2013-08-13 15:12:58 +04:00
|
|
|
CollType::iterator iter;
|
|
|
|
for (iter = m_collection.begin(); iter != m_collection.end(); ++iter) {
|
2013-08-16 00:14:04 +04:00
|
|
|
ChartTranslationOption &transOpt = **iter;
|
2013-09-12 21:50:09 +04:00
|
|
|
transOpt.SetInputPath(&inputPath);
|
2013-08-16 00:14:04 +04:00
|
|
|
transOpt.Evaluate(input, inputPath);
|
2013-08-13 15:12:58 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2013-09-22 18:15:00 +04:00
|
|
|
void ChartTranslationOptions::SetInputPath(const InputPath *inputPath)
|
|
|
|
{
|
|
|
|
CollType::iterator iter;
|
|
|
|
for (iter = m_collection.begin(); iter != m_collection.end(); ++iter) {
|
2013-09-27 12:35:24 +04:00
|
|
|
ChartTranslationOption &transOpt = **iter;
|
|
|
|
transOpt.SetInputPath(inputPath);
|
2013-09-22 18:15:00 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void ChartTranslationOptions::CreateSourceRuleFromInputPath()
|
|
|
|
{
|
2013-09-27 12:35:24 +04:00
|
|
|
if (m_collection.size() == 0) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
const InputPath *inputPath = m_collection.front()->GetInputPath();
|
|
|
|
CHECK(inputPath);
|
|
|
|
std::vector<const Word*> &ruleSourceFromInputPath = inputPath->AddRuleSourceFromInputPath();
|
|
|
|
|
|
|
|
size_t chartCellIndex = 0;
|
|
|
|
const ChartCellLabel *chartCellLabel = (chartCellIndex < m_stackVec.size()) ? m_stackVec[chartCellIndex] : NULL;
|
|
|
|
|
|
|
|
size_t ind = 0;
|
|
|
|
for (size_t sourcePos = m_wordsRange->GetStartPos(); sourcePos <= m_wordsRange->GetEndPos(); ++sourcePos, ++ind) {
|
|
|
|
if (chartCellLabel) {
|
|
|
|
if (sourcePos == chartCellLabel->GetCoverage().GetEndPos()) {
|
|
|
|
// end of child range. push an empty word to denote non-term
|
|
|
|
ruleSourceFromInputPath.push_back(NULL);
|
|
|
|
++chartCellIndex;
|
|
|
|
chartCellLabel = (chartCellIndex < m_stackVec.size()) ? m_stackVec[chartCellIndex] : NULL;
|
|
|
|
} else if (sourcePos >= chartCellLabel->GetCoverage().GetStartPos()) {
|
|
|
|
// in the range of child hypo. do nothing
|
|
|
|
} else {
|
|
|
|
// not yet reached child range. add word
|
|
|
|
ruleSourceFromInputPath.push_back(&inputPath->GetPhrase().GetWord(ind));
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// no child in sight. add word
|
|
|
|
ruleSourceFromInputPath.push_back(&inputPath->GetPhrase().GetWord(ind));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// save it to each trans opt
|
2013-09-22 18:15:00 +04:00
|
|
|
CollType::iterator iter;
|
|
|
|
for (iter = m_collection.begin(); iter != m_collection.end(); ++iter) {
|
2013-09-27 12:35:24 +04:00
|
|
|
ChartTranslationOption &transOpt = **iter;
|
|
|
|
transOpt.SetSourceRuleFromInputPath(&ruleSourceFromInputPath);
|
2013-09-22 18:15:00 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2010-04-08 21:16:10 +04:00
|
|
|
}
|