2008-06-11 14:52:57 +04:00
|
|
|
// vim:tabstop=2
|
|
|
|
|
|
|
|
/***********************************************************************
Moses - factored phrase-based language decoder
Copyright (C) 2006 University of Edinburgh

This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.

This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.

You should have received a copy of the GNU Lesser General Public
License along with this library; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
***********************************************************************/
|
|
|
|
|
2012-11-27 19:08:31 +04:00
|
|
|
#include "moses/TranslationModel/PhraseDictionary.h"
|
|
|
|
#include "moses/TranslationModel/PhraseDictionaryTreeAdaptor.h"
|
2012-11-27 20:57:23 +04:00
|
|
|
#include "moses/TranslationModel/RuleTable/PhraseDictionarySCFG.h"
|
|
|
|
#include "moses/TranslationModel/RuleTable/PhraseDictionaryOnDisk.h"
|
|
|
|
#include "moses/TranslationModel/RuleTable/PhraseDictionaryALSuffixArray.h"
|
|
|
|
#include "moses/TranslationModel/RuleTable/PhraseDictionaryFuzzyMatch.h"
|
2012-07-18 20:59:21 +04:00
|
|
|
|
2010-04-12 17:50:11 +04:00
|
|
|
#ifndef WIN32
|
2012-11-27 19:08:31 +04:00
|
|
|
#include "moses/TranslationModel/PhraseDictionaryDynSuffixArray.h"
|
2012-11-27 22:04:01 +04:00
|
|
|
#include "moses/TranslationModel/CompactPT/PhraseDictionaryCompact.h"
|
2010-04-12 17:50:11 +04:00
|
|
|
#endif
|
2012-11-27 20:57:23 +04:00
|
|
|
#include "moses/TranslationModel/RuleTable/UTrie.h"
|
2011-11-04 19:43:42 +04:00
|
|
|
|
2012-11-27 19:08:31 +04:00
|
|
|
#include "moses/StaticData.h"
|
|
|
|
#include "moses/InputType.h"
|
|
|
|
#include "moses/TranslationOption.h"
|
|
|
|
#include "moses/UserMessage.h"
|
2008-06-11 14:52:57 +04:00
|
|
|
|
2010-08-10 17:51:20 +04:00
|
|
|
using namespace std;
|
|
|
|
|
2011-02-24 16:14:42 +03:00
|
|
|
namespace Moses
|
|
|
|
{
|
2008-06-11 14:52:57 +04:00
|
|
|
|
2013-02-22 23:17:57 +04:00
|
|
|
// Returns the value half (args[1]) of a key/value argument.
// Throws a std::string when the value is missing, matching the exception
// type this file already uses for bad arguments.
// Precondition: args is non-empty (the caller checks this first).
static const std::string &RequireArgValue(const std::vector<std::string> &args)
{
  if (args.size() < 2) {
    throw "Missing value for argument " + args[0];
  }
  return args[1];
}

/**
 * Builds a phrase dictionary from its configuration.
 *
 * `description` and `line` are forwarded unchanged to the DecodeFeature
 * base constructor. Each entry of m_args is then read as a key (args[0])
 * and a value (args[1]) and stored in the matching member:
 *
 *   input-factor        -> m_input, m_inputFactors
 *   output-factor       -> m_output, m_outputFactors
 *   num-input-features  -> m_numInputScores
 *   path                -> m_filePath
 *   table-limit         -> m_tableLimit (set to 20 before the loop)
 *   target-path         -> m_targetFile
 *   alignment-path      -> m_alignmentsFile
 *
 * NOTE(review): m_args is presumably filled by the base class while it
 * parses `line` -- confirm against DecodeFeature / FeatureFunction.
 *
 * Throws a std::string (not a std::exception subclass) when an entry is
 * empty, when a recognised key has no value, or when the key is unknown.
 */
PhraseDictionary::PhraseDictionary(const std::string &description, const std::string &line)
  :DecodeFeature(description, line)
{
  m_tableLimit= 20; // TODO default?

  for (size_t i = 0; i < m_args.size(); ++i) {
    const vector<string> &args = m_args[i];

    // Guard the args[0] read below; an empty entry has no key to report.
    if (args.empty()) {
      throw string("Empty argument in phrase dictionary configuration");
    }

    const string &key = args[0];

    if (key == "input-factor") {
      // The value is tokenized on "," into the input factor list; the
      // mask is then constructed from that list.
      m_input = Tokenize<FactorType>(RequireArgValue(args), ",");
      m_inputFactors = FactorMask(m_input);
    } else if (key == "output-factor") {
      m_output = Tokenize<FactorType>(RequireArgValue(args), ",");
      m_outputFactors = FactorMask(m_output);
    } else if (key == "num-input-features") {
      m_numInputScores = Scan<unsigned>(RequireArgValue(args));
    } else if (key == "path") {
      m_filePath = RequireArgValue(args);
    } else if (key == "table-limit") {
      m_tableLimit = Scan<size_t>(RequireArgValue(args));
    } else if (key == "target-path") {
      m_targetFile = RequireArgValue(args);
    } else if (key == "alignment-path") {
      m_alignmentsFile = RequireArgValue(args);
    } else {
      // const char* + std::string yields a std::string; callers that
      // catch this must catch std::string.
      throw "Unknown argument " + key;
    }
  } // for each entry of m_args
}
|
2013-02-21 22:06:03 +04:00
|
|
|
|
2013-02-22 23:17:57 +04:00
|
|
|
|
|
|
|
/**
 * Looks up target phrases for a span of the input.
 *
 * Takes the sub-string of `src` covered by `range`, calls
 * OnlyTheseFactors(m_inputFactors) on it (presumably restricting it to
 * this dictionary's input factors -- confirm in Phrase), and forwards the
 * resulting phrase to the Phrase-based GetTargetPhraseCollection overload.
 *
 * Returns whatever that overload returns, unchanged.
 */
const TargetPhraseCollection *
PhraseDictionary::GetTargetPhraseCollection(InputType const& src, WordsRange const& range) const
{
  // Work on a local copy so the caller's input is left untouched.
  Phrase sourceSpan(src.GetSubString(range));
  sourceSpan.OnlyTheseFactors(m_inputFactors);

  const TargetPhraseCollection *matches = GetTargetPhraseCollection(sourceSpan);
  return matches;
}
|
|
|
|
|
2008-10-09 03:51:26 +04:00
|
|
|
}
|
|
|
|
|