2008-06-11 14:52:57 +04:00
|
|
|
// $Id$
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
Moses - factored phrase-based language decoder
|
|
|
|
Copyright (C) 2006 University of Edinburgh
|
|
|
|
|
|
|
|
This library is free software; you can redistribute it and/or
|
|
|
|
modify it under the terms of the GNU Lesser General Public
|
|
|
|
License as published by the Free Software Foundation; either
|
|
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
|
|
|
|
This library is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
Lesser General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
|
|
License along with this library; if not, write to the Free Software
|
|
|
|
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
|
|
***********************************************************************/
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include <iostream>
|
|
|
|
#include <map>
|
|
|
|
#include <list>
|
|
|
|
#include <vector>
|
|
|
|
#include <string>
|
2009-08-07 20:47:54 +04:00
|
|
|
|
|
|
|
#ifdef WITH_THREADS
|
|
|
|
#include <boost/thread/tss.hpp>
|
|
|
|
#endif
|
|
|
|
|
2008-06-11 14:52:57 +04:00
|
|
|
#include "Phrase.h"
|
|
|
|
#include "TargetPhrase.h"
|
|
|
|
#include "Dictionary.h"
|
|
|
|
#include "TargetPhraseCollection.h"
|
2009-02-06 18:43:06 +03:00
|
|
|
#include "FeatureFunction.h"
|
2008-06-11 14:52:57 +04:00
|
|
|
|
2008-10-09 03:51:26 +04:00
|
|
|
namespace Moses
|
|
|
|
{
|
|
|
|
|
2008-06-11 14:52:57 +04:00
|
|
|
class StaticData;
|
|
|
|
class InputType;
|
|
|
|
class WordsRange;
|
|
|
|
|
2009-08-07 20:47:54 +04:00
|
|
|
class PhraseDictionaryFeature;
|
|
|
|
/**
|
|
|
|
* Abstract base class for phrase dictionaries (tables).
|
|
|
|
**/
|
|
|
|
class PhraseDictionary: public Dictionary {
|
|
|
|
public:
|
|
|
|
PhraseDictionary(size_t numScoreComponent, const PhraseDictionaryFeature* feature):
|
|
|
|
Dictionary(numScoreComponent), m_tableLimit(0), m_feature(feature) {}
|
|
|
|
//! table limit number.
|
|
|
|
size_t GetTableLimit() const { return m_tableLimit; }
|
|
|
|
DecodeType GetDecodeType() const { return Translate; }
|
|
|
|
const PhraseDictionaryFeature* GetFeature() const;
|
|
|
|
/** set/change translation weights and recalc weighted score for each translation.
|
|
|
|
* TODO This may be redundant now we use ScoreCollection
|
|
|
|
*/
|
|
|
|
virtual void SetWeightTransModel(const std::vector<float> &weightT)=0;
|
|
|
|
|
|
|
|
//! find list of translations that can translates src. Only for phrase input
|
|
|
|
virtual const TargetPhraseCollection *GetTargetPhraseCollection(const Phrase& src) const=0;
|
|
|
|
//! find list of translations that can translates a portion of src. Used by confusion network decoding
|
|
|
|
virtual const TargetPhraseCollection *GetTargetPhraseCollection(InputType const& src,WordsRange const& range) const;
|
|
|
|
//! Create entry for translation of source to targetPhrase
|
|
|
|
virtual void AddEquivPhrase(const Phrase &source, const TargetPhrase &targetPhrase)=0;
|
|
|
|
virtual void InitializeForInput(InputType const& source) = 0;
|
|
|
|
|
|
|
|
|
|
|
|
protected:
|
|
|
|
size_t m_tableLimit;
|
|
|
|
const PhraseDictionaryFeature* m_feature;
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Represents a feature derived from a phrase table.
|
|
|
|
*/
|
|
|
|
class PhraseDictionaryFeature : public StatelessFeatureFunction
|
2008-06-11 14:52:57 +04:00
|
|
|
{
|
2009-08-07 20:47:54 +04:00
|
|
|
|
2008-06-11 14:52:57 +04:00
|
|
|
|
|
|
|
public:
|
2009-08-07 20:47:54 +04:00
|
|
|
PhraseDictionaryFeature( size_t numScoreComponent
|
|
|
|
, unsigned numInputScores
|
|
|
|
, const std::vector<FactorType> &input
|
|
|
|
, const std::vector<FactorType> &output
|
|
|
|
, const std::string &filePath
|
|
|
|
, const std::vector<float> &weight
|
|
|
|
, size_t tableLimit);
|
|
|
|
|
|
|
|
virtual ~PhraseDictionaryFeature();
|
2008-06-11 14:52:57 +04:00
|
|
|
|
2009-08-07 20:47:54 +04:00
|
|
|
virtual bool ComputeValueInTranslationOption() const;
|
2009-02-06 18:43:06 +03:00
|
|
|
|
2008-06-11 14:52:57 +04:00
|
|
|
std::string GetScoreProducerDescription() const;
|
2009-05-26 23:30:35 +04:00
|
|
|
std::string GetScoreProducerWeightShortName() const
|
|
|
|
{
|
|
|
|
return "tm";
|
|
|
|
}
|
2008-06-11 14:52:57 +04:00
|
|
|
size_t GetNumScoreComponents() const;
|
|
|
|
|
2009-02-06 18:43:06 +03:00
|
|
|
size_t GetNumInputScores() const;
|
|
|
|
|
2009-08-07 20:47:54 +04:00
|
|
|
PhraseDictionary* GetDictionary(const InputType& source);
|
|
|
|
|
|
|
|
private:
|
|
|
|
size_t m_numScoreComponent;
|
|
|
|
unsigned m_numInputScores;
|
|
|
|
std::vector<FactorType> m_input;
|
|
|
|
std::vector<FactorType> m_output;
|
|
|
|
std::string m_filePath;
|
|
|
|
std::vector<float> m_weight;
|
|
|
|
size_t m_tableLimit;
|
|
|
|
//Only instantiate one of these
|
|
|
|
std::auto_ptr<PhraseDictionary> m_memoryDictionary;
|
|
|
|
#ifdef WITH_THREADS
|
|
|
|
boost::thread_specific_ptr<PhraseDictionary> m_treeDictionary;
|
|
|
|
#else
|
|
|
|
std::auto_ptr<PhraseDictionary> m_treeDictionary;
|
|
|
|
#endif
|
2009-02-06 18:43:06 +03:00
|
|
|
|
2009-08-07 20:47:54 +04:00
|
|
|
};
|
2009-02-06 18:43:06 +03:00
|
|
|
|
2008-06-11 14:52:57 +04:00
|
|
|
|
2008-10-09 03:51:26 +04:00
|
|
|
|
|
|
|
}
|