/*********************************************************************** Moses - factored phrase-based language decoder Copyright (C) 2006 University of Edinburgh This library is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. This library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with this library; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA ***********************************************************************/ #ifndef moses_PhraseDictionaryMultiModel_h #define moses_PhraseDictionaryMultiModel_h #include "moses/TranslationModel/PhraseDictionary.h" #include #include #include "moses/StaticData.h" #include "moses/TargetPhrase.h" #include "moses/Util.h" #include "moses/UserMessage.h" #ifdef WITH_DLIB #include #endif namespace Moses { struct multiModelStatistics { TargetPhrase *targetPhrase; std::vector > p; ~multiModelStatistics() { delete targetPhrase; }; }; struct multiModelStatisticsOptimization: multiModelStatistics { size_t f; }; class OptimizationObjective; /** Implementation of a virtual phrase table constructed from multiple component phrase tables. */ class PhraseDictionaryMultiModel: public PhraseDictionary { #ifdef WITH_DLIB friend class CrossEntropy; #endif public: PhraseDictionaryMultiModel(const std::string &line); PhraseDictionaryMultiModel(int type, const std::string &line); ~PhraseDictionaryMultiModel(); void Load(); virtual void CollectSufficientStatistics(const Phrase& src, std::map* allStats) const; virtual TargetPhraseCollection* CreateTargetPhraseCollectionLinearInterpolation(const Phrase& src, std::map* allStats, std::vector > &multimodelweights) const; std::vector > getWeights(size_t numWeights, bool normalize) const; std::vector normalizeWeights(std::vector &weights) const; void CacheForCleanup(TargetPhraseCollection* tpc); void CleanUpAfterSentenceProcessing(const InputType &source); virtual void CleanUpComponentModels(const InputType &source); #ifdef WITH_DLIB virtual std::vector MinimizePerplexity(std::vector > &phrase_pair_vector); std::vector Optimize(OptimizationObjective * ObjectiveFunction, size_t numModels); #endif // functions below required by base class virtual const TargetPhraseCollection* GetTargetPhraseCollectionLEGACY(const Phrase& src) const; virtual void InitializeForInput(InputType const&) { /* Don't do anything source specific here as this object is shared between threads.*/ } ChartRuleLookupManager *CreateRuleLookupManager(const ChartParser &, const ChartCellCollectionBase&); void SetParameter(const std::string& key, const std::string& value); const std::vector* GetTemporaryMultiModelWeightsVector() const; void SetTemporaryMultiModelWeightsVector(std::vector weights); protected: std::string m_mode; std::vector m_pdStr; std::vector m_pd; size_t m_numModels; std::vector m_multimodelweights; typedef std::vector PhraseCache; #ifdef WITH_THREADS boost::shared_mutex m_lock_cache; typedef std::map SentenceCache; #else typedef PhraseCache SentenceCache; #endif SentenceCache m_sentenceCache; PhraseCache& GetPhraseCache() { #ifdef WITH_THREADS { // first try read-only lock boost::shared_lock read_lock(m_lock_cache); SentenceCache::iterator i = m_sentenceCache.find(boost::this_thread::get_id()); if (i != m_sentenceCache.end()) return i->second; } boost::unique_lock lock(m_lock_cache); return m_sentenceCache[boost::this_thread::get_id()]; #else return m_sentenceCache; #endif } #ifdef WITH_THREADS //reader-writer lock mutable boost::shared_mutex m_lock_weights; std::map > m_multimodelweights_tmp; #else std::vector m_multimodelweights_tmp; #endif }; #ifdef WITH_DLIB class OptimizationObjective { public: virtual double operator() ( const dlib::matrix& arg) const = 0; }; class CrossEntropy: public OptimizationObjective { public: CrossEntropy ( std::vector &optimizerStats, PhraseDictionaryMultiModel * model, size_t iFeature ) { m_optimizerStats = optimizerStats; m_model = model; m_iFeature = iFeature; } double operator() ( const dlib::matrix& arg) const; protected: std::vector m_optimizerStats; PhraseDictionaryMultiModel * m_model; size_t m_iFeature; }; #endif PhraseDictionary *FindPhraseDictionary(const std::string &ptName); } // end namespace #endif