2012-01-26 15:38:40 +04:00
|
|
|
/***********************************************************************
Moses - statistical machine translation system
Copyright (C) 2006-2012 University of Edinburgh

This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.

This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.

You should have received a copy of the GNU Lesser General Public
License along with this library; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
***********************************************************************/
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
2012-11-12 23:56:18 +04:00
|
|
|
#include "moses/NonTerminal.h"
|
|
|
|
#include "moses/TargetPhrase.h"
|
|
|
|
#include "moses/TargetPhraseCollection.h"
|
|
|
|
#include "moses/Terminal.h"
|
|
|
|
#include "moses/Util.h"
|
|
|
|
#include "moses/Word.h"
|
|
|
|
#include "Trie.h"
|
2012-01-26 15:38:40 +04:00
|
|
|
|
|
|
|
#include <boost/functional/hash.hpp>
|
|
|
|
#include <boost/unordered_map.hpp>
|
|
|
|
#include <boost/version.hpp>
|
|
|
|
|
|
|
|
#include <map>
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
namespace Moses
|
|
|
|
{
|
|
|
|
|
|
|
|
class RuleTableUTrie;
|
|
|
|
|
2012-07-23 17:07:36 +04:00
|
|
|
//! @todo ask Phil Williams - what's the difference between this and phrasedictionaryNode?
|
2012-01-26 15:38:40 +04:00
|
|
|
class UTrieNode
|
|
|
|
{
|
2013-05-29 21:16:15 +04:00
|
|
|
public:
|
2012-01-26 15:38:40 +04:00
|
|
|
typedef std::vector<std::vector<Word> > LabelTable;
|
|
|
|
#if defined(BOOST_VERSION) && (BOOST_VERSION >= 104200)
|
|
|
|
typedef boost::unordered_map<Word,
|
2013-05-29 21:16:15 +04:00
|
|
|
UTrieNode,
|
|
|
|
TerminalHasher,
|
|
|
|
TerminalEqualityPred> TerminalMap;
|
2012-01-26 15:38:40 +04:00
|
|
|
|
|
|
|
typedef boost::unordered_map<std::vector<int>,
|
2013-05-29 21:16:15 +04:00
|
|
|
TargetPhraseCollection> LabelMap;
|
2012-01-26 15:38:40 +04:00
|
|
|
#else
|
|
|
|
typedef std::map<Word, UTrieNode> TerminalMap;
|
|
|
|
typedef std::map<std::vector<int>, TargetPhraseCollection> LabelMap;
|
|
|
|
#endif
|
|
|
|
|
2013-05-29 21:16:15 +04:00
|
|
|
~UTrieNode() {
|
|
|
|
delete m_gapNode;
|
|
|
|
}
|
2012-01-26 15:38:40 +04:00
|
|
|
|
2013-05-29 21:16:15 +04:00
|
|
|
const LabelTable &GetLabelTable() const {
|
|
|
|
return m_labelTable;
|
|
|
|
}
|
|
|
|
const LabelMap &GetLabelMap() const {
|
|
|
|
return m_labelMap;
|
|
|
|
}
|
|
|
|
const TerminalMap &GetTerminalMap() const {
|
|
|
|
return m_terminalMap;
|
|
|
|
}
|
2012-01-26 15:38:40 +04:00
|
|
|
|
2013-05-29 21:16:15 +04:00
|
|
|
const UTrieNode *GetNonTerminalChild() const {
|
|
|
|
return m_gapNode;
|
|
|
|
}
|
2012-01-26 15:38:40 +04:00
|
|
|
|
|
|
|
UTrieNode *GetOrCreateTerminalChild(const Word &sourceTerm);
|
|
|
|
UTrieNode *GetOrCreateNonTerminalChild(const Word &targetNonTerm);
|
|
|
|
|
|
|
|
TargetPhraseCollection &GetOrCreateTargetPhraseCollection(
|
2013-05-29 21:16:15 +04:00
|
|
|
const TargetPhrase &);
|
2012-01-26 15:38:40 +04:00
|
|
|
|
2013-05-29 21:16:15 +04:00
|
|
|
bool IsLeaf() const {
|
|
|
|
return m_terminalMap.empty() && m_gapNode == NULL;
|
|
|
|
}
|
2012-01-26 15:38:40 +04:00
|
|
|
|
2013-05-29 21:16:15 +04:00
|
|
|
bool HasRules() const {
|
|
|
|
return !m_labelMap.empty();
|
|
|
|
}
|
2012-01-26 15:38:40 +04:00
|
|
|
|
|
|
|
void Prune(size_t tableLimit);
|
|
|
|
void Sort(size_t tableLimit);
|
|
|
|
|
2013-05-29 21:16:15 +04:00
|
|
|
private:
|
2012-01-26 15:38:40 +04:00
|
|
|
friend class RuleTableUTrie;
|
|
|
|
|
|
|
|
UTrieNode() : m_gapNode(NULL) {}
|
|
|
|
|
2013-05-29 21:16:15 +04:00
|
|
|
int InsertLabel(int i, const Word &w) {
|
2012-01-26 15:38:40 +04:00
|
|
|
std::vector<Word> &inner = m_labelTable[i];
|
|
|
|
for (size_t j = 0; j < inner.size(); ++j) {
|
|
|
|
if (inner[j] == w) {
|
|
|
|
return j;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
inner.push_back(w);
|
|
|
|
return inner.size()-1;
|
|
|
|
}
|
|
|
|
|
|
|
|
LabelTable m_labelTable;
|
|
|
|
LabelMap m_labelMap;
|
|
|
|
TerminalMap m_terminalMap;
|
|
|
|
UTrieNode *m_gapNode;
|
|
|
|
};
|
|
|
|
|
|
|
|
} // namespace Moses
|