mirror of
https://github.com/moses-smt/mosesdecoder.git
synced 2025-01-02 17:09:36 +03:00
9e88f794e6
This performs some minor transformations to Egret forests: escaping of Moses special characters; removal of "^g" suffixes from constituent labels; and marking of slash/hyphen split points (using @ characters).
57 lines
1.6 KiB
C++
57 lines
1.6 KiB
C++
#include "TopologicalSorter.h"
|
|
|
|
namespace MosesTraining
|
|
{
|
|
namespace Syntax
|
|
{
|
|
namespace PostprocessEgretForests
|
|
{
|
|
|
|
void TopologicalSorter::Sort(const Forest &forest,
|
|
std::vector<const Forest::Vertex *> &permutation)
|
|
{
|
|
permutation.clear();
|
|
BuildPredSets(forest);
|
|
m_visited.clear();
|
|
for (std::vector<boost::shared_ptr<Forest::Vertex> >::const_iterator
|
|
p = forest.vertices.begin(); p != forest.vertices.end(); ++p) {
|
|
if (m_visited.find(p->get()) == m_visited.end()) {
|
|
Visit(**p, permutation);
|
|
}
|
|
}
|
|
}
|
|
|
|
void TopologicalSorter::BuildPredSets(const Forest &forest)
|
|
{
|
|
m_predSets.clear();
|
|
for (std::vector<boost::shared_ptr<Forest::Vertex> >::const_iterator
|
|
p = forest.vertices.begin(); p != forest.vertices.end(); ++p) {
|
|
const Forest::Vertex &head = **p;
|
|
for (std::vector<boost::shared_ptr<Forest::Hyperedge> >::const_iterator
|
|
q = head.incoming.begin(); q != head.incoming.end(); ++q) {
|
|
const Forest::Hyperedge &e = **q;
|
|
for (std::vector<Forest::Vertex *>::const_iterator
|
|
r = e.tail.begin(); r != e.tail.end(); ++r) {
|
|
m_predSets[&head].insert(*r);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// Depth-first helper for Sort.  Marks `v` as visited, recursively visits each
// not-yet-visited member of v's predecessor set, and only then appends `v` to
// `permutation`, so predecessors are emitted before `v`.
//
// `v` is marked before recursing, so a vertex that is (directly or
// indirectly) its own predecessor is not entered a second time.
void TopologicalSorter::Visit(const Forest::Vertex &v,
                              std::vector<const Forest::Vertex *> &permutation)
{
  const Forest::Vertex *current = &v;
  m_visited.insert(current);

  // operator[] creates an empty predecessor set if `v` has no entry yet.
  // NOTE(review): this reference is held while recursive calls may insert
  // further entries into m_predSets; that presumes the map keeps references
  // to existing elements valid on insertion -- confirm against the container
  // type declared in the header.
  const VertexSet &predecessors = m_predSets[current];

  for (VertexSet::const_iterator it = predecessors.begin();
       it != predecessors.end(); ++it) {
    const Forest::Vertex *pred = *it;
    if (m_visited.find(pred) != m_visited.end()) {
      continue;
    }
    Visit(*pred, permutation);
  }

  permutation.push_back(current);
}
|
|
|
|
} // namespace PostprocessEgretForests
|
|
} // namespace Syntax
|
|
} // namespace MosesTraining
|