mosesdecoder/phrase-extract/postprocess-egret-forests/ForestWriter.h
Phil Williams 9e88f794e6 Add phrase-extract/postprocess-egret-forests
This performs some minor transformations to Egret forests: escaping of
Moses special characters; removal of "^g" suffixes from constituent labels;
and marking of slash/hyphen split points (using @ characters).
2015-03-10 13:51:30 +00:00

37 lines
733 B
C++

#pragma once
#include <ostream>
#include <string>
#include "Forest.h"
#include "Options.h"
namespace MosesTraining
{
namespace Syntax
{
namespace PostprocessEgretForests
{
class ForestWriter
{
public:
ForestWriter(const Options &options, std::ostream &out)
: m_options(options), m_out(out) {}
void Write(const std::string &, const Forest &, std::size_t);
private:
std::string Escape(const std::string &) const;
std::string PossiblyEscape(const std::string &) const;
void WriteHyperedgeLine(const Forest::Hyperedge &);
void WriteVertex(const Forest::Vertex &);
const Options &m_options;
std::ostream &m_out;
};
} // namespace PostprocessEgretForests
} // namespace Syntax
} // namespace MosesTraining