commiting a script by Loic Barrault to display moses search graph

(-output-search-graph) using graphviz dot


git-svn-id: https://mosesdecoder.svn.sourceforge.net/svnroot/mosesdecoder/trunk@2672 1f5c12ca-751b-0410-a591-d2e778427230
This commit is contained in:
bojar 2010-01-26 17:01:12 +00:00
parent def35604af
commit 536c7bdbcc

101
scripts/analysis/sg2dot.pl Executable file
View File

@ -0,0 +1,101 @@
#!/usr/bin/perl -w
#
# Author : Loic BARRAULT
# Script to convert MOSES searchgraph to DOT format
#
use strict;
use File::Path;
use File::Basename;
use File::Copy;
if ($#ARGV+1 != 1)
{
print "\n\n INPUT:";
print "\n 1) Search graph file ";
print "\n";
exit(-1);
}
my $searchgraph = $ARGV[0];
print STDERR "searchgraph = $searchgraph\n";
my %stacks = ();
$stacks{0}{0} = 0;
print STDOUT "digraph searchgraph\n{\nrankdir=LR\n";
my($line, $cpt, $from, $to, $label, $recombined, $transition, $o, $stack, $state);
$cpt = 0;
open(LISTFD, "<$searchgraph") or die "Cannot read input file $searchgraph, Erreur: $!\n";
$line=<LISTFD>; #skip first line ...
while(($line=<LISTFD>) )
{
$from = "";
$to = "";
$label = "";
$recombined = "";
chomp($line);
#print STDERR "$line\n";
#Three kinds of lines in searchgraph
#0 hyp=0 stack=0 forward=1 fscore=-205.192
#0 hyp=5 stack=1 back=0 score=-0.53862 transition=-0.53862 forward=181 fscore=-205.36 covered=0-0 out=I am , pC=-0.401291, c=-0.98555
#256 hyp=6566 stack=2 back=23 score=-2.15644 transition=-0.921959 recombined=6302 forward=15519 fscore=-112.807 covered=2-2 out=countries , , pC=-0.640574, c=-1.07215
if($line =~ /hyp=(\d+).+stack=(\d+).+back=(\d+).+transition=([^ ]*).+recombined=(\d+).+out=(.*), pC/)
{
#print STDERR "hyp=$1, stack=$2, from=$3, transition=$4, recombined=$5, out=$6\n";
$to = $1;
$stack = $2;
$from = $3;
$transition=$4;
$recombined = $5;
$o = $6;
$label = "[color=blue label=";
$to = $recombined;
$stacks{$stack}{$recombined} = $recombined;
#$stack++;
#$stacks{$stack}{$recombined} = $recombined;
}
elsif($line =~ /hyp=(\d+).+stack=(\d+).+back=(\d+).+transition=([^ ]*).+out=(.*), pC/)
{
#print STDERR "hyp=$1, stack=$2, from=$3, transition=$4, out=$5\n";
$to = $1;
$stack = $2;
$from = $3;
$transition=$4;
$o = $5;
$label = "[label=";
$stacks{$stack}{$to} = $to;
#$stack++;
#$stacks{$stack}{$to} = $to;
}
else{ print STDERR "Bad file format ..."; exit(); }
$o =~ s/\"/\\"/g ;
#print STDERR "out = $o after regexp\n";
$label .= "\"$o p=$transition\"]\n";
#$label .= " p=$transition\"]\n";
print STDOUT "$from -> $to $label";
$cpt++;
}
foreach $stack (sort (keys(%stacks)))
{
print STDOUT "{ rank=same; ";
foreach $state (sort keys %{ $stacks{$stack} } )
{
print STDOUT "$stacks{$stack}{$state} ";
}
print STDOUT "}\n";
}
print STDOUT "\n}\n";