mirror of
https://github.com/marian-nmt/marian.git
synced 2024-12-03 03:54:56 +03:00
104 lines
2.3 KiB
Perl
Executable File
104 lines
2.3 KiB
Perl
Executable File
#!/usr/bin/env perl
|
|
|
|
use strict;
|
|
use Getopt::Long;
|
|
use File::Temp qw(tempfile);
|
|
use POSIX;
|
|
|
|
$File::Temp::KEEP_ALL = 1;
|
|
|
|
my $PID = $$;
|
|
$SIG{TERM} = $SIG{INT} = $SIG{QUIT} = sub { die; };
|
|
|
|
my $RESCORER;
|
|
my $INPUT;
|
|
my $NBEST;
|
|
my $WEIGHTS;
|
|
|
|
my @MODELS;
|
|
my ($VSRC, $VTRG);
|
|
my @FEATURES;
|
|
|
|
GetOptions(
|
|
"i|input=s" => \$INPUT,
|
|
"n|n-best=s" => \$NBEST,
|
|
"f|features=s" => \@FEATURES,
|
|
"m|models=s" => \@MODELS,
|
|
"s|source=s" => \$VSRC,
|
|
"t|target=s" => \$VTRG,
|
|
"r|rescorer=s" => \$RESCORER,
|
|
"w|weights=s" => \$WEIGHTS
|
|
);
|
|
|
|
my $BEFORE = "LM1=";
|
|
open(W, "<", $WEIGHTS) or die "Could not open";
|
|
chomp(my $FIRST = <W>);
|
|
($BEFORE) = split(/\s/, $FIRST);
|
|
while (<W>) {
|
|
my ($CURRENT) = split(/\s/, $_);
|
|
print STDERR "$CURRENT\n";
|
|
if ($CURRENT eq "$FEATURES[0]=") {
|
|
print STDERR "Found $FEATURES[0] after $BEFORE\n";
|
|
last;
|
|
}
|
|
$BEFORE = $CURRENT;
|
|
}
|
|
close(W);
|
|
|
|
my $PATTERN1 = join(" ", map { "\\b$_= \\S+" } @FEATURES);
|
|
my $PATTERN2 = "\\b$BEFORE \\S+";
|
|
|
|
print STDERR $PATTERN1, "\n";
|
|
print STDERR $PATTERN2, "\n";
|
|
|
|
my ($NBEST_TEMP_HANDLE, $NBEST_TEMP_FILE1) = tempfile();
|
|
my (undef, $NBEST_TEMP_FILE2) = tempfile();
|
|
open(NBEST_IN, "<", $NBEST) or die "Could not open";
|
|
while (<NBEST_IN>) {
|
|
chomp;
|
|
foreach my $name (@FEATURES) {
|
|
s/$name= \S+ //g;
|
|
}
|
|
print $NBEST_TEMP_HANDLE $_, "\n";
|
|
}
|
|
close(NBEST_IN);
|
|
close($NBEST_TEMP_HANDLE);
|
|
|
|
foreach my $i (0 .. $#MODELS) {
|
|
execute("$RESCORER -i $INPUT -m $MODELS[$i] -s $VSRC -t $VTRG -f $FEATURES[$i] -n $NBEST_TEMP_FILE1 > $NBEST_TEMP_FILE2");
|
|
rename($NBEST_TEMP_FILE2, $NBEST_TEMP_FILE1);
|
|
}
|
|
|
|
open($NBEST_TEMP_HANDLE, "<", $NBEST_TEMP_FILE1) or die "Could not open";
|
|
|
|
while (<$NBEST_TEMP_HANDLE>) {
|
|
chomp;
|
|
if (/$PATTERN2/) {
|
|
if(s/($PATTERN1)//) {
|
|
my $FEAT = $1;
|
|
s/($PATTERN2 )/$1$FEAT /;
|
|
}
|
|
}
|
|
print "$_\n";
|
|
}
|
|
|
|
sub execute {
|
|
my $command = shift;
|
|
logMessage("Executing:\t$command");
|
|
my $ret = system($command);
|
|
if($ret != 0) {
|
|
logMessage("Command '$command' finished with return status $ret");
|
|
logMessage("Aborting and killing parent process");
|
|
kill(2, $PID);
|
|
die;
|
|
}
|
|
}
|
|
|
|
sub logMessage {
|
|
my $message = shift;
|
|
my $time = POSIX::strftime("%m/%d/%Y %H:%M:%S", localtime());
|
|
my $log_message = $time."\t$message\n";
|
|
print STDERR $log_message;
|
|
}
|
|
|