2006-08-01 00:13:25 +04:00
|
|
|
#!/usr/bin/perl
|
2007-03-15 01:22:36 +03:00
|
|
|
|
|
|
|
# $Id$
|
2007-05-09 04:54:07 +04:00
|
|
|
# given a moses.ini file, creates a fresh version of it
|
2006-08-01 00:13:25 +04:00
|
|
|
# in the current directory
|
2007-05-09 04:54:07 +04:00
|
|
|
# All relevant files are hardlinked or copied to the directory, too.
|
2006-08-01 00:13:25 +04:00
|
|
|
|
2006-08-08 03:04:33 +04:00
|
|
|
use strict;
|
|
|
|
use Getopt::Long;
|
|
|
|
|
|
|
|
# --- Command-line options --------------------------------------------------

# --fixpath 'SRC TGT' (repeatable): search-replace pattern to fix paths.
# A space delimits the source and target pathnames. SRC is used as a regular
# expression by fixpath().
my @fixpath = ();

# --symlink: prefer symlink over hardlink, but revert to hardlink or copy
# if symlink fails
my $symlink = 0;

# Stop on unknown or malformed options instead of silently continuing with
# defaults (GetOptions only warns and returns false in that case).
GetOptions(
  "fixpath=s" => \@fixpath,
  "symlink"=>\$symlink,
) or die "usage: clone_moses_model.pl [--symlink] [--fixpath='SRC TGT'] /a/source/moses.ini";

# Parsed --fixpath values: a list of [ source, target ] pairs.
my @fixrepls = map {
  my ($fixsrc, $fixtgt) = split / /, $_;
  # Without a delimiter the target would be undef, and an empty source
  # pattern would make s/// reuse the last successful match pattern.
  die "Bad --fixpath value >$_<: expected 'SOURCE TARGET' delimited by a space"
    if !/ / || !defined $fixsrc || $fixsrc eq "";
  # "SRC " (trailing space) means: replace SRC with nothing.
  $fixtgt = "" if !defined $fixtgt;
  print STDERR "Will replace >$fixsrc< with >$fixtgt<\n";
  [ $fixsrc, $fixtgt ];
} @fixpath;
|
|
|
|
|
2006-08-01 00:13:25 +04:00
|
|
|
# --- Main ------------------------------------------------------------------
# Read the source moses.ini line by line and write ./moses.ini. Every model
# file referenced in a known section is cloned into the current directory as
# ./<section>.<counter>[.gz] and the reference is rewritten to that name.
# All other lines are copied through unchanged.

my $ini = shift;
die "usage: clone_moses_model.pl /a/source/moses.ini" if !defined $ini;

die "./moses.ini exists, will not overwrite" if -e "moses.ini";

my %cnt; # count files per section

# For each section that lists model files: the number of space-delimited
# fields that precede the filename on an entry line.
my %fields_before_filename = (
  "ttable-file"     => 4,
  "generation-file" => 3,
  "lmodel-file"     => 3,
  "distortion-file" => 3,
);

# Three-argument open so that special characters in $ini cannot be
# interpreted as an open mode.
open(my $ini_fh, '<', $ini) or die "Can't read $ini: $!";
open(my $out_fh, '>', "moses.ini") or die "Can't write ./moses.ini: $!";

my $section = undef;
while (my $line = <$ini_fh>) {
  # a "[name]" line starts a new section
  if ($line =~ /^\[([^\]]*)\]\s*$/) {
    $section = $1;
  }

  # entry lines start with a digit; only those in known sections name a file
  if ($line =~ /^[0-9]/
      && defined $section
      && exists $fields_before_filename{$section}) {
    chomp $line;
    my $nlead = $fields_before_filename{$section};
    my @fields = split / /, $line;
    die "$0:$ini:$.: Malformed line in [$section], no filename: $line"
      if @fields <= $nlead;

    my $fn = $fields[$nlead];
    $cnt{$section}++;
    $fn = fixpath($fn);
    $fn = ensure_relative_from_origin($fn, $ini);
    $fn = ensure_exists_or_gzipped_exists($fn);

    # keep the .gz suffix so the clone is still recognisable as gzipped
    my $suffix = ($fn =~ /\.gz$/ ? ".gz" : "");
    my $clone = "./$section.$cnt{$section}$suffix";
    clone_file_or_die($fn, $clone);

    # leading fields are kept, the filename is replaced, anything after the
    # filename is dropped
    $line = join(" ", @fields[0 .. $nlead - 1], $clone) . "\n";
  }

  print $out_fh $line;
}
close $ini_fh;
# buffered write errors only surface at close
close $out_fh or die "Can't write ./moses.ini: $!";
|
|
|
|
|
2007-05-09 04:54:07 +04:00
|
|
|
# clone_file_or_die($src, $tgt)
# Make the file $src available under the name $tgt.
# Symlinks in $src are resolved first. If the global $symlink is set, a
# symlink is attempted; if that is not requested or fails, a hardlink is
# attempted; if that fails too, the file is copied. Dies if even the copy
# fails. Finally the resolved source path is recorded in "$tgt.info"
# (best effort: a failure to write it is only reported on STDERR).
sub clone_file_or_die {
  my $src = shift;
  my $tgt = shift;

  $src = resolve($src); # resolve symlinks

  my $ok = 0;
  if ($symlink) {
    # attempt a symlink
    $ok = safesystem("ln", "-s", $src, $tgt);
  }

  if (!$ok) {
    # perform a hardlink or a copy
    if (! safesystem("ln", $src, $tgt)) {
      # hardlink failed, perform a copy
      safesystem("cp", "-u", $src, $tgt)
        or die "Failed to clone $src into $tgt";
    }
  }

  # dump a short information: where the clone came from.
  # Written directly instead of via a shell "echo", so that spaces and shell
  # metacharacters in the paths are harmless.
  if (open(my $info, '>', "$tgt.info")) {
    print $info "$src\n";
    close $info or print STDERR "Failed to write $tgt.info: $!\n";
  }
  else {
    print STDERR "Failed to write $tgt.info: $!\n";
  }
}
|
|
|
|
|
2007-03-26 02:55:31 +04:00
|
|
|
# ensure_exists_or_gzipped_exists($fn)
# Returns $fn if that path exists, otherwise "$fn.gz" if that exists.
# Dies (mentioning the script name and the ini file) when neither is found.
sub ensure_exists_or_gzipped_exists {
  my ($fn) = @_;
  my $tryfn = "$fn.gz";

  # the plain name takes precedence over the gzipped one
  foreach my $candidate ($fn, $tryfn) {
    if (-e $candidate) {
      return $candidate;
    }
  }

  die "$0:$ini:Neither file $fn nor $tryfn found.";
}
|
2006-08-08 03:04:33 +04:00
|
|
|
|
|
|
|
# fixpath($fn)
# Applies every [ source, target ] pair from @fixrepls to $fn, in order,
# replacing all matches of the source pattern with the target.
# Returns the rewritten path.
sub fixpath {
  my ($fn) = @_;
  for my $i (0 .. $#fixrepls) {
    my ($search, $replacement) = @{ $fixrepls[$i] };
    # the source is interpolated as a regular expression, not a literal
    $fn =~ s/$search/$replacement/g;
  }
  return $fn;
}
|
|
|
|
|
2006-08-01 00:13:25 +04:00
|
|
|
# safesystem(@command)
# Runs @command via system(), logging it to STDERR first.
# Returns true if the command exited with status 0, false if it exited with
# a non-zero status or was killed by a signal. If the command could not be
# started at all, reports the error and terminates the script with exit(1).
sub safesystem {
  print STDERR "Executing: @_\n";
  system(@_);
  if ($? == -1) {
    # the command could not be executed at all
    print STDERR "Failed to execute: @_\n $!\n";
    exit(1);
  }
  elsif ($? & 127) {
    # low 7 bits: signal number; bit 8: core dump flag
    printf STDERR "Execution of: @_\n died with signal %d, %s coredump\n",
      ($? & 127), ($? & 128) ? 'with' : 'without';
    # explicit failure: without this the sub would return printf's true
    # value and callers would take a killed command for a success
    return 0;
  }
  else {
    my $exitcode = $? >> 8;
    print STDERR "Exit code: $exitcode\n" if $exitcode;
    return ! $exitcode;
  }
}
|
|
|
|
|
2007-05-09 04:54:07 +04:00
|
|
|
# resolve($f)
# Follows the full chain of symlinks starting at $f and returns the path of
# the final target. A path that is not a symlink is returned unchanged.
# Relative link targets are interpreted relative to the directory of the
# link itself. Dies if a link cannot be read or if the chain loops.
sub resolve {
  my $f = shift;

  my %seen; # links already followed, to detect cycles
  while (-l $f) {
    die "Symlink loop detected at $f" if $seen{$f}++;

    # compare against undef: a link target may legitimately be named "0"
    my $targ_from_lnk = readlink($f);
    die "Can't readlink $f: $!" if !defined $targ_from_lnk;

    # print STDERR "$f ---> $targ_from_lnk\n";
    $f = ensure_relative_from_origin($targ_from_lnk, $f);
  }
  return $f;
}
|
|
|
|
|
|
|
|
# ensure_relative_from_origin($target, $originfile)
# Interprets $target relative to the directory containing $originfile.
# A $target starting with "/" or "~" is returned untouched; otherwise the
# directory part of $originfile is prepended and the result is passed
# through simplify_path().
sub ensure_relative_from_origin {
  my ($target, $originfile) = @_;

  # the target path is absolute already
  if ($target =~ /^\/|^~/) {
    return $target;
  }

  # strip the file name, keeping the directory part (with its trailing slash)
  (my $origin_dir = $originfile) =~ s/[^\/]*$//;

  my $combined = $target;
  if ($origin_dir ne "") {
    $combined = $origin_dir . "/" . $target;
  }
  return simplify_path($combined);
}
|
|
|
|
|
|
|
|
|
|
|
|
# simplify_path($path)
# Purely textual path clean-up (the file system is not consulted):
#   - runs of slashes are collapsed into one,
#   - "/./" components are removed,
#   - "dir/../" pairs are removed, unless "dir" is itself "." or "..".
# The rules are applied repeatedly until the path no longer changes.
# Returns the simplified path.
sub simplify_path {
  my $path = shift;
  my $lastpath = "";
  while ($lastpath ne $path) {
    $lastpath = $path;
    # "a//b" -> "a/b"
    $path =~ s/\/+/\//g;
    # "a/./b" -> "a/b"
    $path =~ s/(\/\.)+\//\//g;
    # "/dir/../" -> "/"; the lookbehind keeps "/../../" intact
    $path =~ s/\/[^\/]+(?<!\/\.\.)\/\.\.\//\//g;
    # leading "dir/../" -> ""; the lookahead keeps a leading "../../" or
    # "./../" intact (a lookbehind for "/.." can never match at the very
    # start of the string, which used to turn "../../x" into "x")
    $path =~ s/^(?!\.\.?\/)[^\/]+\/\.\.\///g;
  }
  return $path;
}
|