diff options
| -rw-r--r-- | word-aligner/support/generate-per-sentence-grammars.pl | 5 | 
1 files changed, 3 insertions, 2 deletions
| diff --git a/word-aligner/support/generate-per-sentence-grammars.pl b/word-aligner/support/generate-per-sentence-grammars.pl index 695cfc17..d621213e 100644 --- a/word-aligner/support/generate-per-sentence-grammars.pl +++ b/word-aligner/support/generate-per-sentence-grammars.pl @@ -4,7 +4,7 @@ use utf8;  die "Usage: $0 f.voc corpus.f-e grammar.f-e.gz\n" unless scalar @ARGV == 3; -my $MAX_INMEM = 1000; +my $MAX_INMEM = 3000;  open FV,"<$ARGV[0]" or die "Can't read $ARGV[0]: $!";  open C,"<$ARGV[1]" or die "Can't read $ARGV[1]: $!"; @@ -19,7 +19,7 @@ my %most_freq;  $most_freq{"<eps>"} = 1;  while(my $f = <FV>) {    chomp $f; -  %most_freq{$f}=1; +  $most_freq{$f}=1;    $vc++;    last if $vc == $MAX_INMEM;  } @@ -27,6 +27,7 @@ close FV;  print STDERR "Loaded $vc vocabulary items for permanent translation cache\n"; +my %grammar;  my $memrc = 0;  my $loadrc = 0;  while(<G>) { | 
