summary | refs | log | tree | commit | diff
path: root/word-aligner
diff options
context:
space:
mode:
Diffstat (limited to 'word-aligner')
-rw-r--r-- word-aligner/support/generate-per-sentence-grammars.pl 5
1 files changed, 3 insertions, 2 deletions
diff --git a/word-aligner/support/generate-per-sentence-grammars.pl b/word-aligner/support/generate-per-sentence-grammars.pl
index 695cfc17..d621213e 100644
--- a/word-aligner/support/generate-per-sentence-grammars.pl
+++ b/word-aligner/support/generate-per-sentence-grammars.pl
@@ -4,7 +4,7 @@ use utf8;
die "Usage: $0 f.voc corpus.f-e grammar.f-e.gz\n" unless scalar @ARGV == 3;
-my $MAX_INMEM = 1000;
+my $MAX_INMEM = 3000;
open FV,"<$ARGV[0]" or die "Can't read $ARGV[0]: $!";
open C,"<$ARGV[1]" or die "Can't read $ARGV[1]: $!";
@@ -19,7 +19,7 @@ my %most_freq;
$most_freq{"<eps>"} = 1;
while(my $f = <FV>) {
chomp $f;
- %most_freq{$f}=1;
+ $most_freq{$f}=1;
$vc++;
last if $vc == $MAX_INMEM;
}
@@ -27,6 +27,7 @@ close FV;
print STDERR "Loaded $vc vocabulary items for permanent translation cache\n";
+my %grammar;
my $memrc = 0;
my $loadrc = 0;
while(<G>) {