diff options
author | redpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-10-28 18:02:35 +0000 |
---|---|---|
committer | redpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-10-28 18:02:35 +0000 |
commit | c1e9b0d59290843498dec2b4821532d0c36eab71 (patch) | |
tree | 1e318fd688a0e62fa42162a4602555667fbeeff5 | |
parent | 13829cbd808c727112a9f24ac08141fc4483f5a3 (diff) |
fix, rename
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@696 ec762483-ff6d-05da-a07a-a48fb63a330f
-rwxr-xr-x[-rw-r--r--] | word-aligner/support/generate_per_sentence_grammars.pl (renamed from word-aligner/support/generate-per-sentence-grammars.pl) | 22 |
1 files changed, 19 insertions, 3 deletions
```diff
diff --git a/word-aligner/support/generate-per-sentence-grammars.pl b/word-aligner/support/generate_per_sentence_grammars.pl
index d621213e..c644ec6d 100644..100755
--- a/word-aligner/support/generate-per-sentence-grammars.pl
+++ b/word-aligner/support/generate_per_sentence_grammars.pl
@@ -38,11 +38,27 @@ while(<G>) {
 $memrc++;
 } else {
 $loadrc++;
- $grammar{$f}="$e ||| $feats";
+ my $r = $grammar{$f};
+ if (!defined $r) {
+ $r = [];
+ $grammar{$f} = $r;
+ }
+ push @$r, "$e ||| $feats";
 }
 }
-
+close G;
 print STDERR " mem rc: $memrc\n";
 print STDERR " load rc: $loadrc\n";
-
+while(<C>) {
+ my ($f,$e) = split / \|\|\| /;
+ my @fwords = split /\s+/, $f;
+ my $tot = 0;
+ for my $f (@fwords) {
+ my $r = $grammar{$f};
+ die "No translations for: $f" unless $r;
+ my $num = scalar @$r;
+ $tot += $num;
+ }
+ print "RULES: $tot\n";
+}
```