summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: redpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f> 2010-10-28 19:42:39 +0000
committer: redpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f> 2010-10-28 19:42:39 +0000
commit: 0b528dff0ff3dec0dd7a65b6cda84483092dacfb (patch)
tree: 51663a61b61ca562425738b1fc82e6c54be18d43
parent: 6f21de07db8631992be2ed01fef3c839ec5aedae (diff)
gen ps
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@698 ec762483-ff6d-05da-a07a-a48fb63a330f
-rwxr-xr-x  word-aligner/support/generate_per_sentence_grammars.pl  4
1 file changed, 3 insertions, 1 deletion
diff --git a/word-aligner/support/generate_per_sentence_grammars.pl b/word-aligner/support/generate_per_sentence_grammars.pl
index 730035d8..80243419 100755
--- a/word-aligner/support/generate_per_sentence_grammars.pl
+++ b/word-aligner/support/generate_per_sentence_grammars.pl
@@ -55,6 +55,7 @@ my $id = 0;
open O, ">ps.grammar" or die;
binmode(O,":utf8");
while(<C>) {
+ chomp;
my ($f,$e) = split / \|\|\| /;
my @fwords = split /\s+/, $f;
my $tot = 0;
@@ -73,7 +74,8 @@ while(<C>) {
$used{$f} = 1;
}
print O "###EOS###\n";
- print STDERR "id=$id POS=$fpos\n";
+ print STDERR "<seg id=\"$id\" grammar=\"\@$fpos\"> $_ </seg>\n";
+ #print STDERR "id=$id POS=$fpos\n";
$id++;
last if $id == 10;
}