diff options
author | redpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-10-28 19:42:39 +0000 |
---|---|---|
committer | redpony <redpony@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-10-28 19:42:39 +0000 |
commit | 0b528dff0ff3dec0dd7a65b6cda84483092dacfb (patch) | |
tree | 51663a61b61ca562425738b1fc82e6c54be18d43 /word-aligner/support/generate_per_sentence_grammars.pl | |
parent | 6f21de07db8631992be2ed01fef3c839ec5aedae (diff) |
gen ps
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@698 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'word-aligner/support/generate_per_sentence_grammars.pl')
-rwxr-xr-x | word-aligner/support/generate_per_sentence_grammars.pl | 4 |
1 files changed, 3 insertions, 1 deletions
diff --git a/word-aligner/support/generate_per_sentence_grammars.pl b/word-aligner/support/generate_per_sentence_grammars.pl
index 730035d8..80243419 100755
--- a/word-aligner/support/generate_per_sentence_grammars.pl
+++ b/word-aligner/support/generate_per_sentence_grammars.pl
@@ -55,6 +55,7 @@ my $id = 0;
 open O, ">ps.grammar" or die;
 binmode(O,":utf8");
 while(<C>) {
+  chomp;
   my ($f,$e) = split / \|\|\| /;
   my @fwords = split /\s+/, $f;
   my $tot = 0;
@@ -73,7 +74,8 @@ while(<C>) {
     $used{$f} = 1;
   }
   print O "###EOS###\n";
-  print STDERR "id=$id POS=$fpos\n";
+  print STDERR "<seg id=\"$id\" grammar=\"\@$fpos\"> $_ </seg>\n";
+  #print STDERR "id=$id POS=$fpos\n";
   $id++;
   last if $id == 10;
 }