summaryrefslogtreecommitdiff
path: root/word-aligner/ortho-norm/ar.pl
blob: e8bd521a29d6ea2f44abcfdc56e10c7614d3bf92 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
#!/usr/bin/perl -w
use strict;
use utf8;

# Decode STDIN and encode STDOUT as strict UTF-8.
# The bare ":utf8" layer only flags the data as UTF-8 without validating it,
# so malformed input bytes could reach the substitutions below as corrupt
# strings. ":encoding(UTF-8)" checks the byte stream; for well-formed UTF-8
# the behaviour is unchanged.
binmode(STDIN,  ':encoding(UTF-8)')
  or die "Cannot set UTF-8 layer on STDIN: $!\n";
binmode(STDOUT, ':encoding(UTF-8)')
  or die "Cannot set UTF-8 layer on STDOUT: $!\n";

# Normalize one token per input line and print the result, one per line.
# NOTE(review): the symbol inventory ($, *, |, }, E, Y, p, ~ ...) looks like
# Buckwalter-style romanized Arabic -- confirm against the caller.
# The rules are order-sensitive (e.g. "^Aw" must be handled before the
# general "w" rule, and "~" doubling must see the letters as they are before
# later rules introduce new ones), so keep the sequence intact.
while (defined(my $token = <STDIN>)) {
    chomp $token;

    # Measured once, before any rewriting: several rules are skipped for
    # single-character tokens.
    my $is_multichar = length($token) > 1;

    # "$" becomes "sh", except in single-character tokens and in tokens
    # that contain a digit.
    $token =~ s/\$/sh/g if $is_multichar && $token !~ /\d/;

    # A lowercase letter followed by "~" is written twice; the "~" is dropped.
    $token =~ s/([a-z])\~/$1$1/g;

    $token =~ s/E/'/g;
    $token =~ s/^Aw/o/g;    # token-initial "Aw" collapses to a single "o"
    $token =~ s/\|/a/g;
    $token =~ s/@/h/g;
    $token =~ s/c/ch/g;
    $token =~ s/x/kh/g;
    $token =~ s/\*/dh/g;
    $token =~ s/w/o/g;
    $token =~ s/v/th/g;
    $token =~ s/}/'/g if $is_multichar;
    $token =~ s/Z/dh/g;
    $token =~ s/y/i/g;
    $token =~ s/Y/a/g;

    # A final "p" is removed from multi-character tokens.
    $token =~ s/p$// if $is_multichar;

    # Everything that is still uppercase is folded to lowercase on output.
    print lc($token) . "\n";
}