diff options
author | Patrick Simianer <p@simianer.de> | 2013-03-15 11:39:18 +0100 |
---|---|---|
committer | Patrick Simianer <p@simianer.de> | 2013-03-15 11:39:18 +0100 |
commit | 3d8aa307d233f58cfe9ddcc616a8297551a738e3 (patch) | |
tree | b9556fe62c7ac0d7b48d92481acdd06a546b1dc2 /word-aligner | |
parent | cf67d34738e1487f75739dc1e027b1864a06513b (diff) | |
parent | 9f1d72fa4dc231eb8cdb737becfc10452b5daef4 (diff) |
Merge remote-tracking branch 'upstream/master'
Diffstat (limited to 'word-aligner')
-rwxr-xr-x | word-aligner/ortho-norm/ru.pl | 44 |
1 files changed, 44 insertions, 0 deletions
#!/usr/bin/perl -w
# word-aligner/ortho-norm/ru.pl (added as a new file, mode 100755, blob 34452d06)
#
# Orthographic normalizer for Russian text.
#
# Reads lines from STDIN (decoded as UTF-8) and prints each one to STDOUT
# (encoded as UTF-8) with every Cyrillic letter in the table below replaced
# by a rough lower-case Latin transliteration.  All remaining characters are
# case-folded to lower case and otherwise left alone.
use strict;
use utf8;    # the transliteration table below contains UTF-8 literals

binmode(STDIN,  ":utf8");
binmode(STDOUT, ":utf8");

# Upper-case Cyrillic letter => Latin replacement.  Keys are upper case
# because normalize_ru() upper-cases its input before the lookup, so one
# entry covers both cases of a letter.
my %latin_for = (
    'А' => 'a',  'Б' => 'b',  'В' => 'v',  'Г' => 'g',    'Д' => 'd',
    'Е' => 'e',  'Ж' => 'zh', 'З' => 'z',  'И' => 'i',    'Й' => 'i',
    'К' => 'k',  'Л' => 'l',  'М' => 'm',  'Н' => 'n',    'О' => 'o',
    'П' => 'p',  'Р' => 'r',  'С' => 's',  'Т' => 't',    'У' => 'u',
    'Ф' => 'f',  'Х' => 'kh', 'Ц' => 'c',  'Ч' => 'ch',   'Ш' => 'sh',
    'Щ' => 'shch',
    'Э' => 'e',  'Я' => 'ya',

    # Dotted I (U+0406), as used in Ukrainian/Belarusian spelling.
    'І' => 'i',

    # Fixed: this letter used to be emitted as "yo".
    'Ю' => 'yu',

    # Added: this letter previously had no rule and leaked through as
    # Cyrillic.  It is mapped like 'Е' because it is commonly spelled
    # with 'Е', so both spellings of a word normalize to the same string.
    'Ё' => 'e',

    # Hard and soft signs carry no sound of their own and are deleted.
    'Ъ' => '',   'Ь' => '',

    # NOTE(review): 'Ы' is deleted, exactly as before.  It is normally
    # romanized as "y"; confirm whether dropping it is intentional.
    'Ы' => '',
);

# One character class matching every key of the table, so a line is
# rewritten in a single pass.  The keys are plain letters, so no escaping
# is needed inside the class.
my $cyrillic_re = do {
    my $letters = join '', keys %latin_for;
    qr/[$letters]/;
};

# normalize_ru($text)
#   Returns $text with the Cyrillic letters from %latin_for transliterated
#   and the whole string lower-cased.  The argument is not modified.
sub normalize_ru {
    my ($text) = @_;

    $text = uc $text;
    $text =~ s/($cyrillic_re)/$latin_for{$1}/g;

    return lc $text;
}

# Run the filter only when executed as a script; when this file is pulled in
# with require/do, caller() is true and only normalize_ru() is defined.
unless (caller) {
    while (my $line = <STDIN>) {
        print normalize_ru($line);
    }
}