summary | refs | log | tree | commit | diff
path: root/word-aligner
diff options
context:
space:
mode:
author Patrick Simianer <p@simianer.de> 2013-03-15 11:39:18 +0100
committer Patrick Simianer <p@simianer.de> 2013-03-15 11:39:18 +0100
commit 4f191a593918c7889f2c27cd9f596bec591bf736 (patch)
tree 07635cd6e1544c8ef3495aa2b086350a23fc4c28 /word-aligner
parent 2a48d73eb794fdd736d1df035c8a31af887cde0a (diff)
parent cba324bee086f4dd0fc9df204d33ff7eb9b6c323 (diff)
Merge remote-tracking branch 'upstream/master'
Diffstat (limited to 'word-aligner')
-rwxr-xr-x word-aligner/ortho-norm/ru.pl 44
1 files changed, 44 insertions, 0 deletions
diff --git a/word-aligner/ortho-norm/ru.pl b/word-aligner/ortho-norm/ru.pl
new file mode 100755
index 00000000..34452d06
--- /dev/null
+++ b/word-aligner/ortho-norm/ru.pl
@@ -0,0 +1,44 @@
+#!/usr/bin/perl -w
+# Orthographic normalizer for Russian text.
+#
+# Reads UTF-8 lines from STDIN and prints each one to STDOUT with every
+# Cyrillic letter listed in %latin_for replaced by a Latin spelling and all
+# remaining characters lowercased.
+use strict;
+use utf8;    # the Cyrillic literals in this file are UTF-8 source text
+binmode(STDIN,":utf8");
+binmode(STDOUT,":utf8");
+
+# Uppercase Cyrillic letter => Latin replacement.  Keys are uppercase because
+# every input line is uppercased before the lookup.
+my %latin_for = (
+  'А' => 'a',  'Б' => 'b',    'В' => 'v',  'Г' => 'g', 'Д' => 'd',
+  'Е' => 'e',  'Ж' => 'zh',   'З' => 'z',  'И' => 'i', 'Й' => 'i',
+  'І' => 'i',  'К' => 'k',    'Л' => 'l',  'М' => 'm', 'Н' => 'n',
+  'О' => 'o',  'П' => 'p',    'Р' => 'r',  'С' => 's', 'Т' => 't',
+  'У' => 'u',  'Ф' => 'f',    'Х' => 'kh', 'Ц' => 'c', 'Ч' => 'ch',
+  'Ш' => 'sh', 'Щ' => 'shch', 'Э' => 'e',  'Я' => 'ya',
+  # These three letters are removed from the output altogether.
+  # NOTE(review): Ы is a vowel, unlike the signs Ъ and Ь; dropping it is
+  # long-standing behavior of this script but should be confirmed.
+  'Ъ' => '',   'Ы' => '',     'Ь' => '',
+  # Ю is "yu" and Ё is "yo" (the usual romanization).  Ё needs its own entry,
+  # otherwise it would pass through to the output as a Cyrillic letter.
+  'Ё' => 'yo', 'Ю' => 'yu',
+);
+
+# Character class matching exactly the keys of %latin_for.
+my $cyrillic_re = do {
+  my $class = join '', sort keys %latin_for;
+  qr/[$class]/;
+};
+
+while (my $line = <STDIN>) {
+  # Fold to uppercase first so both cases of a letter hit the same key.
+  $line = uc $line;
+  $line =~ s/($cyrillic_re)/$latin_for{$1}/g;
+  # Lowercase whatever was not transliterated (e.g. Latin text).
+  $line = lc $line;
+  print $line;
+}
+