summary | refs | log | tree | commit | diff
path: root/corpus
diff options
context:
space:
mode:
author: Chris Dyer <redpony@gmail.com> 2014-12-29 02:02:27 -0500
committer: Chris Dyer <redpony@gmail.com> 2014-12-29 02:02:27 -0500
commit: a66b19342f105546adfb9cd9189f862e8a9c0b15 (patch)
tree: 608b6894fb5ebdba37451684755963011f685b14 /corpus
parent: 4c4ab517897a217734e7a7e5942735712b561981 (diff)
finnish case markings
Diffstat (limited to 'corpus')
-rw-r--r-- corpus/support/token_patterns 3
1 file changed, 2 insertions, 1 deletion
diff --git a/corpus/support/token_patterns b/corpus/support/token_patterns
index e51e5e72..12558cdd 100644
--- a/corpus/support/token_patterns
+++ b/corpus/support/token_patterns
@@ -1,6 +1,7 @@
/^(al|el|ul|e)\-[a-z]+$/
+/\.(fi|fr|es|co\.uk|de)$/
+/:[a-zä]+$/
/^((а|А)(ль|ш)|уль)-\p{Cyrillic}+$/
-/^(юл)-\p{Cyrillic}+$/
/^\p{Cyrillic}\.\p{Cyrillic}\.$/
/^(\d|\d\d|\d\d\d)\.$/