summary | refs | log | tree | commit | diff
path: root/corpus/support/quote-norm.pl
diff options
context:
space:
mode:
author armatthews <armatthe@cmu.edu> 2014-02-20 22:22:15 -0500
committer armatthews <armatthe@cmu.edu> 2014-02-20 22:22:15 -0500
commit f7d1893a35ae158e05503ec15b7125e89309aa16 (patch)
tree e46c09e53f168966f6b56f72eb27e2e97f0a70d6 /corpus/support/quote-norm.pl
parent fb3a61574c90bb96f90fb390496eb1277b4cc83c (diff)
parent 7ecdca1448cc709b21692a1a3b6247c45a3126c3 (diff)
Merge branch 'master' of https://github.com/redpony/cdec
Diffstat (limited to 'corpus/support/quote-norm.pl')
-rwxr-xr-x corpus/support/quote-norm.pl 2
1 files changed, 2 insertions, 0 deletions
diff --git a/corpus/support/quote-norm.pl b/corpus/support/quote-norm.pl
index bed0844e..1d9bb96f 100755
--- a/corpus/support/quote-norm.pl
+++ b/corpus/support/quote-norm.pl
@@ -109,6 +109,8 @@ while(<STDIN>) {
s/\x{ab}/\"/g; # opening guillemet
s/\x{bb}/\"/g; # closing guillemet
s/\x{0301}/'/g; # combining acute accent
+ s/\x{203a}/\"/g; # angle quotation mark
+ s/\x{2039}/\"/g; # angle quotation mark
# Space inverted punctuation:
s/¡/ ¡ /g;