From a08d59c277086933125efc0d996814dfdf497af8 Mon Sep 17 00:00:00 2001 From: Al Date: Sun, 5 Jul 2015 15:28:07 -0400 Subject: [PATCH] [fix] NFD normalization should be the default in normalize.c, not NFKD: NFKD does some unwanted things, like converting superscripts, and the Latin-ASCII transliterator does a better, more thorough job while staying faithful to the original string --- src/normalize.c | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/normalize.c b/src/normalize.c index d4018032..c3708b93 100644 --- a/src/normalize.c +++ b/src/normalize.c @@ -13,7 +13,7 @@ char *utf8_normalize_string(char *str, uint64_t options) { if (options & NORMALIZE_STRING_DECOMPOSE) { have_utf8proc_options = true; - utf8proc_options |= UTF8PROC_OPTIONS_NFKD; + utf8proc_options |= UTF8PROC_OPTIONS_NFD; } if (options & NORMALIZE_STRING_STRIP_ACCENTS) {