From: Richard Kettlewell
Date: Sun, 5 Apr 2009 09:45:15 +0000 (+0100)
Subject: Update grapheme break algorithm to Unicode 5.1.0 (based on UAX #29)
X-Git-Tag: 5.0~152^2~4
X-Git-Url: http://www.chiark.greenend.org.uk/ucgi/~mdw/git/disorder/commitdiff_plain/e2e88ad814a1839b34a163832975620fe0e44fac

Update grapheme break algorithm to Unicode 5.1.0 (based on UAX #29)
---

diff --git a/lib/unicode.c b/lib/unicode.c
index 55390eb..16c5932 100644
--- a/lib/unicode.c
+++ b/lib/unicode.c
@@ -603,6 +603,12 @@ int utf32_iterator_grapheme_boundary(utf32_iterator it) {
   /* GB9 */
   if(gbafter == unicode_Grapheme_Break_Extend)
     return 0;
+  /* GB9a */
+  if(gbafter == unicode_Grapheme_Break_SpacingMark)
+    return 0;
+  /* GB9b */
+  if(gbbefore == unicode_Grapheme_Break_Prepend)
+    return 0;
   /* GB10 */
   return 1;