chiark / gitweb /
Merge from 3.0 fixes branch
[disorder] / lib / t-casefold.c
CommitLineData
b90f122b
RK
1/*
2 * This file is part of DisOrder.
3 * Copyright (C) 2005, 2007, 2008 Richard Kettlewell
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
18 * USA
19 */
20#include "test.h"
21
22void test_casefold(void) {
23 uint32_t c, l;
24 const char *input, *canon_folded, *compat_folded, *canon_expected, *compat_expected;
25
26 fprintf(stderr, "test_casefold\n");
27
28 /* This isn't a very exhaustive test. Unlike for normalization, there don't
29 * seem to be any public test vectors for these algorithms. */
30
31 for(c = 1; c < 256; ++c) {
32 input = utf32_to_utf8(&c, 1, 0);
33 canon_folded = utf8_casefold_canon(input, strlen(input), 0);
34 compat_folded = utf8_casefold_compat(input, strlen(input), 0);
35 switch(c) {
36 default:
37 if((c >= 'A' && c <= 'Z')
38 || (c >= 0xC0 && c <= 0xDE && c != 0xD7))
39 l = c ^ 0x20;
40 else
41 l = c;
42 break;
43 case 0xB5: /* MICRO SIGN */
44 l = 0x3BC; /* GREEK SMALL LETTER MU */
45 break;
46 case 0xDF: /* LATIN SMALL LETTER SHARP S */
47 check_string(canon_folded, "ss");
48 check_string(compat_folded, "ss");
49 l = 0;
50 break;
51 }
52 if(l) {
53 uint32_t *d;
54 /* Case-folded data is now normalized */
55 d = utf32_decompose_canon(&l, 1, 0);
56 canon_expected = utf32_to_utf8(d, utf32_len(d), 0);
57 if(strcmp(canon_folded, canon_expected)) {
58 fprintf(stderr, "%s:%d: canon-casefolding %#lx got '%s', expected '%s'\n",
59 __FILE__, __LINE__, (unsigned long)c,
60 format(canon_folded), format(canon_expected));
61 count_error();
62 }
63 ++tests;
64 d = utf32_decompose_compat(&l, 1, 0);
65 compat_expected = utf32_to_utf8(d, utf32_len(d), 0);
66 if(strcmp(compat_folded, compat_expected)) {
67 fprintf(stderr, "%s:%d: compat-casefolding %#lx got '%s', expected '%s'\n",
68 __FILE__, __LINE__, (unsigned long)c,
69 format(compat_folded), format(compat_expected));
70 count_error();
71 }
72 ++tests;
73 }
74 }
75 check_string(utf8_casefold_canon("", 0, 0), "");
76}
77
78/*
79Local Variables:
80c-basic-offset:2
81comment-column:40
82fill-column:79
83indent-tabs-mode:nil
84End:
85*/