# Guard: if pack('U', 0x41) does not yield "A", print a "1..0" plan line that
# carries the reason.
# NOTE(review): the enclosing block, and whatever closes this `unless`
# (presumably an exit), are not visible in this listing -- confirm.
3 unless ("A" eq pack('U', 0x41)) {
4 print "1..0 # Unicode::Normalize " .
5 "cannot stringify a Unicode code point\n";
# When PERL_CORE is set in the environment, @INC is replaced by a single
# library directory: "::lib" when $^O is 'MacOS', "../lib" otherwise.
11 if ($ENV{PERL_CORE}) {
13 @INC = $^O eq 'MacOS' ? qw(::lib) : qw(../lib);
17 #########################
# Declare a plan of 64 tests, then load Unicode::Normalize and import
# normalize(). The count must stay in sync with the number of ok() calls.
# NOTE(review): plan() and ok() come from a test module whose `use` line is
# not visible in this listing (presumably Test) -- confirm.
22 BEGIN { plan tests => 64 };
23 use Unicode::Normalize qw(normalize);
24 ok(1); # If we made it this far, we're ok.
# Thin wrappers that forward all of their arguments to
# Unicode::Normalize::pack_U and Unicode::Normalize::unpack_U respectively.
# NOTE(review): presumably pack_U turns a list of code points into a string
# and unpack_U does the reverse -- confirm against Unicode::Normalize.
26 sub _pack_U { Unicode::Normalize::pack_U(@_) }
27 sub _unpack_U { Unicode::Normalize::unpack_U(@_) }
29 #########################
# Short form names ('D', 'C', 'KD', 'KC'): the empty string is expected to
# come back as the empty string.
31 ok(normalize('D', ""), "");
32 ok(normalize('C', ""), "");
33 ok(normalize('KD',""), "");
34 ok(normalize('KC',""), "");
# Short form names: the single letter "A" is expected to come back unchanged.
36 ok(normalize('D', "A"), "A");
37 ok(normalize('C', "A"), "A");
38 ok(normalize('KD',"A"), "A");
39 ok(normalize('KC',"A"), "A");
# Long form names ('NFD', 'NFC', 'NFKD', 'NFKC'): same empty-string checks.
41 ok(normalize('NFD', ""), "");
42 ok(normalize('NFC', ""), "");
43 ok(normalize('NFKD',""), "");
44 ok(normalize('NFKC',""), "");
# Long form names: same "A" checks.
46 ok(normalize('NFD', "A"), "A");
47 ok(normalize('NFC', "A"), "A");
48 ok(normalize('NFKD',"A"), "A");
49 ok(normalize('NFKC',"A"), "A");
51 # normalize() must not modify its argument.
# Each pair below first checks the returned string (which differs from the
# input), then checks that the input variable still holds its original value.
52 my $sNFD = "\x{FA19}";
53 ok(normalize('NFD', $sNFD), "\x{795E}");
54 ok($sNFD, "\x{FA19}");
56 my $sNFC = "\x{FA1B}";
57 ok(normalize('NFC', $sNFC), "\x{798F}");
58 ok($sNFC, "\x{FA1B}");
60 my $sNFKD = "\x{FA1E}";
61 ok(normalize('NFKD', $sNFKD), "\x{7FBD}");
62 ok($sNFKD, "\x{FA1E}");
64 my $sNFKC = "\x{FA26}";
65 ok(normalize('NFKC', $sNFKC), "\x{90FD}");
66 ok($sNFKC, "\x{FA26}");
# Body of a helper whose `sub` header is not visible in this listing
# (presumably hexNFC, which the tests below call -- confirm).
# Reading right to left: take the first argument, split it on whitespace,
# convert each field from hex, pass the numbers to _pack_U, normalize the
# result with form 'C', pass that to _unpack_U, format each resulting value
# as upper-case hex padded to at least four digits, and join with spaces.
69 join " ", map sprintf("%04X", $_),
70 _unpack_U normalize 'C', _pack_U map hex, split ' ', shift;
# Body of a second helper, identical except that it normalizes with form 'D'
# (presumably hexNFD; header likewise not visible -- confirm).
73 join " ", map sprintf("%04X", $_),
74 _unpack_U normalize 'D', _pack_U map hex, split ' ', shift;
# In all tests below, both the input and the expected value are strings of
# space-separated hexadecimal code points.

# hexNFD: U+1E14 and the precomposed code points U+AC00/U+AC01/U+AE00 are
# expected to expand into longer sequences.
77 ok(hexNFD("1E14 AC01"), "0045 0304 0300 1100 1161 11A8");
78 ok(hexNFD("AC00 AE00"), "1100 1161 1100 1173 11AF");
# hexNFC: three orderings of the same marks after U+0061 are expected to give
# one result; the sequences from the hexNFD tests above are expected to
# recompose; the last case (U+0300 placed after U+1100) is expected to stay
# unchanged.
80 ok(hexNFC("0061 0315 0300 05AE 05C4 0062"), "00E0 05AE 05C4 0315 0062");
81 ok(hexNFC("00E0 05AE 05C4 0315 0062"), "00E0 05AE 05C4 0315 0062");
82 ok(hexNFC("0061 05AE 0300 05C4 0315 0062"), "00E0 05AE 05C4 0315 0062");
83 ok(hexNFC("0045 0304 0300 AC00 11A8"), "1E14 AC01");
84 ok(hexNFC("1100 1161 1100 1173 11AF"), "AC00 AE00");
85 ok(hexNFC("1100 0300 1161 1173 11AF"), "1100 0300 1161 1173 11AF");
# hexNFD: the same three inputs are expected to give one fully expanded,
# reordered sequence.
87 ok(hexNFD("0061 0315 0300 05AE 05C4 0062"), "0061 05AE 0300 05C4 0315 0062");
88 ok(hexNFD("00E0 05AE 05C4 0315 0062"), "0061 05AE 0300 05C4 0315 0062");
89 ok(hexNFD("0061 05AE 0300 05C4 0315 0062"), "0061 05AE 0300 05C4 0315 0062");
# Here U+05C4 comes before U+0300 in the expected order; both hexNFC and
# hexNFD are expected to give the same reordered sequence, with U+0061 and
# U+0300 left uncomposed.
90 ok(hexNFC("0061 05C4 0315 0300 05AE 0062"), "0061 05AE 05C4 0300 0315 0062");
91 ok(hexNFC("0061 05AE 05C4 0300 0315 0062"), "0061 05AE 05C4 0300 0315 0062");
92 ok(hexNFD("0061 05C4 0315 0300 05AE 0062"), "0061 05AE 05C4 0300 0315 0062");
93 ok(hexNFD("0061 05AE 05C4 0300 0315 0062"), "0061 05AE 05C4 0300 0315 0062");
# U+0000 is expected to pass through both helpers unchanged.
94 ok(hexNFC("0000 0041 0000 0000"), "0000 0041 0000 0000");
95 ok(hexNFD("0000 0041 0000 0000"), "0000 0041 0000 0000");
# U+AC00 followed by U+11A8, U+11A9 or U+11C2 is expected to compose into a
# single code point; with U+11A7 or U+11C3 (one below / one above the tested
# range) the pair is expected to stay as is.
97 ok(hexNFC("AC00 11A7"), "AC00 11A7");
98 ok(hexNFC("AC00 11A8"), "AC01");
99 ok(hexNFC("AC00 11A9"), "AC02");
100 ok(hexNFC("AC00 11C2"), "AC1B");
101 ok(hexNFC("AC00 11C3"), "AC00 11C3");
103 # Test Cases from Public Review Issue #29: Normalization Issue
104 # cf. http://www.unicode.org/review/pr-29.html
# With U+0300 between the two characters, no composition is expected.
105 ok(hexNFC("0B47 0300 0B3E"), "0B47 0300 0B3E");
106 ok(hexNFC("1100 0300 1161"), "1100 0300 1161");
# With U+0300 after the pair, the pair is expected to compose and U+0300 to
# follow the composed code point.
108 ok(hexNFC("0B47 0B3E 0300"), "0B4B 0300");
109 ok(hexNFC("1100 1161 0300"), "AC00 0300");
# As the first group, with a trailing U+0327: still expected unchanged.
111 ok(hexNFC("0B47 0300 0B3E 0327"), "0B47 0300 0B3E 0327");
112 ok(hexNFC("1100 0300 1161 0327"), "1100 0300 1161 0327");
# Sequences where U+0300/U+0301 come first or directly follow U+0000 are
# expected to stay unchanged, in their original order.
114 ok(hexNFC("0300 0041"), "0300 0041");
115 ok(hexNFC("0300 0301 0041"), "0300 0301 0041");
116 ok(hexNFC("0301 0300 0041"), "0301 0300 0041");
117 ok(hexNFC("0000 0300 0000 0301"), "0000 0300 0000 0301");
118 ok(hexNFC("0000 0301 0000 0300"), "0000 0301 0000 0300");
# A mark placed before U+0061 is expected to be left in place, while the
# following "0061 0300" still composes to U+00E0.
120 ok(hexNFC("0327 0061 0300"), "0327 00E0");
121 ok(hexNFC("0301 0061 0300"), "0301 00E0");
122 ok(hexNFC("0315 0061 0300"), "0315 00E0");
123 ok(hexNFC("0000 0327 0061 0300"), "0000 0327 00E0");
124 ok(hexNFC("0000 0301 0061 0300"), "0000 0301 00E0");
125 ok(hexNFC("0000 0315 0061 0300"), "0000 0315 00E0");