# Bootstrap for running as part of the perl core test suite.
# When PERL_CORE is set, switch into the t/ directory (if there is one) and
# replace @INC so that modules are loaded from the uninstalled lib tree.
BEGIN {
    if ($ENV{PERL_CORE}) {
        chdir('t') if -d 't';
        # On $^O 'MacOS' the relative library path is spelled "::lib".
        @INC = $^O eq 'MacOS' ? qw(::lib) : qw(../lib);
    }
}

#########################

use strict;
use warnings;

# Unbuffer STDOUT and print the test plan at compile time, before anything
# else in the script can produce output.
BEGIN { $| = 1; print "1..64\n"; }

# Running test number. ok() hands a reference to it to
# Unicode::Normalize::ok together with the caller's arguments.
# NOTE(review): the helper presumably increments the counter and prints the
# "ok"/"not ok" line -- its body is not visible in this file.
my $count = 0;
sub ok { Unicode::Normalize::ok(\$count, @_) }

use Unicode::Normalize qw(normalize);

# Test 1: only reached if the module above loaded successfully.
ok(1);

# Thin wrappers around the module's test helpers. Judging by their use in
# hexNFC/hexNFD, _pack_U turns a list of code points into a string and
# _unpack_U turns a string back into a list of code points.
sub _pack_U   { Unicode::Normalize::dot_t_pack_U(@_) }
sub _unpack_U { Unicode::Normalize::dot_t_unpack_U(@_) }

#########################

# Empty string, short form names ('D', 'C', 'KD', 'KC').
ok(normalize('D', ""), "");
ok(normalize('C', ""), "");
ok(normalize('KD',""), "");
ok(normalize('KC',""), "");

# A plain ASCII letter is returned unchanged, short form names.
ok(normalize('D', "A"), "A");
ok(normalize('C', "A"), "A");
ok(normalize('KD',"A"), "A");
ok(normalize('KC',"A"), "A");

# Empty string, long form names ('NFD', 'NFC', 'NFKD', 'NFKC').
ok(normalize('NFD', ""), "");
ok(normalize('NFC', ""), "");
ok(normalize('NFKD',""), "");
ok(normalize('NFKC',""), "");

# A plain ASCII letter is returned unchanged, long form names.
ok(normalize('NFD', "A"), "A");
ok(normalize('NFC', "A"), "A");
ok(normalize('NFKD',"A"), "A");
ok(normalize('NFKC',"A"), "A");

# 17 tests so far

# don't modify the source
# Each input below normalizes to a different character, so the second check
# of every pair would fail if normalize() altered its argument in place.
my $sNFD = "\x{FA19}";
ok(normalize('NFD', $sNFD), "\x{795E}");
ok($sNFD, "\x{FA19}");

my $sNFC = "\x{FA1B}";
ok(normalize('NFC', $sNFC), "\x{798F}");
ok($sNFC, "\x{FA1B}");

my $sNFKD = "\x{FA1E}";
ok(normalize('NFKD', $sNFKD), "\x{7FBD}");
ok($sNFKD, "\x{FA1E}");

my $sNFKC = "\x{FA26}";
ok(normalize('NFKC', $sNFKC), "\x{90FD}");
ok($sNFKC, "\x{FA26}");

# 25 tests so far

# hexNFC($hex_string)
#   $hex_string: code points written in hexadecimal, separated by whitespace.
#   Builds a string from those code points with _pack_U, applies
#   normalize('C', ...), and returns the resulting code points as upper-case
#   hexadecimal (zero-padded to at least four digits) joined by single spaces.
sub hexNFC {
    my ($hex_string) = @_;

    # split ' ' skips leading whitespace and splits on runs of whitespace.
    my @code_points = map { hex $_ } split ' ', $hex_string;

    # Explicit parentheses: the call chain no longer relies on the helpers
    # being predeclared or on normalize()'s prototype to parse as intended.
    my $normalized = normalize('C', _pack_U(@code_points));

    return join ' ', map { sprintf '%04X', $_ } _unpack_U($normalized);
}
# hexNFD($hex_string)
#   $hex_string: code points written in hexadecimal, separated by whitespace.
#   Builds a string from those code points with _pack_U, applies
#   normalize('D', ...), and returns the resulting code points as upper-case
#   hexadecimal (zero-padded to at least four digits) joined by single spaces.
sub hexNFD {
    my ($hex_string) = @_;

    # split ' ' skips leading whitespace and splits on runs of whitespace.
    my @code_points = map { hex $_ } split ' ', $hex_string;

    # Explicit parentheses: the call chain no longer relies on the helpers
    # being predeclared or on normalize()'s prototype to parse as intended.
    my $normalized = normalize('D', _pack_U(@code_points));

    return join ' ', map { sprintf '%04X', $_ } _unpack_U($normalized);
}

# Decomposition of a precomposed Latin letter and of Hangul syllables.
ok(hexNFD("1E14 AC01"), "0045 0304 0300 1100 1161 11A8");
ok(hexNFD("AC00 AE00"), "1100 1161 1100 1173 11AF");

# Composition: combining marks are reordered and composed where possible.
ok(hexNFC("0061 0315 0300 05AE 05C4 0062"), "00E0 05AE 05C4 0315 0062");
ok(hexNFC("00E0 05AE 05C4 0315 0062"),      "00E0 05AE 05C4 0315 0062");
ok(hexNFC("0061 05AE 0300 05C4 0315 0062"), "00E0 05AE 05C4 0315 0062");
ok(hexNFC("0045 0304 0300 AC00 11A8"), "1E14 AC01");
ok(hexNFC("1100 1161 1100 1173 11AF"), "AC00 AE00");
# A combining mark between the jamo keeps them from composing.
ok(hexNFC("1100 0300 1161 1173 11AF"), "1100 0300 1161 1173 11AF");

# Reordering of combining marks, with and without composition.
ok(hexNFD("0061 0315 0300 05AE 05C4 0062"), "0061 05AE 0300 05C4 0315 0062");
ok(hexNFD("00E0 05AE 05C4 0315 0062"),      "0061 05AE 0300 05C4 0315 0062");
ok(hexNFD("0061 05AE 0300 05C4 0315 0062"), "0061 05AE 0300 05C4 0315 0062");
ok(hexNFC("0061 05C4 0315 0300 05AE 0062"), "0061 05AE 05C4 0300 0315 0062");
ok(hexNFC("0061 05AE 05C4 0300 0315 0062"), "0061 05AE 05C4 0300 0315 0062");
ok(hexNFD("0061 05C4 0315 0300 05AE 0062"), "0061 05AE 05C4 0300 0315 0062");
ok(hexNFD("0061 05AE 05C4 0300 0315 0062"), "0061 05AE 05C4 0300 0315 0062");
# U+0000 inside the string is passed through unchanged.
ok(hexNFC("0000 0041 0000 0000"), "0000 0041 0000 0000");
ok(hexNFD("0000 0041 0000 0000"), "0000 0041 0000 0000");

# Hangul syllable AC00 followed by a trailing jamo: 11A8..11C2 compose,
# while 11A7 and 11C3 (just outside that range) do not.
ok(hexNFC("AC00 11A7"), "AC00 11A7");
ok(hexNFC("AC00 11A8"), "AC01");
ok(hexNFC("AC00 11A9"), "AC02");
ok(hexNFC("AC00 11C2"), "AC1B");
ok(hexNFC("AC00 11C3"), "AC00 11C3");

# 47 tests so far

# Test Cases from Public Review Issue #29: Normalization Issue
# cf. http://www.unicode.org/review/pr-29.html
ok(hexNFC("0B47 0300 0B3E"), "0B47 0300 0B3E");
ok(hexNFC("1100 0300 1161"), "1100 0300 1161");
ok(hexNFC("0B47 0B3E 0300"), "0B4B 0300");
ok(hexNFC("1100 1161 0300"), "AC00 0300");
ok(hexNFC("0B47 0300 0B3E 0327"), "0B47 0300 0B3E 0327");
ok(hexNFC("1100 0300 1161 0327"), "1100 0300 1161 0327");

# Combining marks at the start of the string, or directly after U+0000,
# are left exactly as given.
ok(hexNFC("0300 0041"), "0300 0041");
ok(hexNFC("0300 0301 0041"), "0300 0301 0041");
ok(hexNFC("0301 0300 0041"), "0301 0300 0041");
ok(hexNFC("0000 0300 0000 0301"), "0000 0300 0000 0301");
ok(hexNFC("0000 0301 0000 0300"), "0000 0301 0000 0300");

# A combining mark before the base letter does not stop that letter from
# composing with the mark that follows it.
ok(hexNFC("0327 0061 0300"), "0327 00E0");
ok(hexNFC("0301 0061 0300"), "0301 00E0");
ok(hexNFC("0315 0061 0300"), "0315 00E0");
ok(hexNFC("0000 0327 0061 0300"), "0000 0327 00E0");
ok(hexNFC("0000 0301 0061 0300"), "0000 0301 00E0");
ok(hexNFC("0000 0315 0061 0300"), "0000 0315 00E0");

# 64 tests in total
