# Tests for Unicode::Normalize::normalize(): form-name aliases, empty and
# ASCII input, non-modification of the caller's string, canonical
# reordering/composition of combining marks, Hangul syllables, and the
# sequences from Unicode Public Review Issue #29.
#
# The script prints its own plan ("1..64") and relies on the helper
# Unicode::Normalize::ok() for the individual result lines.

BEGIN {
    # When $ENV{PERL_CORE} is set, run from t/ (if that directory exists)
    # and replace @INC with the relative lib directory: '::lib' on MacOS,
    # '../lib' everywhere else.
    if ($ENV{PERL_CORE}) {
        chdir('t') if -d 't';
        @INC = $^O eq 'MacOS' ? qw(::lib) : qw(../lib);
    }
}

#########################

use strict;
use warnings;

# Turn on autoflush and print the plan at compile time, before any test runs.
BEGIN { $| = 1; print "1..64\n"; }

# Test counter; a reference to it is handed to Unicode::Normalize::ok().
my $count = 0;

# Called below as ok(VALUE) or ok(GOT, EXPECTED).  Forwards to
# Unicode::Normalize::ok(), which is not defined in this file; presumably it
# advances the counter and prints the "ok"/"not ok" line -- confirm there.
# NOTE(review): this wrapper is declared ahead of the `use` line, exactly as
# in the original layout; keep that order unless the effect of moving it has
# been checked.
sub ok { Unicode::Normalize::ok(\$count, @_) }

use Unicode::Normalize qw(normalize);

ok(1);

# Thin wrappers around the module's test helpers.  As used below, _pack_U
# turns a list of code point numbers into the string passed to normalize(),
# and _unpack_U turns a string back into a list of numbers.
sub _pack_U   { Unicode::Normalize::dot_t_pack_U(@_) }
sub _unpack_U { Unicode::Normalize::dot_t_unpack_U(@_) }

#########################

# Empty and plain-ASCII input must come back unchanged, under both the short
# form names (D, C, KD, KC) and the long ones (NFD, NFC, NFKD, NFKC).
for my $form_names ([qw(D C KD KC)], [qw(NFD NFC NFKD NFKC)]) {
    for my $text ("", "A") {
        for my $form (@$form_names) {
            ok(normalize($form, $text), $text);
        }
    }
}

# 17

# don't modify the source
# Each case: form name, input string, expected normalized result.  Two tests
# per case: the returned value, then the input variable still holding its
# original contents.
for my $case (
    [ 'NFD',  "\x{FA19}", "\x{795E}" ],
    [ 'NFC',  "\x{FA1B}", "\x{798F}" ],
    [ 'NFKD', "\x{FA1E}", "\x{7FBD}" ],
    [ 'NFKC', "\x{FA26}", "\x{90FD}" ],
) {
    my ($form, $original, $expected) = @$case;
    my $source = $original;
    ok(normalize($form, $source), $expected);
    ok($source, $original);
}

# 25

# Shared implementation of hexNFC()/hexNFD().
#   $form       - form name handed to normalize() ('C' or 'D' here)
#   $hex_string - whitespace-separated hexadecimal code points
# Returns the normalized code points as space-separated, upper-case hex,
# each zero-padded to at least four digits.
sub _hex_normalize {
    my ($form, $hex_string) = @_;
    my @code_points = map { hex $_ } split ' ', $hex_string;
    my $normalized  = normalize($form, _pack_U(@code_points));
    return join " ", map { sprintf("%04X", $_) } _unpack_U($normalized);
}

# hexNFC("0061 0300") -> "00E0": normalize form 'C' on hex code points.
sub hexNFC { return _hex_normalize('C', shift) }

# hexNFD("00E0") -> "0061 0300": normalize form 'D' on hex code points.
sub hexNFD { return _hex_normalize('D', shift) }

# Maps the form letter used in the case tables to the function under test.
my %hex_normalizer = (C => \&hexNFC, D => \&hexNFD);

# Runs one test per case; each case is [ FORM_LETTER, INPUT_HEX, EXPECTED_HEX ].
sub _run_hex_cases {
    for my $case (@_) {
        my ($form, $input, $expected) = @$case;
        ok($hex_normalizer{$form}->($input), $expected);
    }
}

_run_hex_cases(
    [ D => "1E14 AC01", "0045 0304 0300 1100 1161 11A8" ],
    [ D => "AC00 AE00", "1100 1161 1100 1173 11AF" ],

    [ C => "0061 0315 0300 05AE 05C4 0062", "00E0 05AE 05C4 0315 0062" ],
    [ C => "00E0 05AE 05C4 0315 0062",      "00E0 05AE 05C4 0315 0062" ],
    [ C => "0061 05AE 0300 05C4 0315 0062", "00E0 05AE 05C4 0315 0062" ],
    [ C => "0045 0304 0300 AC00 11A8",      "1E14 AC01" ],
    [ C => "1100 1161 1100 1173 11AF",      "AC00 AE00" ],
    [ C => "1100 0300 1161 1173 11AF",      "1100 0300 1161 1173 11AF" ],

    [ D => "0061 0315 0300 05AE 05C4 0062", "0061 05AE 0300 05C4 0315 0062" ],
    [ D => "00E0 05AE 05C4 0315 0062",      "0061 05AE 0300 05C4 0315 0062" ],
    [ D => "0061 05AE 0300 05C4 0315 0062", "0061 05AE 0300 05C4 0315 0062" ],
    [ C => "0061 05C4 0315 0300 05AE 0062", "0061 05AE 05C4 0300 0315 0062" ],
    [ C => "0061 05AE 05C4 0300 0315 0062", "0061 05AE 05C4 0300 0315 0062" ],
    [ D => "0061 05C4 0315 0300 05AE 0062", "0061 05AE 05C4 0300 0315 0062" ],
    [ D => "0061 05AE 05C4 0300 0315 0062", "0061 05AE 05C4 0300 0315 0062" ],
    [ C => "0000 0041 0000 0000",           "0000 0041 0000 0000" ],
    [ D => "0000 0041 0000 0000",           "0000 0041 0000 0000" ],

    [ C => "AC00 11A7", "AC00 11A7" ],
    [ C => "AC00 11A8", "AC01" ],
    [ C => "AC00 11A9", "AC02" ],
    [ C => "AC00 11C2", "AC1B" ],
    [ C => "AC00 11C3", "AC00 11C3" ],
);

# 47

# Test Cases from Public Review Issue #29: Normalization Issue
# cf. http://www.unicode.org/review/pr-29.html
_run_hex_cases(
    [ C => "0B47 0300 0B3E",      "0B47 0300 0B3E" ],
    [ C => "1100 0300 1161",      "1100 0300 1161" ],
    [ C => "0B47 0B3E 0300",      "0B4B 0300" ],
    [ C => "1100 1161 0300",      "AC00 0300" ],
    [ C => "0B47 0300 0B3E 0327", "0B47 0300 0B3E 0327" ],
    [ C => "1100 0300 1161 0327", "1100 0300 1161 0327" ],

    [ C => "0300 0041",           "0300 0041" ],
    [ C => "0300 0301 0041",      "0300 0301 0041" ],
    [ C => "0301 0300 0041",      "0301 0300 0041" ],
    [ C => "0000 0300 0000 0301", "0000 0300 0000 0301" ],
    [ C => "0000 0301 0000 0300", "0000 0301 0000 0300" ],

    [ C => "0327 0061 0300",      "0327 00E0" ],
    [ C => "0301 0061 0300",      "0301 00E0" ],
    [ C => "0315 0061 0300",      "0315 00E0" ],
    [ C => "0000 0327 0061 0300", "0000 0327 00E0" ],
    [ C => "0000 0301 0061 0300", "0000 0301 00E0" ],
    [ C => "0000 0315 0061 0300", "0000 0315 00E0" ],
);

# 64