1#!../perl 2 3BEGIN { 4 if ($ENV{'PERL_CORE'}){ 5 chdir 't'; 6 unshift @INC, '../lib'; 7 } 8 require Config; import Config; 9 if ($Config{'extensions'} !~ /\bEncode\b/) { 10 print "1..0 # Skip: Encode was not built\n"; 11 exit 0; 12 } 13} 14 15use strict; 16use Encode; 17use Encode::Alias; 18my %a2c; 19my @override_tests; 20my $ON_EBCDIC; 21 22sub init_a2c{ 23 %a2c = ( 24 'US-ascii' => 'ascii', 25 'ISO-646-US' => 'ascii', 26 'UTF-8' => 'utf-8-strict', 27 'en_US.UTF-8' => 'utf-8-strict', 28 'UCS-2' => 'UCS-2BE', 29 'UCS2' => 'UCS-2BE', 30 'iso-10646-1' => 'UCS-2BE', 31 'ucs2-le' => 'UCS-2LE', 32 'ucs2-be' => 'UCS-2BE', 33 'utf16' => 'UTF-16', 34 'utf32' => 'UTF-32', 35 'utf16-be' => 'UTF-16BE', 36 'utf32-be' => 'UTF-32BE', 37 'utf16-le' => 'UTF-16LE', 38 'utf32-le' => 'UTF-32LE', 39 'UCS4-BE' => 'UTF-32BE', 40 'UCS-4-LE' => 'UTF-32LE', 41 'cyrillic' => 'iso-8859-5', 42 'arabic' => 'iso-8859-6', 43 'greek' => 'iso-8859-7', 44 'hebrew' => 'iso-8859-8', 45 'thai' => 'iso-8859-11', 46 'tis620' => 'iso-8859-11', 47 'tis-620' => 'iso-8859-11', 48 'WinLatin1' => 'cp1252', 49 'WinLatin2' => 'cp1250', 50 'WinCyrillic' => 'cp1251', 51 'WinGreek' => 'cp1253', 52 'WinTurkish' => 'cp1254', 53 'WinHebrew' => 'cp1255', 54 'WinArabic' => 'cp1256', 55 'WinBaltic' => 'cp1257', 56 'WinVietnamese' => 'cp1258', 57 'Macintosh' => 'MacRoman', 58 'koi8r' => 'koi8-r', 59 'koi8u' => 'koi8-u', 60 'ja_JP.euc' => $ON_EBCDIC ? '' : 'euc-jp', 61 'x-euc-jp' => $ON_EBCDIC ? '' : 'euc-jp', 62 'zh_CN.euc' => $ON_EBCDIC ? '' : 'euc-cn', 63 'x-euc-cn' => $ON_EBCDIC ? '' : 'euc-cn', 64 'ko_KR.euc' => $ON_EBCDIC ? '' : 'euc-kr', 65 'x-euc-kr' => $ON_EBCDIC ? '' : 'euc-kr', 66 'ujis' => $ON_EBCDIC ? '' : 'euc-jp', 67 'Shift_JIS' => $ON_EBCDIC ? '' : 'shiftjis', 68 'x-sjis' => $ON_EBCDIC ? '' : 'shiftjis', 69 'jis' => $ON_EBCDIC ? '' : '7bit-jis', 70 'big-5' => $ON_EBCDIC ? '' : 'big5-eten', 71 'zh_TW.Big5' => $ON_EBCDIC ? '' : 'big5-eten', 72 'tca-big5' => $ON_EBCDIC ? '' : 'big5-eten', 73 'big5-hk' => $ON_EBCDIC ? '' : 'big5-hkscs', 74 'hkscs-big5' => $ON_EBCDIC ? '' : 'big5-hkscs', 75 'GB_2312-80' => $ON_EBCDIC ? '' : 'euc-cn', 76 'KS_C_5601-1987' => $ON_EBCDIC ? '' : 'cp949', 77 # 78 'gb12345-raw' => $ON_EBCDIC ? '' : 'gb12345-raw', 79 'gb2312-raw' => $ON_EBCDIC ? '' : 'gb2312-raw', 80 'jis0201-raw' => $ON_EBCDIC ? '' : 'jis0201-raw', 81 'jis0208-raw' => $ON_EBCDIC ? '' : 'jis0208-raw', 82 'jis0212-raw' => $ON_EBCDIC ? '' : 'jis0212-raw', 83 'ksc5601-raw' => $ON_EBCDIC ? '' : 'ksc5601-raw', 84 'cp65000' => 'UTF-7', 85 'cp65001' => 'utf-8-strict', 86 ); 87 88 for my $i (1..11,13..16){ 89 $a2c{"ISO 8859 $i"} = "iso-8859-$i"; 90 } 91 for my $i (1..10){ 92 $a2c{"ISO Latin $i"} = "iso-8859-$Encode::Alias::Latin2iso[$i]"; 93 } 94 for my $k (keys %Encode::Alias::Winlatin2cp){ 95 my $v = $Encode::Alias::Winlatin2cp{$k}; 96 $a2c{"Win" . ucfirst($k)} = "cp" . $v; 97 $a2c{"IBM-$v"} = $a2c{"MS-$v"} = "cp" . $v; 98 $a2c{"cp-" . $v} = "cp" . $v; 99 } 100 my @a2c = keys %a2c; 101 for my $k (@a2c){ 102 $a2c{uc($k)} = $a2c{$k}; 103 $a2c{lc($k)} = $a2c{$k}; 104 $a2c{lcfirst($k)} = $a2c{$k}; 105 $a2c{ucfirst($k)} = $a2c{$k}; 106 } 107} 108 109BEGIN{ 110 $ON_EBCDIC = ord("A") == 193; 111 @ARGV and $ON_EBCDIC = $ARGV[0] eq 'EBCDIC'; 112 $Encode::ON_EBCDIC = $ON_EBCDIC; 113 init_a2c(); 114 @override_tests = qw( 115 myascii:cp1252 116 mygreek:cp1253 117 myhebrew:iso-8859-2 118 myarabic:cp1256 119 ueightsomething:utf-8-strict 120 unknown: 121 ); 122} 123 124if ($ON_EBCDIC){ 125 delete @Encode::ExtModule{ 126 qw(euc-cn gb2312 gb12345 gbk cp936 iso-ir-165 MacChineseSimp 127 euc-jp iso-2022-jp 7bit-jis shiftjis MacJapanese cp932 128 euc-kr ksc5601 cp949 MacKorean 129 big5 big5-hkscs cp950 MacChineseTrad 130 gb18030 big5plus euc-tw) 131 }; 132} 133 134use Test::More tests => (scalar keys %a2c) * 3 + @override_tests; 135 136print "# alias test; \$ON_EBCDIC == $ON_EBCDIC\n"; 137 138foreach my $a (keys %a2c){ 139 print "# $a => $a2c{$a}\n"; 140 my $e = Encode::find_encoding($a); 141 is((defined($e) and $e->name), $a2c{$a},$a) 142 or warn "alias was $a";; 143} 144 145# now we override some of the aliases and see if it works fine 146 147define_alias( 148 qr/ascii/i => '"WinLatin1"', 149 qr/cyrillic/i => '"WinCyrillic"', 150 qr/arabic/i => '"WinArabic"', 151 qr/greek/i => '"WinGreek"', 152 qr/hebrew/i => '"WinHebrew"' 153 ); 154 155Encode::find_encoding("myhebrew"); # polute alias cache 156 157define_alias( sub { 158 my $enc = shift; 159 return "iso-8859-2" if $enc =~ /hebrew/i; 160 return "does-not-exist" if $enc =~ /arabic/i; # should then use other override alias 161 return "utf-8" if $enc =~ /eight/i; 162 return "unknown"; 163}); 164 165print "# alias test with alias overrides\n"; 166 167for my $test (@override_tests) { 168 my($a, $c) = split /:/, $test; 169 my $e = Encode::find_encoding($a); 170 is((defined($e) and $e->name), $c, $a); 171} 172 173print "# alias undef test\n"; 174 175Encode::Alias->undef_aliases; 176foreach my $a (keys %a2c){ 177 my $e = Encode::find_encoding($a); 178 ok(!defined($e) || $e->name =~ /-raw$/o,"Undef $a") 179 or warn "alias was $a"; 180} 181 182print "# alias reinit test\n"; 183 184Encode::Alias->init_aliases; 185init_a2c(); 186foreach my $a (keys %a2c){ 187 my $e = Encode::find_encoding($a); 188 is((defined($e) and $e->name), $a2c{$a}, "Reinit $a") 189 or warn "alias was $a"; 190} 191__END__ 192for my $k (keys %a2c){ 193 $k =~ /[A-Z]/ and next; 194 print "$k => $a2c{$k}\n"; 195} 196 197 198 199