1#!../perl
2
3BEGIN {
4    if ($ENV{'PERL_CORE'}){
5    chdir 't';
6    unshift @INC, '../lib';
7    }
8    require Config; import Config;
9    if ($Config{'extensions'} !~ /\bEncode\b/) {
10    print "1..0 # Skip: Encode was not built\n";
11        exit 0;
12    }
13}
14
15use strict;
16use Encode;
17use Encode::Alias;
18my %a2c;
19my @override_tests;
20my $ON_EBCDIC;
21
22sub init_a2c{
23    %a2c = (
24        'US-ascii' => 'ascii',
25        'ISO-646-US' => 'ascii',
26        'UTF-8'    => 'utf-8-strict',
27        'en_US.UTF-8'    => 'utf-8-strict',
28        'UCS-2'    => 'UCS-2BE',
29        'UCS2'     => 'UCS-2BE',
30        'iso-10646-1' => 'UCS-2BE',
31        'ucs2-le'  => 'UCS-2LE',
32        'ucs2-be'  => 'UCS-2BE',
33        'utf16'    => 'UTF-16',
34        'utf32'    => 'UTF-32',
35        'utf16-be'  => 'UTF-16BE',
36        'utf32-be'  => 'UTF-32BE',
37        'utf16-le'  => 'UTF-16LE',
38        'utf32-le'  => 'UTF-32LE',
39        'UCS4-BE'   => 'UTF-32BE',
40        'UCS-4-LE'  => 'UTF-32LE',
41        'cyrillic' => 'iso-8859-5',
42        'arabic'   => 'iso-8859-6',
43        'greek'    => 'iso-8859-7',
44        'hebrew'   => 'iso-8859-8',
45        'thai'     => 'iso-8859-11',
46        'tis620'   => 'iso-8859-11',
47        'tis-620'   => 'iso-8859-11',
48        'WinLatin1'     => 'cp1252',
49        'WinLatin2'     => 'cp1250',
50        'WinCyrillic'   => 'cp1251',
51        'WinGreek'      => 'cp1253',
52        'WinTurkish'    => 'cp1254',
53        'WinHebrew'     => 'cp1255',
54        'WinArabic'     => 'cp1256',
55        'WinBaltic'     => 'cp1257',
56        'WinVietnamese' => 'cp1258',
57	'Macintosh'     => 'MacRoman',
58        'koi8r'         => 'koi8-r',
59        'koi8u'         => 'koi8-u',
60        'ja_JP.euc'	    => $ON_EBCDIC ? '' : 'euc-jp',
61        'x-euc-jp'	    => $ON_EBCDIC ? '' : 'euc-jp',
62        'zh_CN.euc'	    => $ON_EBCDIC ? '' : 'euc-cn',
63        'x-euc-cn'	    => $ON_EBCDIC ? '' : 'euc-cn',
64        'ko_KR.euc'	    => $ON_EBCDIC ? '' : 'euc-kr',
65        'x-euc-kr'	    => $ON_EBCDIC ? '' : 'euc-kr',
66        'ujis'	    => $ON_EBCDIC ? '' : 'euc-jp',
67        'Shift_JIS'	    => $ON_EBCDIC ? '' : 'shiftjis',
68        'x-sjis'	    => $ON_EBCDIC ? '' : 'shiftjis',
69        'jis'	    => $ON_EBCDIC ? '' : '7bit-jis',
70        'big-5'	    => $ON_EBCDIC ? '' : 'big5-eten',
71        'zh_TW.Big5'    => $ON_EBCDIC ? '' : 'big5-eten',
72        'tca-big5'	    => $ON_EBCDIC ? '' : 'big5-eten',
73        'big5-hk'	    => $ON_EBCDIC ? '' : 'big5-hkscs',
74        'hkscs-big5'    => $ON_EBCDIC ? '' : 'big5-hkscs',
75        'GB_2312-80'    => $ON_EBCDIC ? '' : 'euc-cn',
76        'KS_C_5601-1987'    => $ON_EBCDIC ? '' : 'cp949',
77        #
78        'gb12345-raw'   => $ON_EBCDIC ? '' : 'gb12345-raw',
79        'gb2312-raw'    => $ON_EBCDIC ? '' : 'gb2312-raw',
80        'jis0201-raw'   => $ON_EBCDIC ? '' : 'jis0201-raw',
81        'jis0208-raw'   => $ON_EBCDIC ? '' : 'jis0208-raw',
82        'jis0212-raw'   => $ON_EBCDIC ? '' : 'jis0212-raw',
83        'ksc5601-raw'   => $ON_EBCDIC ? '' : 'ksc5601-raw',
84        'cp65000' => 'UTF-7',
85        'cp65001' => 'utf-8-strict',
86       );
87
88    for my $i (1..11,13..16){
89    $a2c{"ISO 8859 $i"} = "iso-8859-$i";
90    }
91    for my $i (1..10){
92    $a2c{"ISO Latin $i"} = "iso-8859-$Encode::Alias::Latin2iso[$i]";
93    }
94    for my $k (keys %Encode::Alias::Winlatin2cp){
95    my $v = $Encode::Alias::Winlatin2cp{$k};
96    $a2c{"Win" . ucfirst($k)} = "cp" . $v;
97    $a2c{"IBM-$v"} = $a2c{"MS-$v"} = "cp" . $v;
98    $a2c{"cp-" . $v} = "cp" . $v;
99    }
100    my @a2c = keys %a2c;
101    for my $k (@a2c){
102    $a2c{uc($k)} = $a2c{$k};
103    $a2c{lc($k)} = $a2c{$k};
104    $a2c{lcfirst($k)} = $a2c{$k};
105    $a2c{ucfirst($k)} = $a2c{$k};
106    }
107}
108
109BEGIN{
110    $ON_EBCDIC = ord("A") == 193;
111    @ARGV and $ON_EBCDIC = $ARGV[0] eq 'EBCDIC';
112    $Encode::ON_EBCDIC = $ON_EBCDIC;
113    init_a2c();
114    @override_tests = qw(
115        myascii:cp1252
116        mygreek:cp1253
117        myhebrew:iso-8859-2
118        myarabic:cp1256
119        ueightsomething:utf-8-strict
120        unknown:
121    );
122}
123
124if ($ON_EBCDIC){
125    delete @Encode::ExtModule{
126    qw(euc-cn gb2312 gb12345 gbk cp936 iso-ir-165 MacChineseSimp
127       euc-jp iso-2022-jp 7bit-jis shiftjis MacJapanese cp932
128       euc-kr ksc5601 cp949 MacKorean
129       big5	big5-hkscs cp950 MacChineseTrad
130       gb18030 big5plus euc-tw)
131    };
132}
133
134use Test::More tests => (scalar keys %a2c) * 3 + @override_tests;
135
136print "# alias test;  \$ON_EBCDIC == $ON_EBCDIC\n";
137
138foreach my $a (keys %a2c){
139    print "# $a => $a2c{$a}\n";
140    my $e = Encode::find_encoding($a);
141    is((defined($e) and $e->name), $a2c{$a},$a)
142    or warn "alias was $a";;
143}
144
145# now we override some of the aliases and see if it works fine
146
147define_alias(
148         qr/ascii/i    => '"WinLatin1"',
149         qr/cyrillic/i => '"WinCyrillic"',
150         qr/arabic/i   => '"WinArabic"',
151         qr/greek/i    => '"WinGreek"',
152         qr/hebrew/i   => '"WinHebrew"'
153        );
154
155Encode::find_encoding("myhebrew");  # polute alias cache
156
157define_alias( sub {
158    my $enc = shift;
159    return "iso-8859-2"     if $enc =~ /hebrew/i;
160    return "does-not-exist" if $enc =~ /arabic/i;  # should then use other override alias
161    return "utf-8"          if $enc =~ /eight/i;
162    return "unknown";
163});
164
165print "# alias test with alias overrides\n";
166
167for my $test (@override_tests) {
168    my($a, $c) = split /:/, $test;
169    my $e = Encode::find_encoding($a);
170    is((defined($e) and $e->name), $c, $a);
171}
172
173print "# alias undef test\n";
174
175Encode::Alias->undef_aliases;
176foreach my $a (keys %a2c){
177    my $e = Encode::find_encoding($a);
178    ok(!defined($e) || $e->name =~ /-raw$/o,"Undef $a")
179    or warn "alias was $a";
180}
181
182print "# alias reinit test\n";
183
184Encode::Alias->init_aliases;
185init_a2c();
186foreach my $a (keys %a2c){
187    my $e = Encode::find_encoding($a);
188    is((defined($e) and $e->name), $a2c{$a}, "Reinit $a")
189    or warn "alias was $a";
190}
191__END__
192for my $k (keys %a2c){
193    $k =~ /[A-Z]/ and next;
194    print "$k => $a2c{$k}\n";
195}
196
197
198
199