xref: /openbsd/gnu/usr.bin/perl/cpan/Encode/t/Aliases.t (revision 8932bfb7)
1#!../perl
2
3BEGIN {
4    if ($ENV{'PERL_CORE'}){
5    chdir 't';
6    unshift @INC, '../lib';
7    }
8    require Config; import Config;
9    if ($Config{'extensions'} !~ /\bEncode\b/) {
10    print "1..0 # Skip: Encode was not built\n";
11        exit 0;
12    }
13}
14
15use strict;
16use Encode;
17use Encode::Alias;
18my %a2c;
19my $ON_EBCDIC;
20
21sub init_a2c{
22    %a2c = (
23        'US-ascii' => 'ascii',
24        'ISO-646-US' => 'ascii',
25        'UTF-8'    => 'utf-8-strict',
26        'en_US.UTF-8'    => 'utf-8-strict',
27        'UCS-2'    => 'UCS-2BE',
28        'UCS2'     => 'UCS-2BE',
29        'iso-10646-1' => 'UCS-2BE',
30        'ucs2-le'  => 'UCS-2LE',
31        'ucs2-be'  => 'UCS-2BE',
32        'utf16'    => 'UTF-16',
33        'utf32'    => 'UTF-32',
34        'utf16-be'  => 'UTF-16BE',
35        'utf32-be'  => 'UTF-32BE',
36        'utf16-le'  => 'UTF-16LE',
37        'utf32-le'  => 'UTF-32LE',
38        'UCS4-BE'   => 'UTF-32BE',
39        'UCS-4-LE'  => 'UTF-32LE',
40        'cyrillic' => 'iso-8859-5',
41        'arabic'   => 'iso-8859-6',
42        'greek'    => 'iso-8859-7',
43        'hebrew'   => 'iso-8859-8',
44        'thai'     => 'iso-8859-11',
45        'tis620'   => 'iso-8859-11',
46        'tis-620'   => 'iso-8859-11',
47        'WinLatin1'     => 'cp1252',
48        'WinLatin2'     => 'cp1250',
49        'WinCyrillic'   => 'cp1251',
50        'WinGreek'      => 'cp1253',
51        'WinTurkish'    => 'cp1254',
52        'WinHebrew'     => 'cp1255',
53        'WinArabic'     => 'cp1256',
54        'WinBaltic'     => 'cp1257',
55        'WinVietnamese' => 'cp1258',
56	'Macintosh'     => 'MacRoman',
57        'koi8r'         => 'koi8-r',
58        'koi8u'         => 'koi8-u',
59        'ja_JP.euc'	    => $ON_EBCDIC ? '' : 'euc-jp',
60        'x-euc-jp'	    => $ON_EBCDIC ? '' : 'euc-jp',
61        'zh_CN.euc'	    => $ON_EBCDIC ? '' : 'euc-cn',
62        'x-euc-cn'	    => $ON_EBCDIC ? '' : 'euc-cn',
63        'ko_KR.euc'	    => $ON_EBCDIC ? '' : 'euc-kr',
64        'x-euc-kr'	    => $ON_EBCDIC ? '' : 'euc-kr',
65        'ujis'	    => $ON_EBCDIC ? '' : 'euc-jp',
66        'Shift_JIS'	    => $ON_EBCDIC ? '' : 'shiftjis',
67        'x-sjis'	    => $ON_EBCDIC ? '' : 'shiftjis',
68        'jis'	    => $ON_EBCDIC ? '' : '7bit-jis',
69        'big-5'	    => $ON_EBCDIC ? '' : 'big5-eten',
70        'zh_TW.Big5'    => $ON_EBCDIC ? '' : 'big5-eten',
71        'tca-big5'	    => $ON_EBCDIC ? '' : 'big5-eten',
72        'big5-hk'	    => $ON_EBCDIC ? '' : 'big5-hkscs',
73        'hkscs-big5'    => $ON_EBCDIC ? '' : 'big5-hkscs',
74        'GB_2312-80'    => $ON_EBCDIC ? '' : 'euc-cn',
75        'KS_C_5601-1987'    => $ON_EBCDIC ? '' : 'cp949',
76        #
77        'gb12345-raw'   => $ON_EBCDIC ? '' : 'gb12345-raw',
78        'gb2312-raw'    => $ON_EBCDIC ? '' : 'gb2312-raw',
79        'jis0201-raw'   => $ON_EBCDIC ? '' : 'jis0201-raw',
80        'jis0208-raw'   => $ON_EBCDIC ? '' : 'jis0208-raw',
81        'jis0212-raw'   => $ON_EBCDIC ? '' : 'jis0212-raw',
82        'ksc5601-raw'   => $ON_EBCDIC ? '' : 'ksc5601-raw',
83       );
84
85    for my $i (1..11,13..16){
86    $a2c{"ISO 8859 $i"} = "iso-8859-$i";
87    }
88    for my $i (1..10){
89    $a2c{"ISO Latin $i"} = "iso-8859-$Encode::Alias::Latin2iso[$i]";
90    }
91    for my $k (keys %Encode::Alias::Winlatin2cp){
92    my $v = $Encode::Alias::Winlatin2cp{$k};
93    $a2c{"Win" . ucfirst($k)} = "cp" . $v;
94    $a2c{"IBM-$v"} = $a2c{"MS-$v"} = "cp" . $v;
95    $a2c{"cp-" . $v} = "cp" . $v;
96    }
97    my @a2c = keys %a2c;
98    for my $k (@a2c){
99    $a2c{uc($k)} = $a2c{$k};
100    $a2c{lc($k)} = $a2c{$k};
101    $a2c{lcfirst($k)} = $a2c{$k};
102    $a2c{ucfirst($k)} = $a2c{$k};
103    }
104}
105
106BEGIN{
107    $ON_EBCDIC = ord("A") == 193;
108    @ARGV and $ON_EBCDIC = $ARGV[0] eq 'EBCDIC';
109    $Encode::ON_EBCDIC = $ON_EBCDIC;
110    init_a2c();
111}
112
113if ($ON_EBCDIC){
114    delete @Encode::ExtModule{
115    qw(euc-cn gb2312 gb12345 gbk cp936 iso-ir-165 MacChineseSimp
116       euc-jp iso-2022-jp 7bit-jis shiftjis MacJapanese cp932
117       euc-kr ksc5601 cp949 MacKorean
118       big5	big5-hkscs cp950 MacChineseTrad
119       gb18030 big5plus euc-tw)
120    };
121}
122
123use Test::More tests => (scalar keys %a2c) * 4;
124
125print "# alias test;  \$ON_EBCDIC == $ON_EBCDIC\n";
126
127foreach my $a (keys %a2c){
128    print "# $a => $a2c{$a}\n";
129    my $e = Encode::find_encoding($a);
130    is((defined($e) and $e->name), $a2c{$a},$a)
131    or warn "alias was $a";;
132}
133
134# now we override some of the aliases and see if it works fine
135
136define_alias(
137         qr/ascii/i    => 'WinLatin1',
138         qr/cyrillic/i => 'WinCyrillic',
139         qr/arabic/i   => 'WinArabic',
140         qr/greek/i    => 'WinGreek',
141         qr/hebrew/i   => 'WinHebrew'
142        );
143
144print "# alias test with alias overrides\n";
145
146foreach my $a (keys %a2c){
147    print "# $a => $a2c{$a}\n";
148    my $e = Encode::find_encoding($a);
149    is((defined($e) and $e->name), $a2c{$a}, "Override $a")
150    or warn "alias was $a";
151}
152
153print "# alias undef test\n";
154
155Encode::Alias->undef_aliases;
156foreach my $a (keys %a2c){
157    my $e = Encode::find_encoding($a);
158    ok(!defined($e) || $e->name =~ /-raw$/o,"Undef $a")
159    or warn "alias was $a";
160}
161
162print "# alias reinit test\n";
163
164Encode::Alias->init_aliases;
165init_a2c();
166foreach my $a (keys %a2c){
167    my $e = Encode::find_encoding($a);
168    is((defined($e) and $e->name), $a2c{$a}, "Reinit $a")
169    or warn "alias was $a";
170}
171__END__
172for my $k (keys %a2c){
173    $k =~ /[A-Z]/ and next;
174    print "$k => $a2c{$k}\n";
175}
176
177
178
179