1#!../perl 2 3BEGIN { 4 if ($ENV{'PERL_CORE'}){ 5 chdir 't'; 6 unshift @INC, '../lib'; 7 } 8 require Config; import Config; 9 if ($Config{'extensions'} !~ /\bEncode\b/) { 10 print "1..0 # Skip: Encode was not built\n"; 11 exit 0; 12 } 13} 14 15use strict; 16use Encode; 17use Encode::Alias; 18my %a2c; 19my @override_tests; 20my $ON_EBCDIC; 21 22sub init_a2c{ 23 %a2c = ( 24 'US-ascii' => 'ascii', 25 'ISO-646-US' => 'ascii', 26 'UTF-8' => 'utf-8-strict', 27 'en_US.UTF-8' => 'utf-8-strict', 28 'UCS-2' => 'UCS-2BE', 29 'UCS2' => 'UCS-2BE', 30 'iso-10646-1' => 'UCS-2BE', 31 'ucs2-le' => 'UCS-2LE', 32 'ucs2-be' => 'UCS-2BE', 33 'utf16' => 'UTF-16', 34 'utf32' => 'UTF-32', 35 'utf16-be' => 'UTF-16BE', 36 'utf32-be' => 'UTF-32BE', 37 'utf16-le' => 'UTF-16LE', 38 'utf32-le' => 'UTF-32LE', 39 'UCS4-BE' => 'UTF-32BE', 40 'UCS-4-LE' => 'UTF-32LE', 41 'cyrillic' => 'iso-8859-5', 42 'arabic' => 'iso-8859-6', 43 'greek' => 'iso-8859-7', 44 'hebrew' => 'iso-8859-8', 45 'thai' => 'iso-8859-11', 46 'tis620' => 'iso-8859-11', 47 'tis-620' => 'iso-8859-11', 48 'WinLatin1' => 'cp1252', 49 'WinLatin2' => 'cp1250', 50 'WinCyrillic' => 'cp1251', 51 'WinGreek' => 'cp1253', 52 'WinTurkish' => 'cp1254', 53 'WinHebrew' => 'cp1255', 54 'WinArabic' => 'cp1256', 55 'WinBaltic' => 'cp1257', 56 'WinVietnamese' => 'cp1258', 57 'Macintosh' => 'MacRoman', 58 'koi8r' => 'koi8-r', 59 'koi8u' => 'koi8-u', 60 'ja_JP.euc' => $ON_EBCDIC ? '' : 'euc-jp', 61 'x-euc-jp' => $ON_EBCDIC ? '' : 'euc-jp', 62 'zh_CN.euc' => $ON_EBCDIC ? '' : 'euc-cn', 63 'x-euc-cn' => $ON_EBCDIC ? '' : 'euc-cn', 64 'ko_KR.euc' => $ON_EBCDIC ? '' : 'euc-kr', 65 'x-euc-kr' => $ON_EBCDIC ? '' : 'euc-kr', 66 'ujis' => $ON_EBCDIC ? '' : 'euc-jp', 67 'Shift_JIS' => $ON_EBCDIC ? '' : 'shiftjis', 68 'x-sjis' => $ON_EBCDIC ? '' : 'shiftjis', 69 'jis' => $ON_EBCDIC ? '' : '7bit-jis', 70 'big-5' => $ON_EBCDIC ? '' : 'big5-eten', 71 'zh_TW.Big5' => $ON_EBCDIC ? '' : 'big5-eten', 72 'tca-big5' => $ON_EBCDIC ? '' : 'big5-eten', 73 'big5-hk' => $ON_EBCDIC ? '' : 'big5-hkscs', 74 'hkscs-big5' => $ON_EBCDIC ? '' : 'big5-hkscs', 75 'GB_2312-80' => $ON_EBCDIC ? '' : 'euc-cn', 76 'KS_C_5601-1987' => $ON_EBCDIC ? '' : 'cp949', 77 # 78 'gb12345-raw' => $ON_EBCDIC ? '' : 'gb12345-raw', 79 'gb2312-raw' => $ON_EBCDIC ? '' : 'gb2312-raw', 80 'jis0201-raw' => $ON_EBCDIC ? '' : 'jis0201-raw', 81 'jis0208-raw' => $ON_EBCDIC ? '' : 'jis0208-raw', 82 'jis0212-raw' => $ON_EBCDIC ? '' : 'jis0212-raw', 83 'ksc5601-raw' => $ON_EBCDIC ? '' : 'ksc5601-raw', 84 ); 85 86 for my $i (1..11,13..16){ 87 $a2c{"ISO 8859 $i"} = "iso-8859-$i"; 88 } 89 for my $i (1..10){ 90 $a2c{"ISO Latin $i"} = "iso-8859-$Encode::Alias::Latin2iso[$i]"; 91 } 92 for my $k (keys %Encode::Alias::Winlatin2cp){ 93 my $v = $Encode::Alias::Winlatin2cp{$k}; 94 $a2c{"Win" . ucfirst($k)} = "cp" . $v; 95 $a2c{"IBM-$v"} = $a2c{"MS-$v"} = "cp" . $v; 96 $a2c{"cp-" . $v} = "cp" . $v; 97 } 98 my @a2c = keys %a2c; 99 for my $k (@a2c){ 100 $a2c{uc($k)} = $a2c{$k}; 101 $a2c{lc($k)} = $a2c{$k}; 102 $a2c{lcfirst($k)} = $a2c{$k}; 103 $a2c{ucfirst($k)} = $a2c{$k}; 104 } 105} 106 107BEGIN{ 108 $ON_EBCDIC = ord("A") == 193; 109 @ARGV and $ON_EBCDIC = $ARGV[0] eq 'EBCDIC'; 110 $Encode::ON_EBCDIC = $ON_EBCDIC; 111 init_a2c(); 112 @override_tests = qw( 113 myascii:cp1252 114 mygreek:cp1253 115 myhebrew:iso-8859-2 116 myarabic:cp1256 117 ueightsomething:utf-8-strict 118 unknown: 119 ); 120} 121 122if ($ON_EBCDIC){ 123 delete @Encode::ExtModule{ 124 qw(euc-cn gb2312 gb12345 gbk cp936 iso-ir-165 MacChineseSimp 125 euc-jp iso-2022-jp 7bit-jis shiftjis MacJapanese cp932 126 euc-kr ksc5601 cp949 MacKorean 127 big5 big5-hkscs cp950 MacChineseTrad 128 gb18030 big5plus euc-tw) 129 }; 130} 131 132use Test::More tests => (scalar keys %a2c) * 3 + @override_tests; 133 134print "# alias test; \$ON_EBCDIC == $ON_EBCDIC\n"; 135 136foreach my $a (keys %a2c){ 137 print "# $a => $a2c{$a}\n"; 138 my $e = Encode::find_encoding($a); 139 is((defined($e) and $e->name), $a2c{$a},$a) 140 or warn "alias was $a";; 141} 142 143# now we override some of the aliases and see if it works fine 144 145define_alias( 146 qr/ascii/i => '"WinLatin1"', 147 qr/cyrillic/i => '"WinCyrillic"', 148 qr/arabic/i => '"WinArabic"', 149 qr/greek/i => '"WinGreek"', 150 qr/hebrew/i => '"WinHebrew"' 151 ); 152 153Encode::find_encoding("myhebrew"); # polute alias cache 154 155define_alias( sub { 156 my $enc = shift; 157 return "iso-8859-2" if $enc =~ /hebrew/i; 158 return "does-not-exist" if $enc =~ /arabic/i; # should then use other override alias 159 return "utf-8" if $enc =~ /eight/i; 160 return; 161}); 162 163print "# alias test with alias overrides\n"; 164 165for my $test (@override_tests) { 166 my($a, $c) = split /:/, $test; 167 my $e = Encode::find_encoding($a); 168 is((defined($e) and $e->name), $c, $a); 169} 170 171print "# alias undef test\n"; 172 173Encode::Alias->undef_aliases; 174foreach my $a (keys %a2c){ 175 my $e = Encode::find_encoding($a); 176 ok(!defined($e) || $e->name =~ /-raw$/o,"Undef $a") 177 or warn "alias was $a"; 178} 179 180print "# alias reinit test\n"; 181 182Encode::Alias->init_aliases; 183init_a2c(); 184foreach my $a (keys %a2c){ 185 my $e = Encode::find_encoding($a); 186 is((defined($e) and $e->name), $a2c{$a}, "Reinit $a") 187 or warn "alias was $a"; 188} 189__END__ 190for my $k (keys %a2c){ 191 $k =~ /[A-Z]/ and next; 192 print "$k => $a2c{$k}\n"; 193} 194 195 196 197