|
Packit |
d0f5c2 |
#!../perl
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
BEGIN {
|
|
Packit |
d0f5c2 |
if ($ENV{'PERL_CORE'}){
|
|
Packit |
d0f5c2 |
chdir 't';
|
|
Packit |
d0f5c2 |
unshift @INC, '../lib';
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
require Config; import Config;
|
|
Packit |
d0f5c2 |
if ($Config{'extensions'} !~ /\bEncode\b/) {
|
|
Packit |
d0f5c2 |
print "1..0 # Skip: Encode was not built\n";
|
|
Packit |
d0f5c2 |
exit 0;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
use strict;
|
|
Packit |
d0f5c2 |
use Encode;
|
|
Packit |
d0f5c2 |
use Encode::Alias;
|
|
Packit |
d0f5c2 |
my %a2c;
|
|
Packit |
d0f5c2 |
my @override_tests;
|
|
Packit |
d0f5c2 |
my $ON_EBCDIC;
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
sub init_a2c{
|
|
Packit |
d0f5c2 |
%a2c = (
|
|
Packit |
d0f5c2 |
'US-ascii' => 'ascii',
|
|
Packit |
d0f5c2 |
'ISO-646-US' => 'ascii',
|
|
Packit |
d0f5c2 |
'UTF-8' => 'utf-8-strict',
|
|
Packit |
d0f5c2 |
'en_US.UTF-8' => 'utf-8-strict',
|
|
Packit |
d0f5c2 |
'UCS-2' => 'UCS-2BE',
|
|
Packit |
d0f5c2 |
'UCS2' => 'UCS-2BE',
|
|
Packit |
d0f5c2 |
'iso-10646-1' => 'UCS-2BE',
|
|
Packit |
d0f5c2 |
'ucs2-le' => 'UCS-2LE',
|
|
Packit |
d0f5c2 |
'ucs2-be' => 'UCS-2BE',
|
|
Packit |
d0f5c2 |
'utf16' => 'UTF-16',
|
|
Packit |
d0f5c2 |
'utf32' => 'UTF-32',
|
|
Packit |
d0f5c2 |
'utf16-be' => 'UTF-16BE',
|
|
Packit |
d0f5c2 |
'utf32-be' => 'UTF-32BE',
|
|
Packit |
d0f5c2 |
'utf16-le' => 'UTF-16LE',
|
|
Packit |
d0f5c2 |
'utf32-le' => 'UTF-32LE',
|
|
Packit |
d0f5c2 |
'UCS4-BE' => 'UTF-32BE',
|
|
Packit |
d0f5c2 |
'UCS-4-LE' => 'UTF-32LE',
|
|
Packit |
d0f5c2 |
'cyrillic' => 'iso-8859-5',
|
|
Packit |
d0f5c2 |
'arabic' => 'iso-8859-6',
|
|
Packit |
d0f5c2 |
'greek' => 'iso-8859-7',
|
|
Packit |
d0f5c2 |
'hebrew' => 'iso-8859-8',
|
|
Packit |
d0f5c2 |
'thai' => 'iso-8859-11',
|
|
Packit |
d0f5c2 |
'tis620' => 'iso-8859-11',
|
|
Packit |
d0f5c2 |
'tis-620' => 'iso-8859-11',
|
|
Packit |
d0f5c2 |
'WinLatin1' => 'cp1252',
|
|
Packit |
d0f5c2 |
'WinLatin2' => 'cp1250',
|
|
Packit |
d0f5c2 |
'WinCyrillic' => 'cp1251',
|
|
Packit |
d0f5c2 |
'WinGreek' => 'cp1253',
|
|
Packit |
d0f5c2 |
'WinTurkish' => 'cp1254',
|
|
Packit |
d0f5c2 |
'WinHebrew' => 'cp1255',
|
|
Packit |
d0f5c2 |
'WinArabic' => 'cp1256',
|
|
Packit |
d0f5c2 |
'WinBaltic' => 'cp1257',
|
|
Packit |
d0f5c2 |
'WinVietnamese' => 'cp1258',
|
|
Packit |
d0f5c2 |
'Macintosh' => 'MacRoman',
|
|
Packit |
d0f5c2 |
'koi8r' => 'koi8-r',
|
|
Packit |
d0f5c2 |
'koi8u' => 'koi8-u',
|
|
Packit |
d0f5c2 |
'ja_JP.euc' => $ON_EBCDIC ? '' : 'euc-jp',
|
|
Packit |
d0f5c2 |
'x-euc-jp' => $ON_EBCDIC ? '' : 'euc-jp',
|
|
Packit |
d0f5c2 |
'zh_CN.euc' => $ON_EBCDIC ? '' : 'euc-cn',
|
|
Packit |
d0f5c2 |
'x-euc-cn' => $ON_EBCDIC ? '' : 'euc-cn',
|
|
Packit |
d0f5c2 |
'ko_KR.euc' => $ON_EBCDIC ? '' : 'euc-kr',
|
|
Packit |
d0f5c2 |
'x-euc-kr' => $ON_EBCDIC ? '' : 'euc-kr',
|
|
Packit |
d0f5c2 |
'ujis' => $ON_EBCDIC ? '' : 'euc-jp',
|
|
Packit |
d0f5c2 |
'Shift_JIS' => $ON_EBCDIC ? '' : 'shiftjis',
|
|
Packit |
d0f5c2 |
'x-sjis' => $ON_EBCDIC ? '' : 'shiftjis',
|
|
Packit |
d0f5c2 |
'jis' => $ON_EBCDIC ? '' : '7bit-jis',
|
|
Packit |
d0f5c2 |
'big-5' => $ON_EBCDIC ? '' : 'big5-eten',
|
|
Packit |
d0f5c2 |
'zh_TW.Big5' => $ON_EBCDIC ? '' : 'big5-eten',
|
|
Packit |
d0f5c2 |
'tca-big5' => $ON_EBCDIC ? '' : 'big5-eten',
|
|
Packit |
d0f5c2 |
'big5-hk' => $ON_EBCDIC ? '' : 'big5-hkscs',
|
|
Packit |
d0f5c2 |
'hkscs-big5' => $ON_EBCDIC ? '' : 'big5-hkscs',
|
|
Packit |
d0f5c2 |
'GB_2312-80' => $ON_EBCDIC ? '' : 'euc-cn',
|
|
Packit |
d0f5c2 |
'KS_C_5601-1987' => $ON_EBCDIC ? '' : 'cp949',
|
|
Packit |
d0f5c2 |
#
|
|
Packit |
d0f5c2 |
'gb12345-raw' => $ON_EBCDIC ? '' : 'gb12345-raw',
|
|
Packit |
d0f5c2 |
'gb2312-raw' => $ON_EBCDIC ? '' : 'gb2312-raw',
|
|
Packit |
d0f5c2 |
'jis0201-raw' => $ON_EBCDIC ? '' : 'jis0201-raw',
|
|
Packit |
d0f5c2 |
'jis0208-raw' => $ON_EBCDIC ? '' : 'jis0208-raw',
|
|
Packit |
d0f5c2 |
'jis0212-raw' => $ON_EBCDIC ? '' : 'jis0212-raw',
|
|
Packit |
d0f5c2 |
'ksc5601-raw' => $ON_EBCDIC ? '' : 'ksc5601-raw',
|
|
Packit |
d0f5c2 |
'cp65000' => 'UTF-7',
|
|
Packit |
d0f5c2 |
'cp65001' => 'utf-8-strict',
|
|
Packit |
d0f5c2 |
);
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
for my $i (1..11,13..16){
|
|
Packit |
d0f5c2 |
$a2c{"ISO 8859 $i"} = "iso-8859-$i";
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
for my $i (1..10){
|
|
Packit |
d0f5c2 |
$a2c{"ISO Latin $i"} = "iso-8859-$Encode::Alias::Latin2iso[$i]";
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
for my $k (keys %Encode::Alias::Winlatin2cp){
|
|
Packit |
d0f5c2 |
my $v = $Encode::Alias::Winlatin2cp{$k};
|
|
Packit |
d0f5c2 |
$a2c{"Win" . ucfirst($k)} = "cp" . $v;
|
|
Packit |
d0f5c2 |
$a2c{"IBM-$v"} = $a2c{"MS-$v"} = "cp" . $v;
|
|
Packit |
d0f5c2 |
$a2c{"cp-" . $v} = "cp" . $v;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
my @a2c = keys %a2c;
|
|
Packit |
d0f5c2 |
for my $k (@a2c){
|
|
Packit |
d0f5c2 |
$a2c{uc($k)} = $a2c{$k};
|
|
Packit |
d0f5c2 |
$a2c{lc($k)} = $a2c{$k};
|
|
Packit |
d0f5c2 |
$a2c{lcfirst($k)} = $a2c{$k};
|
|
Packit |
d0f5c2 |
$a2c{ucfirst($k)} = $a2c{$k};
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
BEGIN{
|
|
Packit |
d0f5c2 |
$ON_EBCDIC = ord("A") == 193;
|
|
Packit |
d0f5c2 |
@ARGV and $ON_EBCDIC = $ARGV[0] eq 'EBCDIC';
|
|
Packit |
d0f5c2 |
$Encode::ON_EBCDIC = $ON_EBCDIC;
|
|
Packit |
d0f5c2 |
init_a2c();
|
|
Packit |
d0f5c2 |
@override_tests = qw(
|
|
Packit |
d0f5c2 |
myascii:cp1252
|
|
Packit |
d0f5c2 |
mygreek:cp1253
|
|
Packit |
d0f5c2 |
myhebrew:iso-8859-2
|
|
Packit |
d0f5c2 |
myarabic:cp1256
|
|
Packit |
d0f5c2 |
ueightsomething:utf-8-strict
|
|
Packit |
d0f5c2 |
unknown:
|
|
Packit |
d0f5c2 |
);
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
if ($ON_EBCDIC){
|
|
Packit |
d0f5c2 |
delete @Encode::ExtModule{
|
|
Packit |
d0f5c2 |
qw(euc-cn gb2312 gb12345 gbk cp936 iso-ir-165 MacChineseSimp
|
|
Packit |
d0f5c2 |
euc-jp iso-2022-jp 7bit-jis shiftjis MacJapanese cp932
|
|
Packit |
d0f5c2 |
euc-kr ksc5601 cp949 MacKorean
|
|
Packit |
d0f5c2 |
big5 big5-hkscs cp950 MacChineseTrad
|
|
Packit |
d0f5c2 |
gb18030 big5plus euc-tw)
|
|
Packit |
d0f5c2 |
};
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
use Test::More tests => (scalar keys %a2c) * 3 + @override_tests;
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
print "# alias test; \$ON_EBCDIC == $ON_EBCDIC\n";
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
foreach my $a (keys %a2c){
|
|
Packit |
d0f5c2 |
print "# $a => $a2c{$a}\n";
|
|
Packit |
d0f5c2 |
my $e = Encode::find_encoding($a);
|
|
Packit |
d0f5c2 |
is((defined($e) and $e->name), $a2c{$a},$a)
|
|
Packit |
d0f5c2 |
or warn "alias was $a";;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# now we override some of the aliases and see if it works fine
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
define_alias(
|
|
Packit |
d0f5c2 |
qr/ascii/i => '"WinLatin1"',
|
|
Packit |
d0f5c2 |
qr/cyrillic/i => '"WinCyrillic"',
|
|
Packit |
d0f5c2 |
qr/arabic/i => '"WinArabic"',
|
|
Packit |
d0f5c2 |
qr/greek/i => '"WinGreek"',
|
|
Packit |
d0f5c2 |
qr/hebrew/i => '"WinHebrew"'
|
|
Packit |
d0f5c2 |
);
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
Encode::find_encoding("myhebrew"); # polute alias cache
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
define_alias( sub {
|
|
Packit |
d0f5c2 |
my $enc = shift;
|
|
Packit |
d0f5c2 |
return "iso-8859-2" if $enc =~ /hebrew/i;
|
|
Packit |
d0f5c2 |
return "does-not-exist" if $enc =~ /arabic/i; # should then use other override alias
|
|
Packit |
d0f5c2 |
return "utf-8" if $enc =~ /eight/i;
|
|
Packit |
d0f5c2 |
return "unknown";
|
|
Packit |
d0f5c2 |
});
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
print "# alias test with alias overrides\n";
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
for my $test (@override_tests) {
|
|
Packit |
d0f5c2 |
my($a, $c) = split /:/, $test;
|
|
Packit |
d0f5c2 |
my $e = Encode::find_encoding($a);
|
|
Packit |
d0f5c2 |
is((defined($e) and $e->name), $c, $a);
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
print "# alias undef test\n";
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
Encode::Alias->undef_aliases;
|
|
Packit |
d0f5c2 |
foreach my $a (keys %a2c){
|
|
Packit |
d0f5c2 |
my $e = Encode::find_encoding($a);
|
|
Packit |
d0f5c2 |
ok(!defined($e) || $e->name =~ /-raw$/o,"Undef $a")
|
|
Packit |
d0f5c2 |
or warn "alias was $a";
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
print "# alias reinit test\n";
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
Encode::Alias->init_aliases;
|
|
Packit |
d0f5c2 |
init_a2c();
|
|
Packit |
d0f5c2 |
foreach my $a (keys %a2c){
|
|
Packit |
d0f5c2 |
my $e = Encode::find_encoding($a);
|
|
Packit |
d0f5c2 |
is((defined($e) and $e->name), $a2c{$a}, "Reinit $a")
|
|
Packit |
d0f5c2 |
or warn "alias was $a";
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
__END__
|
|
Packit |
d0f5c2 |
for my $k (keys %a2c){
|
|
Packit |
d0f5c2 |
$k =~ /[A-Z]/ and next;
|
|
Packit |
d0f5c2 |
print "$k => $a2c{$k}\n";
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
|