Blame t/Aliases.t

Packit d0f5c2
#!../perl
Packit d0f5c2
Packit d0f5c2
BEGIN {
Packit d0f5c2
    if ($ENV{'PERL_CORE'}){
Packit d0f5c2
    chdir 't';
Packit d0f5c2
    unshift @INC, '../lib';
Packit d0f5c2
    }
Packit d0f5c2
    require Config; import Config;
Packit d0f5c2
    if ($Config{'extensions'} !~ /\bEncode\b/) {
Packit d0f5c2
    print "1..0 # Skip: Encode was not built\n";
Packit d0f5c2
        exit 0;
Packit d0f5c2
    }
Packit d0f5c2
}
Packit d0f5c2
Packit d0f5c2
use strict;
Packit d0f5c2
use Encode;
Packit d0f5c2
use Encode::Alias;
Packit d0f5c2
my %a2c;
Packit d0f5c2
my @override_tests;
Packit d0f5c2
my $ON_EBCDIC;
Packit d0f5c2
Packit d0f5c2
sub init_a2c{
Packit d0f5c2
    %a2c = (
Packit d0f5c2
        'US-ascii' => 'ascii',
Packit d0f5c2
        'ISO-646-US' => 'ascii',
Packit d0f5c2
        'UTF-8'    => 'utf-8-strict',
Packit d0f5c2
        'en_US.UTF-8'    => 'utf-8-strict',
Packit d0f5c2
        'UCS-2'    => 'UCS-2BE',
Packit d0f5c2
        'UCS2'     => 'UCS-2BE',
Packit d0f5c2
        'iso-10646-1' => 'UCS-2BE',
Packit d0f5c2
        'ucs2-le'  => 'UCS-2LE',
Packit d0f5c2
        'ucs2-be'  => 'UCS-2BE',
Packit d0f5c2
        'utf16'    => 'UTF-16',
Packit d0f5c2
        'utf32'    => 'UTF-32',
Packit d0f5c2
        'utf16-be'  => 'UTF-16BE',
Packit d0f5c2
        'utf32-be'  => 'UTF-32BE',
Packit d0f5c2
        'utf16-le'  => 'UTF-16LE',
Packit d0f5c2
        'utf32-le'  => 'UTF-32LE',
Packit d0f5c2
        'UCS4-BE'   => 'UTF-32BE',
Packit d0f5c2
        'UCS-4-LE'  => 'UTF-32LE',
Packit d0f5c2
        'cyrillic' => 'iso-8859-5',
Packit d0f5c2
        'arabic'   => 'iso-8859-6',
Packit d0f5c2
        'greek'    => 'iso-8859-7',
Packit d0f5c2
        'hebrew'   => 'iso-8859-8',
Packit d0f5c2
        'thai'     => 'iso-8859-11',
Packit d0f5c2
        'tis620'   => 'iso-8859-11',
Packit d0f5c2
        'tis-620'   => 'iso-8859-11',
Packit d0f5c2
        'WinLatin1'     => 'cp1252',
Packit d0f5c2
        'WinLatin2'     => 'cp1250',
Packit d0f5c2
        'WinCyrillic'   => 'cp1251',
Packit d0f5c2
        'WinGreek'      => 'cp1253',
Packit d0f5c2
        'WinTurkish'    => 'cp1254',
Packit d0f5c2
        'WinHebrew'     => 'cp1255',
Packit d0f5c2
        'WinArabic'     => 'cp1256',
Packit d0f5c2
        'WinBaltic'     => 'cp1257',
Packit d0f5c2
        'WinVietnamese' => 'cp1258',
Packit d0f5c2
	'Macintosh'     => 'MacRoman',
Packit d0f5c2
        'koi8r'         => 'koi8-r',
Packit d0f5c2
        'koi8u'         => 'koi8-u',
Packit d0f5c2
        'ja_JP.euc'	    => $ON_EBCDIC ? '' : 'euc-jp',
Packit d0f5c2
        'x-euc-jp'	    => $ON_EBCDIC ? '' : 'euc-jp',
Packit d0f5c2
        'zh_CN.euc'	    => $ON_EBCDIC ? '' : 'euc-cn',
Packit d0f5c2
        'x-euc-cn'	    => $ON_EBCDIC ? '' : 'euc-cn',
Packit d0f5c2
        'ko_KR.euc'	    => $ON_EBCDIC ? '' : 'euc-kr',
Packit d0f5c2
        'x-euc-kr'	    => $ON_EBCDIC ? '' : 'euc-kr',
Packit d0f5c2
        'ujis'	    => $ON_EBCDIC ? '' : 'euc-jp',
Packit d0f5c2
        'Shift_JIS'	    => $ON_EBCDIC ? '' : 'shiftjis',
Packit d0f5c2
        'x-sjis'	    => $ON_EBCDIC ? '' : 'shiftjis',
Packit d0f5c2
        'jis'	    => $ON_EBCDIC ? '' : '7bit-jis',
Packit d0f5c2
        'big-5'	    => $ON_EBCDIC ? '' : 'big5-eten',
Packit d0f5c2
        'zh_TW.Big5'    => $ON_EBCDIC ? '' : 'big5-eten',
Packit d0f5c2
        'tca-big5'	    => $ON_EBCDIC ? '' : 'big5-eten',
Packit d0f5c2
        'big5-hk'	    => $ON_EBCDIC ? '' : 'big5-hkscs',
Packit d0f5c2
        'hkscs-big5'    => $ON_EBCDIC ? '' : 'big5-hkscs',
Packit d0f5c2
        'GB_2312-80'    => $ON_EBCDIC ? '' : 'euc-cn',
Packit d0f5c2
        'KS_C_5601-1987'    => $ON_EBCDIC ? '' : 'cp949',
Packit d0f5c2
        #
Packit d0f5c2
        'gb12345-raw'   => $ON_EBCDIC ? '' : 'gb12345-raw',
Packit d0f5c2
        'gb2312-raw'    => $ON_EBCDIC ? '' : 'gb2312-raw',
Packit d0f5c2
        'jis0201-raw'   => $ON_EBCDIC ? '' : 'jis0201-raw',
Packit d0f5c2
        'jis0208-raw'   => $ON_EBCDIC ? '' : 'jis0208-raw',
Packit d0f5c2
        'jis0212-raw'   => $ON_EBCDIC ? '' : 'jis0212-raw',
Packit d0f5c2
        'ksc5601-raw'   => $ON_EBCDIC ? '' : 'ksc5601-raw',
Packit d0f5c2
        'cp65000' => 'UTF-7',
Packit d0f5c2
        'cp65001' => 'utf-8-strict',
Packit d0f5c2
       );
Packit d0f5c2
Packit d0f5c2
    for my $i (1..11,13..16){
Packit d0f5c2
    $a2c{"ISO 8859 $i"} = "iso-8859-$i";
Packit d0f5c2
    }
Packit d0f5c2
    for my $i (1..10){
Packit d0f5c2
    $a2c{"ISO Latin $i"} = "iso-8859-$Encode::Alias::Latin2iso[$i]";
Packit d0f5c2
    }
Packit d0f5c2
    for my $k (keys %Encode::Alias::Winlatin2cp){
Packit d0f5c2
    my $v = $Encode::Alias::Winlatin2cp{$k};
Packit d0f5c2
    $a2c{"Win" . ucfirst($k)} = "cp" . $v;
Packit d0f5c2
    $a2c{"IBM-$v"} = $a2c{"MS-$v"} = "cp" . $v;
Packit d0f5c2
    $a2c{"cp-" . $v} = "cp" . $v;
Packit d0f5c2
    }
Packit d0f5c2
    my @a2c = keys %a2c;
Packit d0f5c2
    for my $k (@a2c){
Packit d0f5c2
    $a2c{uc($k)} = $a2c{$k};
Packit d0f5c2
    $a2c{lc($k)} = $a2c{$k};
Packit d0f5c2
    $a2c{lcfirst($k)} = $a2c{$k};
Packit d0f5c2
    $a2c{ucfirst($k)} = $a2c{$k};
Packit d0f5c2
    }
Packit d0f5c2
}
Packit d0f5c2
Packit d0f5c2
BEGIN{
Packit d0f5c2
    $ON_EBCDIC = ord("A") == 193;
Packit d0f5c2
    @ARGV and $ON_EBCDIC = $ARGV[0] eq 'EBCDIC';
Packit d0f5c2
    $Encode::ON_EBCDIC = $ON_EBCDIC;
Packit d0f5c2
    init_a2c();
Packit d0f5c2
    @override_tests = qw(
Packit d0f5c2
        myascii:cp1252
Packit d0f5c2
        mygreek:cp1253
Packit d0f5c2
        myhebrew:iso-8859-2
Packit d0f5c2
        myarabic:cp1256
Packit d0f5c2
        ueightsomething:utf-8-strict
Packit d0f5c2
        unknown:
Packit d0f5c2
    );
Packit d0f5c2
}
Packit d0f5c2
Packit d0f5c2
if ($ON_EBCDIC){
Packit d0f5c2
    delete @Encode::ExtModule{
Packit d0f5c2
    qw(euc-cn gb2312 gb12345 gbk cp936 iso-ir-165 MacChineseSimp
Packit d0f5c2
       euc-jp iso-2022-jp 7bit-jis shiftjis MacJapanese cp932
Packit d0f5c2
       euc-kr ksc5601 cp949 MacKorean
Packit d0f5c2
       big5	big5-hkscs cp950 MacChineseTrad
Packit d0f5c2
       gb18030 big5plus euc-tw)
Packit d0f5c2
    };
Packit d0f5c2
}
Packit d0f5c2
Packit d0f5c2
use Test::More tests => (scalar keys %a2c) * 3 + @override_tests;
Packit d0f5c2
Packit d0f5c2
print "# alias test;  \$ON_EBCDIC == $ON_EBCDIC\n";
Packit d0f5c2
Packit d0f5c2
foreach my $a (keys %a2c){	
Packit d0f5c2
    print "# $a => $a2c{$a}\n";
Packit d0f5c2
    my $e = Encode::find_encoding($a);
Packit d0f5c2
    is((defined($e) and $e->name), $a2c{$a},$a)
Packit d0f5c2
    or warn "alias was $a";;
Packit d0f5c2
}
Packit d0f5c2
Packit d0f5c2
# now we override some of the aliases and see if it works fine
Packit d0f5c2
Packit d0f5c2
define_alias(
Packit d0f5c2
         qr/ascii/i    => '"WinLatin1"',
Packit d0f5c2
         qr/cyrillic/i => '"WinCyrillic"',
Packit d0f5c2
         qr/arabic/i   => '"WinArabic"',
Packit d0f5c2
         qr/greek/i    => '"WinGreek"',
Packit d0f5c2
         qr/hebrew/i   => '"WinHebrew"'
Packit d0f5c2
        );
Packit d0f5c2
Packit d0f5c2
Encode::find_encoding("myhebrew");  # polute alias cache
Packit d0f5c2
Packit d0f5c2
define_alias( sub {
Packit d0f5c2
    my $enc = shift;
Packit d0f5c2
    return "iso-8859-2"     if $enc =~ /hebrew/i;
Packit d0f5c2
    return "does-not-exist" if $enc =~ /arabic/i;  # should then use other override alias
Packit d0f5c2
    return "utf-8"          if $enc =~ /eight/i;
Packit d0f5c2
    return "unknown";
Packit d0f5c2
});
Packit d0f5c2
Packit d0f5c2
print "# alias test with alias overrides\n";
Packit d0f5c2
Packit d0f5c2
for my $test (@override_tests) {
Packit d0f5c2
    my($a, $c) = split /:/, $test;
Packit d0f5c2
    my $e = Encode::find_encoding($a);
Packit d0f5c2
    is((defined($e) and $e->name), $c, $a);
Packit d0f5c2
}
Packit d0f5c2
Packit d0f5c2
print "# alias undef test\n";
Packit d0f5c2
Packit d0f5c2
Encode::Alias->undef_aliases;
Packit d0f5c2
foreach my $a (keys %a2c){	
Packit d0f5c2
    my $e = Encode::find_encoding($a);
Packit d0f5c2
    ok(!defined($e) || $e->name =~ /-raw$/o,"Undef $a")
Packit d0f5c2
    or warn "alias was $a";
Packit d0f5c2
}
Packit d0f5c2
Packit d0f5c2
print "# alias reinit test\n";
Packit d0f5c2
Packit d0f5c2
Encode::Alias->init_aliases;
Packit d0f5c2
init_a2c();
Packit d0f5c2
foreach my $a (keys %a2c){	
Packit d0f5c2
    my $e = Encode::find_encoding($a);
Packit d0f5c2
    is((defined($e) and $e->name), $a2c{$a}, "Reinit $a")
Packit d0f5c2
    or warn "alias was $a";
Packit d0f5c2
}
Packit d0f5c2
__END__
Packit d0f5c2
for my $k (keys %a2c){
Packit d0f5c2
    $k =~ /[A-Z]/ and next;
Packit d0f5c2
    print "$k => $a2c{$k}\n";
Packit d0f5c2
}
Packit d0f5c2
Packit d0f5c2
Packit d0f5c2