|
Packit |
d0f5c2 |
#
|
|
Packit |
d0f5c2 |
# $Id: jperl.t,v 2.5 2016/11/29 23:29:23 dankogai Exp $
|
|
Packit |
d0f5c2 |
#
|
|
Packit |
d0f5c2 |
# This script is written in euc-jp
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
BEGIN {
|
|
Packit |
d0f5c2 |
require Config; import Config;
|
|
Packit |
d0f5c2 |
if ($Config{'extensions'} !~ /\bEncode\b/) {
|
|
Packit |
d0f5c2 |
print "1..0 # Skip: Encode was not built\n";
|
|
Packit |
d0f5c2 |
exit 0;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
unless (find PerlIO::Layer 'perlio') {
|
|
Packit |
d0f5c2 |
print "1..0 # Skip: PerlIO was not built\n";
|
|
Packit |
d0f5c2 |
exit 0;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
if (ord("A") == 193) {
|
|
Packit |
d0f5c2 |
print "1..0 # Skip: EBCDIC\n";
|
|
Packit |
d0f5c2 |
exit 0;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
if ($] >= 5.025 and !$Config{usecperl}) {
|
|
Packit |
d0f5c2 |
print "1..0 # Skip: encoding pragma not supported in Perl 5.26\n";
|
|
Packit |
d0f5c2 |
exit(0);
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
$| = 1;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
no utf8; # we have raw Japanese encodings here
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
use strict;
|
|
Packit |
d0f5c2 |
#use Test::More tests => 18;
|
|
Packit |
d0f5c2 |
use Test::More tests => 15; # black magic tests commented out
|
|
Packit |
d0f5c2 |
my $Debug = shift;
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
no warnings "deprecated";
|
|
Packit |
d0f5c2 |
no encoding; # ensure
|
|
Packit |
d0f5c2 |
my $Enamae = "\xbe\xae\xbb\xf4\x20\xc3\xc6"; # euc-jp, with \x escapes
|
|
Packit |
d0f5c2 |
use encoding "euc-jp";
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
my $Namae = "¾®»ô ÃÆ"; # in Japanese, in euc-jp
|
|
Packit |
d0f5c2 |
my $Name = "Dan Kogai"; # in English
|
|
Packit |
d0f5c2 |
# euc-jp in \x format but after the pragma. But this one will be converted!
|
|
Packit |
d0f5c2 |
my $Ynamae = "\xbe\xae\xbb\xf4\x20\xc3\xc6";
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
my $str = $Namae; $str =~ s/¾®»ô ÃÆ/Dan Kogai/o;
|
|
Packit |
d0f5c2 |
is($str, $Name, q{regex});
|
|
Packit |
d0f5c2 |
$str = $Namae; $str =~ s/$Namae/Dan Kogai/o;
|
|
Packit |
d0f5c2 |
is($str, $Name, q{regex - with variable});
|
|
Packit |
d0f5c2 |
is(length($Namae), 4, q{utf8:length});
|
|
Packit |
d0f5c2 |
{
|
|
Packit |
d0f5c2 |
use bytes;
|
|
Packit |
d0f5c2 |
# converted to UTF-8 so 3*3+1
|
|
Packit |
d0f5c2 |
is(length($Namae), 10, q{bytes:length});
|
|
Packit |
d0f5c2 |
#
|
|
Packit |
d0f5c2 |
is(length($Enamae), 7, q{euc:length}); # 2*3+1
|
|
Packit |
d0f5c2 |
is ($Namae, $Ynamae, q{literal conversions});
|
|
Packit |
d0f5c2 |
isnt($Enamae, $Ynamae, q{before and after});
|
|
Packit |
d0f5c2 |
is($Enamae, Encode::encode('euc-jp', $Namae));
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
# let's test the scope as well. Must be in utf8 realm
|
|
Packit |
d0f5c2 |
is(length($Namae), 4, q{utf8:length});
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
{
|
|
Packit |
d0f5c2 |
no encoding;
|
|
Packit |
d0f5c2 |
ok(! defined(${^ENCODING}), q{no encoding;});
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
# should've been isnt() but no scoping is suported -- yet
|
|
Packit |
d0f5c2 |
ok(! defined(${^ENCODING}), q{not scoped yet});
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
#
|
|
Packit |
d0f5c2 |
# The following tests are commented out to accomodate
|
|
Packit |
d0f5c2 |
# Inaba-San's patch to make tr/// work w/o eval qq{}
|
|
Packit |
d0f5c2 |
#{
|
|
Packit |
d0f5c2 |
# # now let's try some real black magic!
|
|
Packit |
d0f5c2 |
# local(${^ENCODING}) = Encode::find_encoding("euc-jp");
|
|
Packit |
d0f5c2 |
# my $str = "\xbe\xae\xbb\xf4\x20\xc3\xc6";
|
|
Packit |
d0f5c2 |
# is (length($str), 4, q{black magic:length});
|
|
Packit |
d0f5c2 |
# is ($str, $Enamae, q{black magic:eq});
|
|
Packit |
d0f5c2 |
#}
|
|
Packit |
d0f5c2 |
#ok(! defined(${^ENCODING}), q{out of black magic});
|
|
Packit |
d0f5c2 |
use bytes;
|
|
Packit |
d0f5c2 |
is (length($Namae), 10);
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
#
|
|
Packit |
d0f5c2 |
# now something completely different!
|
|
Packit |
d0f5c2 |
#
|
|
Packit |
d0f5c2 |
{
|
|
Packit |
d0f5c2 |
use encoding "euc-jp", Filter=>1;
|
|
Packit |
d0f5c2 |
ok(1, "Filter on");
|
|
Packit |
d0f5c2 |
use utf8;
|
|
Packit |
d0f5c2 |
no strict 'vars'; # fools
|
|
Packit |
d0f5c2 |
# doesn't work w/ "my" as of this writing.
|
|
Packit |
d0f5c2 |
# because of buggy strict.pm and utf8.pm
|
|
Packit |
d0f5c2 |
our $¿Í = 2;
|
|
Packit |
d0f5c2 |
# ^^U+4eba, "human" in CJK ideograph
|
|
Packit |
d0f5c2 |
$¿Í++; # a child is born
|
|
Packit |
d0f5c2 |
*people = \$¿Í;
|
|
Packit |
d0f5c2 |
is ($people, 3, "Filter:utf8 identifier");
|
|
Packit |
d0f5c2 |
no encoding;
|
|
Packit |
d0f5c2 |
ok(1, "Filter off");
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
1;
|
|
Packit |
d0f5c2 |
__END__
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
|