|
Packit |
d0f5c2 |
BEGIN {
|
|
Packit |
d0f5c2 |
if ($ENV{'PERL_CORE'}){
|
|
Packit |
d0f5c2 |
chdir 't';
|
|
Packit |
d0f5c2 |
unshift @INC, '../lib';
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
require Config; import Config;
|
|
Packit |
d0f5c2 |
if ($Config{'extensions'} !~ /\bEncode\b/) {
|
|
Packit |
d0f5c2 |
print "1..0 # Skip: Encode was not built\n";
|
|
Packit |
d0f5c2 |
exit 0;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
$| = 1;
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
use strict;
|
|
Packit |
d0f5c2 |
use utf8;
|
|
Packit |
d0f5c2 |
use Test::More tests => 780;
|
|
Packit |
d0f5c2 |
use Encode;
|
|
Packit |
d0f5c2 |
use Encode::GSM0338;
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# The specification of GSM 03.38 is not awfully clear.
|
|
Packit |
d0f5c2 |
# (http://www.unicode.org/Public/MAPPINGS/ETSI/GSM0338.TXT)
|
|
Packit |
d0f5c2 |
# The various combinations of 0x00 and 0x1B as leading bytes
|
|
Packit |
d0f5c2 |
# are unclear, as is the semantics of those bytes as standalone
|
|
Packit |
d0f5c2 |
# or as final single bytes.
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
my $chk = Encode::LEAVE_SRC();
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# escapes
|
|
Packit |
d0f5c2 |
# see http://www.csoft.co.uk/sms/character_sets/gsm.htm
|
|
Packit |
d0f5c2 |
my %esc_seq = (
|
|
Packit |
d0f5c2 |
"\x{20ac}" => "\x1b\x65",
|
|
Packit |
d0f5c2 |
"\x0c" => "\x1b\x0A",
|
|
Packit |
d0f5c2 |
"[" => "\x1b\x3C",
|
|
Packit |
d0f5c2 |
"\\" => "\x1b\x2F",
|
|
Packit |
d0f5c2 |
"]" => "\x1b\x3E",
|
|
Packit |
d0f5c2 |
"^" => "\x1b\x14",
|
|
Packit |
d0f5c2 |
"{" => "\x1b\x28",
|
|
Packit |
d0f5c2 |
"|" => "\x1b\x40",
|
|
Packit |
d0f5c2 |
"}" => "\x1b\x29",
|
|
Packit |
d0f5c2 |
"~" => "\x1b\x3D",
|
|
Packit |
d0f5c2 |
);
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
my %unesc_seq = reverse %esc_seq;
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
sub eu{
|
|
Packit |
d0f5c2 |
$_[0] =~ /[\x00-\x1f]/ ?
|
|
Packit |
d0f5c2 |
sprintf("\\x{%04X}", ord($_[0])) : encode_utf8($_[0]);
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
for my $c ( map { chr } 0 .. 127 ) {
|
|
Packit |
d0f5c2 |
my $u = $Encode::GSM0338::GSM2UNI{$c};
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# default character set
|
|
Packit |
d0f5c2 |
is decode( "gsm0338", $c, $chk ), $u,
|
|
Packit |
d0f5c2 |
sprintf( "decode \\x%02X", ord($c) );
|
|
Packit |
d0f5c2 |
eval { decode( "gsm0338", $c . "\xff", $chk ) };
|
|
Packit |
d0f5c2 |
ok( $@, $@ );
|
|
Packit |
d0f5c2 |
is encode( "gsm0338", $u, $chk ), $c, sprintf( "encode %s", eu($u) );
|
|
Packit |
d0f5c2 |
eval { encode( "gsm0338", $u . "\x{3000}", $chk ) };
|
|
Packit |
d0f5c2 |
ok( $@, $@ );
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# nasty atmark
|
|
Packit |
d0f5c2 |
if ( $c eq "\x00" ) {
|
|
Packit |
d0f5c2 |
is decode( "gsm0338", "\x00" . $c, $chk ), "\x00",
|
|
Packit |
d0f5c2 |
sprintf( '@@ =>: \x00+\x%02X', ord($c) );
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
else {
|
|
Packit |
d0f5c2 |
is decode( "gsm0338", "\x00" . $c ), '@' . decode( "gsm0338", $c ),
|
|
Packit |
d0f5c2 |
sprintf( '@: decode \x00+\x%02X', ord($c) );
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# escape seq.
|
|
Packit |
d0f5c2 |
my $ecs = "\x1b" . $c;
|
|
Packit |
d0f5c2 |
if ( $unesc_seq{$ecs} ) {
|
|
Packit |
d0f5c2 |
is decode( "gsm0338", $ecs, $chk ), $unesc_seq{$ecs},
|
|
Packit |
d0f5c2 |
sprintf( "ESC: decode ESC+\\x%02X", ord($c) );
|
|
Packit |
d0f5c2 |
is encode( "gsm0338", $unesc_seq{$ecs}, $chk ), $ecs,
|
|
Packit |
d0f5c2 |
sprintf( "ESC: encode %s ", eu( $unesc_seq{$ecs} ) );
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
else {
|
|
Packit |
d0f5c2 |
is decode( "gsm0338", $ecs, $chk ),
|
|
Packit |
d0f5c2 |
"\xA0" . decode( "gsm0338", $c ),
|
|
Packit |
d0f5c2 |
sprintf( "decode ESC+\\x%02X", ord($c) );
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# https://rt.cpan.org/Ticket/Display.html?id=75670
|
|
Packit |
d0f5c2 |
is decode("gsm0338", "\x09") => chr(0xC7), 'RT75670: decode';
|
|
Packit |
d0f5c2 |
is encode("gsm0338", chr(0xC7)) => "\x09", 'RT75670: encode';
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
__END__
|
|
Packit |
d0f5c2 |
for my $c (map { chr } 0..127){
|
|
Packit |
d0f5c2 |
my $b = "\x1b$c";
|
|
Packit |
d0f5c2 |
my $u = $Encode::GSM0338::GSM2UNI{$b};
|
|
Packit |
d0f5c2 |
next unless $u;
|
|
Packit |
d0f5c2 |
$u ||= "\xA0" . $Encode::GSM0338::GSM2UNI{$c};
|
|
Packit |
d0f5c2 |
is decode("gsm0338", $b), $u, sprintf("decode ESC+\\x%02X", ord($c) );
|
|
Packit |
d0f5c2 |
}
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
__END__
|
|
Packit |
d0f5c2 |
# old test follows
|
|
Packit |
d0f5c2 |
ub t { is(decode("gsm0338", my $t = $_[0]), $_[1]) }
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# t("\x00", "\x00"); # ???
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# "Round-trip".
|
|
Packit |
d0f5c2 |
t("\x41", "\x41");
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
t("\x01", "\xA3");
|
|
Packit |
d0f5c2 |
t("\x02", "\x24");
|
|
Packit |
d0f5c2 |
t("\x03", "\xA5");
|
|
Packit |
d0f5c2 |
t("\x09", "\xE7");
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
t("\x00\x00", "\x00\x00"); # Maybe?
|
|
Packit |
d0f5c2 |
t("\x00\x1B", "\x40\xA0"); # Maybe?
|
|
Packit |
d0f5c2 |
t("\x00\x41", "\x40\x41");
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# t("\x1B", "\x1B"); # ???
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# Escape with no special second byte is just a NBSP.
|
|
Packit |
d0f5c2 |
t("\x1B\x41", "\xA0\x41");
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
t("\x1B\x00", "\xA0\x40"); # Maybe?
|
|
Packit |
d0f5c2 |
|
|
Packit |
d0f5c2 |
# Special escape characters.
|
|
Packit |
d0f5c2 |
t("\x1B\x0A", "\x0C");
|
|
Packit |
d0f5c2 |
t("\x1B\x14", "\x5E");
|
|
Packit |
d0f5c2 |
t("\x1B\x28", "\x7B");
|
|
Packit |
d0f5c2 |
t("\x1B\x29", "\x7D");
|
|
Packit |
d0f5c2 |
t("\x1B\x2F", "\x5C");
|
|
Packit |
d0f5c2 |
t("\x1B\x3C", "\x5B");
|
|
Packit |
d0f5c2 |
t("\x1B\x3D", "\x7E");
|
|
Packit |
d0f5c2 |
t("\x1B\x3E", "\x5D");
|
|
Packit |
d0f5c2 |
t("\x1B\x40", "\x7C");
|
|
Packit |
d0f5c2 |
t("\x1B\x40", "\x7C");
|
|
Packit |
d0f5c2 |
t("\x1B\x65", "\x{20AC}");
|