593 lines
16 KiB
Perl
Raw Normal View History

2010-09-01 11:22:43 +09:00
package Data::MessagePack::PP;
2010-09-17 13:37:17 +09:00
use 5.008001;
2010-09-01 11:22:43 +09:00
use strict;
use Carp ();
# See also
# http://redmine.msgpack.org/projects/msgpack/wiki/FormatSpec
# http://cpansearch.perl.org/src/YAPPO/Data-Model-0.00006/lib/Data/Model/Driver/Memcached.pm
# http://frox25.no-ip.org/~mtve/wiki/MessagePack.html : reference to using CORE::pack, CORE::unpack
package
Data::MessagePack;
use strict;
use B ();
2010-09-01 11:22:43 +09:00
# Decodes the big-endian signed 64-bit integer stored at byte offset $_[1]
# of the buffer $_[0] and returns it as a decimal string.  Used instead of
# the native 'q' template on perls built without 64-bit integers; the
# arithmetic is done with Math::BigInt, which is loaded on first use.
sub _unpack_int64_slow {
    require Math::BigInt;
    my ( $high, $low ) = CORE::unpack( 'N2', substr( $_[0], $_[1], 8 ) );

    if ( $high < 0x80000000 ) { # sign bit clear: non-negative
        return Math::BigInt->new($high)->blsft(32)->bior($low)->bstr;
    }

    # Negative: the magnitude is the complement of the whole 64-bit word
    # plus one.  The +1 must be applied after the two halves are combined
    # so that a carry out of the low word reaches the high word.  Masking
    # keeps the complement to 32 bits on perls with wider integers.
    my $magnitude = Math::BigInt->new( ~$high & 0xFFFFFFFF )->blsft(32);
    $magnitude->bior( ~$low & 0xFFFFFFFF );
    $magnitude->binc;
    return $magnitude->bneg->bstr;
}

# Decodes the big-endian unsigned 64-bit integer stored at byte offset $_[1]
# of the buffer $_[0] and returns it as a decimal string (Math::BigInt
# counterpart of the native 'Q' template).
sub _unpack_uint64_slow {
    require Math::BigInt;
    my ( $high, $low ) = CORE::unpack( 'N2', substr( $_[0], $_[1], 8 ) );
    return Math::BigInt->new($high)->blsft(32)->bior($low)->bstr;
}

# Installs the low-level codec helpers into the current package at compile
# time, choosing an implementation that suits the running perl:
#   pack_uint64 / pack_int64 / pack_double   value          -> tag byte + 8 bytes
#   unpack_{uint,int}{16,32,64}              buffer, offset -> number
#   unpack_float / unpack_double             buffer, offset -> number
# All multi-byte values are big-endian on the wire.
BEGIN {
    # Perls built without 64-bit integers reject the 'Q' template; they get
    # the Math::BigInt decoders instead of the native ones installed below.
    my $has_quad           = eval { CORE::pack( 'Q', 1 ) };
    my $unpack_int64_slow  = $has_quad ? undef : \&_unpack_int64_slow;
    my $unpack_uint64_slow = $has_quad ? undef : \&_unpack_uint64_slow;

    *unpack_uint16 = sub { return CORE::unpack 'n', substr( $_[0], $_[1], 2 ) };
    *unpack_uint32 = sub { return CORE::unpack 'N', substr( $_[0], $_[1], 4 ) };

    # for pack and unpack compatibility
    if ( $] < 5.010 ) {
        # No '>' modifier and no 'n!' / 'N!' here, so byte order and sign
        # are handled by hand.  The probe unpacks the little-endian image
        # of 1.0 as a native double.
        my $bo_is_le = CORE::unpack( 'd', "\x00\x00\x00\x00\x00\x00\xf0\x3f" ) == 1;

        *unpack_int16 = sub {
            my $v = CORE::unpack 'n', substr( $_[0], $_[1], 2 );
            return 0 unless $v;
            # only values with the sign bit set are negative
            return $v >= 0x8000 ? $v - 0x10000 : $v;
        };
        *unpack_int32 = sub {
            my $v = CORE::unpack 'N', substr( $_[0], $_[1], 4 );
            return 0 unless $v;
            # 2**32 is written in decimal to avoid the "non-portable
            # hexadecimal number" warning on 32-bit perls
            return $v >= 0x80000000 ? $v - 4294967296 : $v;
        };

        if ( $bo_is_le ) {
            # Native layout is little-endian: split into two 32-bit words
            # and emit / read them swapped as big-endian words.
            *pack_uint64 = sub {
                my @v = CORE::unpack( 'V2', CORE::pack( 'Q', $_[0] ) );
                return CORE::pack 'CN2', 0xcf, @v[1,0];
            };
            *pack_int64 = sub {
                my @v = CORE::unpack( 'V2', CORE::pack( 'q', $_[0] ) );
                return CORE::pack 'CN2', 0xd3, @v[1,0];
            };
            *pack_double = sub {
                my @v = CORE::unpack( 'V2', CORE::pack( 'd', $_[0] ) );
                return CORE::pack 'CN2', 0xcb, @v[1,0];
            };
            *unpack_float = sub {
                my @v = CORE::unpack( 'v2', substr( $_[0], $_[1], 4 ) );
                return CORE::unpack( 'f', CORE::pack( 'n2', @v[1,0] ) );
            };
            *unpack_double = sub {
                my @v = CORE::unpack( 'V2', substr( $_[0], $_[1], 8 ) );
                return CORE::unpack( 'd', CORE::pack( 'N2', @v[1,0] ) );
            };
            *unpack_int64 = $unpack_int64_slow || sub {
                my @v = CORE::unpack( 'V*', substr( $_[0], $_[1], 8 ) );
                return CORE::unpack( 'q', CORE::pack( 'N2', @v[1,0] ) );
            };
            *unpack_uint64 = $unpack_uint64_slow || sub {
                my @v = CORE::unpack( 'V*', substr( $_[0], $_[1], 8 ) );
                return CORE::unpack( 'Q', CORE::pack( 'N2', @v[1,0] ) );
            };
        }
        else { # big endian: the native layout already matches the wire
            *pack_uint64   = sub { return CORE::pack 'CQ', 0xcf, $_[0]; };
            *pack_int64    = sub { return CORE::pack 'Cq', 0xd3, $_[0]; };
            *pack_double   = sub { return CORE::pack 'Cd', 0xcb, $_[0]; };
            *unpack_float  = sub { return CORE::unpack( 'f', substr( $_[0], $_[1], 4 ) ); };
            *unpack_double = sub { return CORE::unpack( 'd', substr( $_[0], $_[1], 8 ) ); };
            *unpack_int64  = $unpack_int64_slow  || sub { CORE::unpack 'q', substr( $_[0], $_[1], 8 ); };
            *unpack_uint64 = $unpack_uint64_slow || sub { CORE::unpack 'Q', substr( $_[0], $_[1], 8 ); };
        }
    }
    else {
        # 5.10 and later: '>' forces big-endian, 'n!' / 'N!' are signed.
        *pack_uint64   = sub { return CORE::pack 'CQ>', 0xcf, $_[0]; };
        *pack_int64    = sub { return CORE::pack 'Cq>', 0xd3, $_[0]; };
        *pack_double   = sub { return CORE::pack 'Cd>', 0xcb, $_[0]; };

        *unpack_float  = sub { return CORE::unpack( 'f>', substr( $_[0], $_[1], 4 ) ); };
        *unpack_double = sub { return CORE::unpack( 'd>', substr( $_[0], $_[1], 8 ) ); };
        *unpack_int16  = sub { return CORE::unpack( 'n!', substr( $_[0], $_[1], 2 ) ); };
        *unpack_int32  = sub { return CORE::unpack( 'N!', substr( $_[0], $_[1], 4 ) ); };
        *unpack_int64  = $unpack_int64_slow  || sub { return CORE::unpack( 'q>', substr( $_[0], $_[1], 8 ) ); };
        *unpack_uint64 = $unpack_uint64_slow || sub { return CORE::unpack( 'Q>', substr( $_[0], $_[1], 8 ) ); };
    }
}
2010-09-18 14:38:35 +09:00
# Aborts with a full stack trace.  The first argument is a sprintf format
# and the remaining arguments are its values; the formatted text is wrapped
# as "Unexpected ... found".
sub _unexpected {
    my ( $format, @args ) = @_;
    my $what = sprintf( $format, @args );
    Carp::confess("Unexpected " . $what . " found");
}
2010-09-01 11:22:43 +09:00
#
# PACK
#
{
    no warnings 'recursion';

    # Remaining nesting budget of the pack() call in progress.  _pack()
    # localises it on every call, so it is restored as the recursion unwinds.
    our $_max_depth;

    # Data::MessagePack->pack($dat [, $max_depth])
    # Serialises $dat and returns the MessagePack byte string.  $max_depth
    # (default 512) bounds the number of nested _pack() calls; croaks when
    # called with fewer than two arguments or when the bound is exceeded.
    sub pack :method {
        Carp::croak('Usage: Data::MessagePack->pack($dat [,$max_depth])') if @_ < 2;
        $_max_depth = defined $_[2] ? $_[2] : 512; # init
        return _pack( $_[1] );
    }

    # Builds the header of an array, map or raw value holding $num entries
    # (bytes for raw): the one-byte "fix" form when $num is below
    # $fix_limit, else the 16-bit form ($tag16), else the 32-bit form
    # ($tag32).  The 16- and 32-bit forms cover their full range, up to
    # 2**16 - 1 and 2**32 - 1 inclusive.
    sub _pack_length_header {
        my ( $num, $fix_base, $fix_limit, $tag16, $tag32 ) = @_;
        return
              $num < $fix_limit ? CORE::pack( 'C',  $fix_base + $num )
            : $num < 2 ** 16    ? CORE::pack( 'Cn', $tag16, $num )
            : $num < 2 ** 32    ? CORE::pack( 'CN', $tag32, $num )
            :                     _unexpected( "number %d", $num );
    }

    # Serialises one value, recursing into array and hash references.
    # Returns the encoded bytes; croaks when the nesting budget is used up
    # and confesses (via _unexpected) on values it cannot encode.
    sub _pack {
        my ( $value ) = @_;

        local $_max_depth = $_max_depth - 1;
        if ( $_max_depth < 0 ) {
            Carp::croak("perl structure exceeds maximum nesting level (max_depth set too low?)");
        }

        return CORE::pack( 'C', 0xc0 ) if ( not defined $value ); # nil

        if ( ref($value) eq 'ARRAY' ) {
            my $header = _pack_length_header( scalar @$value, 0x90, 16, 0xdc, 0xdd );
            return join( '', $header, map { _pack( $_ ) } @$value );
        }
        elsif ( ref($value) eq 'HASH' ) {
            my $header = _pack_length_header( scalar keys %$value, 0x80, 16, 0xde, 0xdf );
            # a hash in list context flattens to key, value, key, value, ...
            return join( '', $header, map { _pack( $_ ) } %$value );
        }
        elsif ( ref( $value ) eq 'Data::MessagePack::Boolean' ) {
            return CORE::pack( 'C', ${$value} ? 0xc3 : 0xc2 );
        }

        # Plain scalar: the SV flags say whether it currently holds an
        # integer, a string or a floating point number.
        my $b_obj = B::svref_2object( \$value );
        my $flags = $b_obj->FLAGS;

        if ( $flags & ( B::SVf_IOK | B::SVp_IOK ) ) {
            if ( $value >= 0 ) {
                return $value <= 127    ? CORE::pack( 'C',  $value )
                     : $value < 2 ** 8  ? CORE::pack( 'CC', 0xcc, $value )
                     : $value < 2 ** 16 ? CORE::pack( 'Cn', 0xcd, $value )
                     : $value < 2 ** 32 ? CORE::pack( 'CN', 0xce, $value )
                     :                    pack_uint64( $value );
            }
            else {
                return -$value <= 32      ? CORE::pack( 'C',  ( $value & 255 ) )
                     : -$value <= 2 ** 7  ? CORE::pack( 'Cc', 0xd0, $value )
                     : -$value <= 2 ** 15 ? CORE::pack( 'Cn', 0xd1, $value )
                     : -$value <= 2 ** 31 ? CORE::pack( 'CN', 0xd2, $value )
                     :                      pack_int64( $value );
            }
        }
        elsif ( $flags & B::SVf_POK ) { # raw / must be checked before double
            if ( $Data::MessagePack::PreferInteger ) {
                if ( $value =~ /^-?[0-9]+$/ ) { # ok?
                    my $value2 = 0 + $value;
                    if ( $value > 0xFFFFFFFF or $value < '-'.0x80000000 or # <- needless but for XS compat
                         0 + $value != B::svref_2object( \$value2 )->int_value
                    ) {
                        # does not fit: pack it as a string after all
                        local $Data::MessagePack::PreferInteger; # avoid for PV => NV
                        return _pack( "$value" );
                    }
                    return _pack( $value + 0 );
                }
            }

            utf8::encode( $value ) if utf8::is_utf8( $value );
            return _pack_length_header( length $value, 0xa0, 32, 0xda, 0xdb ) . $value;
        }
        elsif ( $flags & ( B::SVf_NOK | B::SVp_NOK ) ) { # double only
            return pack_double( $value );
        }
        else {
            _unexpected("data type %s", $b_obj);
        }
    }
} # PACK
#
# UNPACK
#
{
    my $p; # read cursor: offset of the next unread byte of the buffer

    # Data::MessagePack->unpack($bytes)
    # Decodes the first MessagePack value found in $bytes and returns it.
    # Dies with "invalid data" when the input ends before the value does.
    sub unpack :method {
        # One private copy, so that the decoder below can pass the buffer
        # around by alias even when the caller handed in a magical scalar.
        my $buffer = $_[1];
        $p = 0; # init
        return _unpack( $buffer );
    }

    # _check_remaining($buffer, $count)
    # Dies unless at least $count bytes are left at the cursor.
    sub _check_remaining {
        die "invalid data" if $p + $_[1] > length( $_[0] );
        return;
    }

    # _unpack_length($buffer, $byte, $tag16, $tag32, $fix_mask)
    # Returns the entry count (byte count for raw) announced by the header
    # $byte: a big-endian 16- or 32-bit number following the header when
    # $byte is $tag16 / $tag32, otherwise the bits of $byte selected by
    # $fix_mask.  Advances the cursor past any length field.
    sub _unpack_length {
        my ( undef, $byte, $tag16, $tag32, $fix_mask ) = @_;
        if ( $byte == $tag16 ) {
            _check_remaining( $_[0], 2 );
            $p += 2;
            return CORE::unpack( 'n', substr( $_[0], $p - 2, 2 ) );
        }
        if ( $byte == $tag32 ) {
            _check_remaining( $_[0], 4 );
            $p += 4;
            return CORE::unpack( 'N', substr( $_[0], $p - 4, 4 ) );
        }
        return $byte & $fix_mask;
    }

    # _unpack($buffer)
    # Decodes the value starting at the cursor, recursing for arrays and
    # maps, and leaves the cursor just behind it.  The buffer is only ever
    # accessed through $_[0]: copying it into a lexical on every recursive
    # call would make decoding quadratic in the input size.
    sub _unpack {
        my $byte = CORE::unpack( 'C', substr( $_[0], $p++, 1 ) ); # get header

        die "invalid data" unless defined $byte;

        if ( ( $byte >= 0x90 and $byte <= 0x9f ) or $byte == 0xdc or $byte == 0xdd ) { # array
            my $num = _unpack_length( $_[0], $byte, 0xdc, 0xdd, 0x0f );
            my @array;
            push @array, _unpack( $_[0] ) while $num-- > 0;
            return \@array;
        }
        elsif ( ( $byte >= 0x80 and $byte <= 0x8f ) or $byte == 0xde or $byte == 0xdf ) { # map
            my $num = _unpack_length( $_[0], $byte, 0xde, 0xdf, 0x0f );
            my %map;
            for ( 1 .. $num ) {
                no warnings; # for undef key case
                my $key = _unpack( $_[0] );
                my $val = _unpack( $_[0] );
                $map{ $key } = $val;
            }
            return \%map;
        }
        elsif ( $byte <= 0x7f ) { # positive fixnum
            return $byte;
        }
        elsif ( $byte >= 0xe0 ) { # negative fixnum
            return $byte - 256;
        }
        elsif ( ( $byte >= 0xa0 and $byte <= 0xbf ) or $byte == 0xda or $byte == 0xdb ) { # raw
            my $num = _unpack_length( $_[0], $byte, 0xda, 0xdb, 0x1f );
            _check_remaining( $_[0], $num );
            $p += $num;
            return substr( $_[0], $p - $num, $num );
        }
        elsif ( $byte == 0xc0 ) { # nil
            return undef; # always one element, also when called in list context
        }
        elsif ( $byte == 0xc2 ) { # boolean
            return false();
        }
        elsif ( $byte == 0xc3 ) { # boolean
            return true();
        }
        elsif ( $byte == 0xcc ) { # uint8
            _check_remaining( $_[0], 1 );
            return CORE::unpack( 'C', substr( $_[0], $p++, 1 ) );
        }
        elsif ( $byte == 0xcd ) { # uint16
            _check_remaining( $_[0], 2 );
            $p += 2;
            return unpack_uint16( $_[0], $p - 2 );
        }
        elsif ( $byte == 0xce ) { # uint32
            _check_remaining( $_[0], 4 );
            $p += 4;
            return unpack_uint32( $_[0], $p - 4 );
        }
        elsif ( $byte == 0xcf ) { # uint64
            _check_remaining( $_[0], 8 );
            $p += 8;
            return unpack_uint64( $_[0], $p - 8 );
        }
        elsif ( $byte == 0xd0 ) { # int8
            _check_remaining( $_[0], 1 );
            return CORE::unpack 'c', substr( $_[0], $p++, 1 ); # c / C
        }
        elsif ( $byte == 0xd1 ) { # int16
            _check_remaining( $_[0], 2 );
            $p += 2;
            return unpack_int16( $_[0], $p - 2 );
        }
        elsif ( $byte == 0xd2 ) { # int32
            _check_remaining( $_[0], 4 );
            $p += 4;
            return unpack_int32( $_[0], $p - 4 );
        }
        elsif ( $byte == 0xd3 ) { # int64
            _check_remaining( $_[0], 8 );
            $p += 8;
            return unpack_int64( $_[0], $p - 8 );
        }
        elsif ( $byte == 0xca ) { # float
            _check_remaining( $_[0], 4 );
            $p += 4;
            return unpack_float( $_[0], $p - 4 );
        }
        elsif ( $byte == 0xcb ) { # double
            _check_remaining( $_[0], 8 );
            $p += 8;
            return unpack_double( $_[0], $p - 8 );
        }
        else {
            _unexpected("byte 0x%02x", $byte);
        }
    }
} # UNPACK
#
# Data::MessagePack::Unpacker
#
package
Data::MessagePack::Unpacker;
2010-09-01 11:22:43 +09:00
use strict;
# Constructor: returns a new unpacker object, a hash blessed into the
# invoking class with its position counter at zero.
sub new {
    my $class = shift;
    my %state = ( pos => 0 );
    return bless \%state, $class;
}
# Same as execute(): every argument is handed on unchanged and execute()'s
# result is returned.
sub execute_limit {
    my @args = @_;
    return execute( @args );
}
{
    my $p; # scan cursor: offset of the next unread byte of $self->{data}

    # $unpacker->execute($data [, $offset [, $limit]])
    # Appends $data (from $offset on, at most $limit bytes when $limit is
    # true) to the bytes collected so far, then scans the whole collection
    # from its start.  The is_finished counter is bumped when the scan
    # finds one complete top-level value.  The final scan position is
    # stored in $self->{pos} and returned with $offset added.
    sub execute {
        my ( $self, $data, $offset, $limit ) = @_;
        $offset ||= 0;

        $self->{data} .= substr( $data, $offset, $limit ? $limit : length $data );

        # One counter per open container: the number of items still missing.
        local $self->{stack} = [];
        $p = 0;

        LOOP: while ( length( $self->{data} ) > $p ) {
            # a false result means the next item has not fully arrived yet
            _count( $self, $self->{data} ) or last;

            # one more item done; close every container this completes
            while ( @{ $self->{stack} } > 0 && --$self->{stack}->[-1] == 0 ) {
                pop @{ $self->{stack} };
            }

            if ( @{ $self->{stack} } == 0 ) {
                $self->{is_finished}++;
                last LOOP;
            }
        }

        $self->{pos} = $p;

        return $p + $offset;
    }

    # _read_length($buffer, $byte, $tag16, $tag32, $fix_mask)
    # Returns the entry count (byte count for raw) announced by the header
    # $byte, advancing the cursor past a 16- or 32-bit length field when
    # $byte is $tag16 / $tag32.  Returns undef when that field is not
    # completely inside the buffer.
    sub _read_length {
        my ( undef, $byte, $tag16, $tag32, $fix_mask ) = @_;
        return $byte & $fix_mask if $byte != $tag16 and $byte != $tag32;

        my ( $width, $template ) = $byte == $tag16 ? ( 2, 'n' ) : ( 4, 'N' );
        $p += $width;
        return undef if $p > length( $_[0] );
        return unpack( $template, substr( $_[0], $p - $width, $width ) );
    }

    # _count($self, $buffer)
    # Steps the cursor over the item that starts at it.  For an array or
    # map only the header is consumed and the number of expected items is
    # pushed on $self->{stack}.  Returns 1 when the item (or container
    # header) lies completely inside the buffer and 0 when it is cut short;
    # confesses on a header byte that does not start any known type.
    # The buffer is read through $_[1] so it is not copied for every item.
    sub _count {
        my $self = $_[0];
        my $size = length $_[1];
        my $byte = unpack( 'C', substr( $_[1], $p++, 1 ) ); # get header

        return 0 unless defined $byte; # nothing left to read

        # positive / negative fixnum, nil, false, true: header byte only
        if ( $byte <= 0x7f or $byte >= 0xe0
            or $byte == 0xc0 or $byte == 0xc2 or $byte == 0xc3 ) {
            return 1;
        }

        if ( ( $byte >= 0x90 and $byte <= 0x9f ) or $byte == 0xdc or $byte == 0xdd ) { # array
            my $num = _read_length( $_[1], $byte, 0xdc, 0xdd, 0x0f );
            return 0 unless defined $num;
            # + 1: execute() decrements once for the header itself
            push @{ $self->{stack} }, $num + 1 if $num > 0;
            return 1;
        }

        if ( ( $byte >= 0x80 and $byte <= 0x8f ) or $byte == 0xde or $byte == 0xdf ) { # map
            my $num = _read_length( $_[1], $byte, 0xde, 0xdf, 0x0f );
            return 0 unless defined $num;
            push @{ $self->{stack} }, $num * 2 + 1 if $num > 0; # a pair
            return 1;
        }

        if ( $byte >= 0xca and $byte <= 0xd3 ) { # fixed-width numbers
            # payload widths of 0xca .. 0xd3 in order:
            # float, double, uint8/16/32/64, int8/16/32/64
            $p += ( 4, 8, 1, 2, 4, 8, 1, 2, 4, 8 )[ $byte - 0xca ];
            return $p <= $size ? 1 : 0;
        }

        if ( ( $byte >= 0xa0 and $byte <= 0xbf ) or $byte == 0xda or $byte == 0xdb ) { # raw
            my $num = _read_length( $_[1], $byte, 0xda, 0xdb, 0x1f );
            return 0 unless defined $num;
            $p += $num;
            return $p <= $size ? 1 : 0;
        }

        # _unexpected lives in Data::MessagePack, not in this package
        Data::MessagePack::_unexpected("byte 0x%02x", $byte);

        return 0;
    }
} # execute
# Decodes the collected bytes up to the recorded scan position with
# Data::MessagePack->unpack and returns the result.
sub data {
    my ( $self ) = @_;
    my $scanned = substr( $self->{data}, 0, $self->{pos} );
    return Data::MessagePack->unpack( $scanned );
}
# Returns the object's is_finished field as it currently is.
sub is_finished {
    return $_[0]->{is_finished};
}
2010-09-17 13:37:17 +09:00
# Returns the object to its initial state: collected bytes dropped,
# position and finished counter set to zero.
sub reset :method {
    my ( $self ) = @_;
    $self->{data} = undef;
    $self->{pos}  = 0;
    return $self->{is_finished} = 0;
}
1;
__END__
=pod

=head1 NAME

Data::MessagePack::PP - Pure Perl implementation of Data::MessagePack

=head1 DESCRIPTION

This module is used by L<Data::MessagePack> internally.

=head1 SEE ALSO

L<http://msgpack.sourceforge.jp/>,
L<Data::MessagePack>,
L<http://frox25.no-ip.org/~mtve/wiki/MessagePack.html>

=head1 AUTHOR

makamaka

=head1 COPYRIGHT AND LICENSE

This library is free software; you can redistribute it and/or modify
it under the same terms as Perl itself.

=cut