Spaces:
Runtime error
Runtime error
| package # This is JSON::backportPP | |
| JSON::PP; | |
| # JSON-2.0 | |
| use 5.005; | |
| use strict; | |
| use base qw(Exporter); | |
| use overload (); | |
| use Carp (); | |
| use B (); | |
| #use Devel::Peek; | |
| use vars qw($VERSION); | |
| $VERSION = '2.27204'; | |
| @JSON::PP::EXPORT = qw(encode_json decode_json from_json to_json); | |
| # instead of hash-access, i tried index-access for speed. | |
| # but this method is not faster than what i expected. so it will be changed. | |
| use constant P_ASCII => 0; | |
| use constant P_LATIN1 => 1; | |
| use constant P_UTF8 => 2; | |
| use constant P_INDENT => 3; | |
| use constant P_CANONICAL => 4; | |
| use constant P_SPACE_BEFORE => 5; | |
| use constant P_SPACE_AFTER => 6; | |
| use constant P_ALLOW_NONREF => 7; | |
| use constant P_SHRINK => 8; | |
| use constant P_ALLOW_BLESSED => 9; | |
| use constant P_CONVERT_BLESSED => 10; | |
| use constant P_RELAXED => 11; | |
| use constant P_LOOSE => 12; | |
| use constant P_ALLOW_BIGNUM => 13; | |
| use constant P_ALLOW_BAREKEY => 14; | |
| use constant P_ALLOW_SINGLEQUOTE => 15; | |
| use constant P_ESCAPE_SLASH => 16; | |
| use constant P_AS_NONBLESSED => 17; | |
| use constant P_ALLOW_UNKNOWN => 18; | |
| use constant OLD_PERL => $] < 5.008 ? 1 : 0; | |
| BEGIN { | |
| my @xs_compati_bit_properties = qw( | |
| latin1 ascii utf8 indent canonical space_before space_after allow_nonref shrink | |
| allow_blessed convert_blessed relaxed allow_unknown | |
| ); | |
| my @pp_bit_properties = qw( | |
| allow_singlequote allow_bignum loose | |
| allow_barekey escape_slash as_nonblessed | |
| ); | |
| # Perl version check, Unicode handling is enable? | |
| # Helper module sets @JSON::PP::_properties. | |
| if ($] < 5.008 ) { | |
| my $helper = $] >= 5.006 ? 'JSON::backportPP::Compat5006' : 'JSON::backportPP::Compat5005'; | |
| eval qq| require $helper |; | |
| if ($@) { Carp::croak $@; } | |
| } | |
| for my $name (@xs_compati_bit_properties, @pp_bit_properties) { | |
| my $flag_name = 'P_' . uc($name); | |
| eval qq/ | |
| sub $name { | |
| my \$enable = defined \$_[1] ? \$_[1] : 1; | |
| if (\$enable) { | |
| \$_[0]->{PROPS}->[$flag_name] = 1; | |
| } | |
| else { | |
| \$_[0]->{PROPS}->[$flag_name] = 0; | |
| } | |
| \$_[0]; | |
| } | |
| sub get_$name { | |
| \$_[0]->{PROPS}->[$flag_name] ? 1 : ''; | |
| } | |
| /; | |
| } | |
| } | |
| # Functions | |
| my %encode_allow_method | |
| = map {($_ => 1)} qw/utf8 pretty allow_nonref latin1 self_encode escape_slash | |
| allow_blessed convert_blessed indent indent_length allow_bignum | |
| as_nonblessed | |
| /; | |
| my %decode_allow_method | |
| = map {($_ => 1)} qw/utf8 allow_nonref loose allow_singlequote allow_bignum | |
| allow_barekey max_size relaxed/; | |
| my $JSON; # cache | |
| sub encode_json ($) { # encode | |
| ($JSON ||= __PACKAGE__->new->utf8)->encode(@_); | |
| } | |
| sub decode_json { # decode | |
| ($JSON ||= __PACKAGE__->new->utf8)->decode(@_); | |
| } | |
| # Obsoleted | |
| sub to_json($) { | |
| Carp::croak ("JSON::PP::to_json has been renamed to encode_json."); | |
| } | |
| sub from_json($) { | |
| Carp::croak ("JSON::PP::from_json has been renamed to decode_json."); | |
| } | |
| # Methods | |
| sub new { | |
| my $class = shift; | |
| my $self = { | |
| max_depth => 512, | |
| max_size => 0, | |
| indent => 0, | |
| FLAGS => 0, | |
| fallback => sub { encode_error('Invalid value. JSON can only reference.') }, | |
| indent_length => 3, | |
| }; | |
| bless $self, $class; | |
| } | |
| sub encode { | |
| return $_[0]->PP_encode_json($_[1]); | |
| } | |
| sub decode { | |
| return $_[0]->PP_decode_json($_[1], 0x00000000); | |
| } | |
| sub decode_prefix { | |
| return $_[0]->PP_decode_json($_[1], 0x00000001); | |
| } | |
| # accessor | |
| # pretty printing | |
| sub pretty { | |
| my ($self, $v) = @_; | |
| my $enable = defined $v ? $v : 1; | |
| if ($enable) { # indent_length(3) for JSON::XS compatibility | |
| $self->indent(1)->indent_length(3)->space_before(1)->space_after(1); | |
| } | |
| else { | |
| $self->indent(0)->space_before(0)->space_after(0); | |
| } | |
| $self; | |
| } | |
| # etc | |
| sub max_depth { | |
| my $max = defined $_[1] ? $_[1] : 0x80000000; | |
| $_[0]->{max_depth} = $max; | |
| $_[0]; | |
| } | |
| sub get_max_depth { $_[0]->{max_depth}; } | |
| sub max_size { | |
| my $max = defined $_[1] ? $_[1] : 0; | |
| $_[0]->{max_size} = $max; | |
| $_[0]; | |
| } | |
| sub get_max_size { $_[0]->{max_size}; } | |
| sub filter_json_object { | |
| $_[0]->{cb_object} = defined $_[1] ? $_[1] : 0; | |
| $_[0]->{F_HOOK} = ($_[0]->{cb_object} or $_[0]->{cb_sk_object}) ? 1 : 0; | |
| $_[0]; | |
| } | |
| sub filter_json_single_key_object { | |
| if (@_ > 1) { | |
| $_[0]->{cb_sk_object}->{$_[1]} = $_[2]; | |
| } | |
| $_[0]->{F_HOOK} = ($_[0]->{cb_object} or $_[0]->{cb_sk_object}) ? 1 : 0; | |
| $_[0]; | |
| } | |
| sub indent_length { | |
| if (!defined $_[1] or $_[1] > 15 or $_[1] < 0) { | |
| Carp::carp "The acceptable range of indent_length() is 0 to 15."; | |
| } | |
| else { | |
| $_[0]->{indent_length} = $_[1]; | |
| } | |
| $_[0]; | |
| } | |
| sub get_indent_length { | |
| $_[0]->{indent_length}; | |
| } | |
| sub sort_by { | |
| $_[0]->{sort_by} = defined $_[1] ? $_[1] : 1; | |
| $_[0]; | |
| } | |
| sub allow_bigint { | |
| Carp::carp("allow_bigint() is obsoleted. use allow_bignum() insted."); | |
| } | |
| ############################### | |
| ### | |
| ### Perl => JSON | |
| ### | |
| { # Convert | |
| my $max_depth; | |
| my $indent; | |
| my $ascii; | |
| my $latin1; | |
| my $utf8; | |
| my $space_before; | |
| my $space_after; | |
| my $canonical; | |
| my $allow_blessed; | |
| my $convert_blessed; | |
| my $indent_length; | |
| my $escape_slash; | |
| my $bignum; | |
| my $as_nonblessed; | |
| my $depth; | |
| my $indent_count; | |
| my $keysort; | |
| sub PP_encode_json { | |
| my $self = shift; | |
| my $obj = shift; | |
| $indent_count = 0; | |
| $depth = 0; | |
| my $idx = $self->{PROPS}; | |
| ($ascii, $latin1, $utf8, $indent, $canonical, $space_before, $space_after, $allow_blessed, | |
| $convert_blessed, $escape_slash, $bignum, $as_nonblessed) | |
| = @{$idx}[P_ASCII .. P_SPACE_AFTER, P_ALLOW_BLESSED, P_CONVERT_BLESSED, | |
| P_ESCAPE_SLASH, P_ALLOW_BIGNUM, P_AS_NONBLESSED]; | |
| ($max_depth, $indent_length) = @{$self}{qw/max_depth indent_length/}; | |
| $keysort = $canonical ? sub { $a cmp $b } : undef; | |
| if ($self->{sort_by}) { | |
| $keysort = ref($self->{sort_by}) eq 'CODE' ? $self->{sort_by} | |
| : $self->{sort_by} =~ /\D+/ ? $self->{sort_by} | |
| : sub { $a cmp $b }; | |
| } | |
| encode_error("hash- or arrayref expected (not a simple scalar, use allow_nonref to allow this)") | |
| if(!ref $obj and !$idx->[ P_ALLOW_NONREF ]); | |
| my $str = $self->object_to_json($obj); | |
| $str .= "\n" if ( $indent ); # JSON::XS 2.26 compatible | |
| unless ($ascii or $latin1 or $utf8) { | |
| utf8::upgrade($str); | |
| } | |
| if ($idx->[ P_SHRINK ]) { | |
| utf8::downgrade($str, 1); | |
| } | |
| return $str; | |
| } | |
| sub object_to_json { | |
| my ($self, $obj) = @_; | |
| my $type = ref($obj); | |
| if($type eq 'HASH'){ | |
| return $self->hash_to_json($obj); | |
| } | |
| elsif($type eq 'ARRAY'){ | |
| return $self->array_to_json($obj); | |
| } | |
| elsif ($type) { # blessed object? | |
| if (blessed($obj)) { | |
| return $self->value_to_json($obj) if ( $obj->isa('JSON::PP::Boolean') ); | |
| if ( $convert_blessed and $obj->can('TO_JSON') ) { | |
| my $result = $obj->TO_JSON(); | |
| if ( defined $result and ref( $result ) ) { | |
| if ( refaddr( $obj ) eq refaddr( $result ) ) { | |
| encode_error( sprintf( | |
| "%s::TO_JSON method returned same object as was passed instead of a new one", | |
| ref $obj | |
| ) ); | |
| } | |
| } | |
| return $self->object_to_json( $result ); | |
| } | |
| return "$obj" if ( $bignum and _is_bignum($obj) ); | |
| return $self->blessed_to_json($obj) if ($allow_blessed and $as_nonblessed); # will be removed. | |
| encode_error( sprintf("encountered object '%s', but neither allow_blessed " | |
| . "nor convert_blessed settings are enabled", $obj) | |
| ) unless ($allow_blessed); | |
| return 'null'; | |
| } | |
| else { | |
| return $self->value_to_json($obj); | |
| } | |
| } | |
| else{ | |
| return $self->value_to_json($obj); | |
| } | |
| } | |
| sub hash_to_json { | |
| my ($self, $obj) = @_; | |
| my @res; | |
| encode_error("json text or perl structure exceeds maximum nesting level (max_depth set too low?)") | |
| if (++$depth > $max_depth); | |
| my ($pre, $post) = $indent ? $self->_up_indent() : ('', ''); | |
| my $del = ($space_before ? ' ' : '') . ':' . ($space_after ? ' ' : ''); | |
| for my $k ( _sort( $obj ) ) { | |
| if ( OLD_PERL ) { utf8::decode($k) } # key for Perl 5.6 / be optimized | |
| push @res, string_to_json( $self, $k ) | |
| . $del | |
| . ( $self->object_to_json( $obj->{$k} ) || $self->value_to_json( $obj->{$k} ) ); | |
| } | |
| --$depth; | |
| $self->_down_indent() if ($indent); | |
| return '{' . ( @res ? $pre : '' ) . ( @res ? join( ",$pre", @res ) . $post : '' ) . '}'; | |
| } | |
| sub array_to_json { | |
| my ($self, $obj) = @_; | |
| my @res; | |
| encode_error("json text or perl structure exceeds maximum nesting level (max_depth set too low?)") | |
| if (++$depth > $max_depth); | |
| my ($pre, $post) = $indent ? $self->_up_indent() : ('', ''); | |
| for my $v (@$obj){ | |
| push @res, $self->object_to_json($v) || $self->value_to_json($v); | |
| } | |
| --$depth; | |
| $self->_down_indent() if ($indent); | |
| return '[' . ( @res ? $pre : '' ) . ( @res ? join( ",$pre", @res ) . $post : '' ) . ']'; | |
| } | |
| sub value_to_json { | |
| my ($self, $value) = @_; | |
| return 'null' if(!defined $value); | |
| my $b_obj = B::svref_2object(\$value); # for round trip problem | |
| my $flags = $b_obj->FLAGS; | |
| return $value # as is | |
| if $flags & ( B::SVp_IOK | B::SVp_NOK ) and !( $flags & B::SVp_POK ); # SvTYPE is IV or NV? | |
| my $type = ref($value); | |
| if(!$type){ | |
| return string_to_json($self, $value); | |
| } | |
| elsif( blessed($value) and $value->isa('JSON::PP::Boolean') ){ | |
| return $$value == 1 ? 'true' : 'false'; | |
| } | |
| elsif ($type) { | |
| if ((overload::StrVal($value) =~ /=(\w+)/)[0]) { | |
| return $self->value_to_json("$value"); | |
| } | |
| if ($type eq 'SCALAR' and defined $$value) { | |
| return $$value eq '1' ? 'true' | |
| : $$value eq '0' ? 'false' | |
| : $self->{PROPS}->[ P_ALLOW_UNKNOWN ] ? 'null' | |
| : encode_error("cannot encode reference to scalar"); | |
| } | |
| if ( $self->{PROPS}->[ P_ALLOW_UNKNOWN ] ) { | |
| return 'null'; | |
| } | |
| else { | |
| if ( $type eq 'SCALAR' or $type eq 'REF' ) { | |
| encode_error("cannot encode reference to scalar"); | |
| } | |
| else { | |
| encode_error("encountered $value, but JSON can only represent references to arrays or hashes"); | |
| } | |
| } | |
| } | |
| else { | |
| return $self->{fallback}->($value) | |
| if ($self->{fallback} and ref($self->{fallback}) eq 'CODE'); | |
| return 'null'; | |
| } | |
| } | |
| my %esc = ( | |
| "\n" => '\n', | |
| "\r" => '\r', | |
| "\t" => '\t', | |
| "\f" => '\f', | |
| "\b" => '\b', | |
| "\"" => '\"', | |
| "\\" => '\\\\', | |
| "\'" => '\\\'', | |
| ); | |
| sub string_to_json { | |
| my ($self, $arg) = @_; | |
| $arg =~ s/([\x22\x5c\n\r\t\f\b])/$esc{$1}/g; | |
| $arg =~ s/\//\\\//g if ($escape_slash); | |
| $arg =~ s/([\x00-\x08\x0b\x0e-\x1f])/'\\u00' . unpack('H2', $1)/eg; | |
| if ($ascii) { | |
| $arg = JSON_PP_encode_ascii($arg); | |
| } | |
| if ($latin1) { | |
| $arg = JSON_PP_encode_latin1($arg); | |
| } | |
| if ($utf8) { | |
| utf8::encode($arg); | |
| } | |
| return '"' . $arg . '"'; | |
| } | |
| sub blessed_to_json { | |
| my $reftype = reftype($_[1]) || ''; | |
| if ($reftype eq 'HASH') { | |
| return $_[0]->hash_to_json($_[1]); | |
| } | |
| elsif ($reftype eq 'ARRAY') { | |
| return $_[0]->array_to_json($_[1]); | |
| } | |
| else { | |
| return 'null'; | |
| } | |
| } | |
| sub encode_error { | |
| my $error = shift; | |
| Carp::croak "$error"; | |
| } | |
| sub _sort { | |
| defined $keysort ? (sort $keysort (keys %{$_[0]})) : keys %{$_[0]}; | |
| } | |
| sub _up_indent { | |
| my $self = shift; | |
| my $space = ' ' x $indent_length; | |
| my ($pre,$post) = ('',''); | |
| $post = "\n" . $space x $indent_count; | |
| $indent_count++; | |
| $pre = "\n" . $space x $indent_count; | |
| return ($pre,$post); | |
| } | |
| sub _down_indent { $indent_count--; } | |
| sub PP_encode_box { | |
| { | |
| depth => $depth, | |
| indent_count => $indent_count, | |
| }; | |
| } | |
| } # Convert | |
| sub _encode_ascii { | |
| join('', | |
| map { | |
| $_ <= 127 ? | |
| chr($_) : | |
| $_ <= 65535 ? | |
| sprintf('\u%04x', $_) : sprintf('\u%x\u%x', _encode_surrogates($_)); | |
| } unpack('U*', $_[0]) | |
| ); | |
| } | |
| sub _encode_latin1 { | |
| join('', | |
| map { | |
| $_ <= 255 ? | |
| chr($_) : | |
| $_ <= 65535 ? | |
| sprintf('\u%04x', $_) : sprintf('\u%x\u%x', _encode_surrogates($_)); | |
| } unpack('U*', $_[0]) | |
| ); | |
| } | |
| sub _encode_surrogates { # from perlunicode | |
| my $uni = $_[0] - 0x10000; | |
| return ($uni / 0x400 + 0xD800, $uni % 0x400 + 0xDC00); | |
| } | |
| sub _is_bignum { | |
| $_[0]->isa('Math::BigInt') or $_[0]->isa('Math::BigFloat'); | |
| } | |
| # | |
| # JSON => Perl | |
| # | |
| my $max_intsize; | |
| BEGIN { | |
| my $checkint = 1111; | |
| for my $d (5..64) { | |
| $checkint .= 1; | |
| my $int = eval qq| $checkint |; | |
| if ($int =~ /[eE]/) { | |
| $max_intsize = $d - 1; | |
| last; | |
| } | |
| } | |
| } | |
| { # PARSE | |
| my %escapes = ( # by Jeremy Muhlich <jmuhlich [at] bitflood.org> | |
| b => "\x8", | |
| t => "\x9", | |
| n => "\xA", | |
| f => "\xC", | |
| r => "\xD", | |
| '\\' => '\\', | |
| '"' => '"', | |
| '/' => '/', | |
| ); | |
| my $text; # json data | |
| my $at; # offset | |
| my $ch; # 1chracter | |
| my $len; # text length (changed according to UTF8 or NON UTF8) | |
| # INTERNAL | |
| my $depth; # nest counter | |
| my $encoding; # json text encoding | |
| my $is_valid_utf8; # temp variable | |
| my $utf8_len; # utf8 byte length | |
| # FLAGS | |
| my $utf8; # must be utf8 | |
| my $max_depth; # max nest number of objects and arrays | |
| my $max_size; | |
| my $relaxed; | |
| my $cb_object; | |
| my $cb_sk_object; | |
| my $F_HOOK; | |
| my $allow_bigint; # using Math::BigInt | |
| my $singlequote; # loosely quoting | |
| my $loose; # | |
| my $allow_barekey; # bareKey | |
| # $opt flag | |
| # 0x00000001 .... decode_prefix | |
| # 0x10000000 .... incr_parse | |
| sub PP_decode_json { | |
| my ($self, $opt); # $opt is an effective flag during this decode_json. | |
| ($self, $text, $opt) = @_; | |
| ($at, $ch, $depth) = (0, '', 0); | |
| if ( !defined $text or ref $text ) { | |
| decode_error("malformed JSON string, neither array, object, number, string or atom"); | |
| } | |
| my $idx = $self->{PROPS}; | |
| ($utf8, $relaxed, $loose, $allow_bigint, $allow_barekey, $singlequote) | |
| = @{$idx}[P_UTF8, P_RELAXED, P_LOOSE .. P_ALLOW_SINGLEQUOTE]; | |
| if ( $utf8 ) { | |
| utf8::downgrade( $text, 1 ) or Carp::croak("Wide character in subroutine entry"); | |
| } | |
| else { | |
| utf8::upgrade( $text ); | |
| } | |
| $len = length $text; | |
| ($max_depth, $max_size, $cb_object, $cb_sk_object, $F_HOOK) | |
| = @{$self}{qw/max_depth max_size cb_object cb_sk_object F_HOOK/}; | |
| if ($max_size > 1) { | |
| use bytes; | |
| my $bytes = length $text; | |
| decode_error( | |
| sprintf("attempted decode of JSON text of %s bytes size, but max_size is set to %s" | |
| , $bytes, $max_size), 1 | |
| ) if ($bytes > $max_size); | |
| } | |
| # Currently no effect | |
| # should use regexp | |
| my @octets = unpack('C4', $text); | |
| $encoding = ( $octets[0] and $octets[1]) ? 'UTF-8' | |
| : (!$octets[0] and $octets[1]) ? 'UTF-16BE' | |
| : (!$octets[0] and !$octets[1]) ? 'UTF-32BE' | |
| : ( $octets[2] ) ? 'UTF-16LE' | |
| : (!$octets[2] ) ? 'UTF-32LE' | |
| : 'unknown'; | |
| white(); # remove head white space | |
| my $valid_start = defined $ch; # Is there a first character for JSON structure? | |
| my $result = value(); | |
| return undef if ( !$result && ( $opt & 0x10000000 ) ); # for incr_parse | |
| decode_error("malformed JSON string, neither array, object, number, string or atom") unless $valid_start; | |
| if ( !$idx->[ P_ALLOW_NONREF ] and !ref $result ) { | |
| decode_error( | |
| 'JSON text must be an object or array (but found number, string, true, false or null,' | |
| . ' use allow_nonref to allow this)', 1); | |
| } | |
| Carp::croak('something wrong.') if $len < $at; # we won't arrive here. | |
| my $consumed = defined $ch ? $at - 1 : $at; # consumed JSON text length | |
| white(); # remove tail white space | |
| if ( $ch ) { | |
| return ( $result, $consumed ) if ($opt & 0x00000001); # all right if decode_prefix | |
| decode_error("garbage after JSON object"); | |
| } | |
| ( $opt & 0x00000001 ) ? ( $result, $consumed ) : $result; | |
| } | |
| sub next_chr { | |
| return $ch = undef if($at >= $len); | |
| $ch = substr($text, $at++, 1); | |
| } | |
| sub value { | |
| white(); | |
| return if(!defined $ch); | |
| return object() if($ch eq '{'); | |
| return array() if($ch eq '['); | |
| return string() if($ch eq '"' or ($singlequote and $ch eq "'")); | |
| return number() if($ch =~ /[0-9]/ or $ch eq '-'); | |
| return word(); | |
| } | |
| sub string { | |
| my ($i, $s, $t, $u); | |
| my $utf16; | |
| my $is_utf8; | |
| ($is_valid_utf8, $utf8_len) = ('', 0); | |
| $s = ''; # basically UTF8 flag on | |
| if($ch eq '"' or ($singlequote and $ch eq "'")){ | |
| my $boundChar = $ch; | |
| OUTER: while( defined(next_chr()) ){ | |
| if($ch eq $boundChar){ | |
| next_chr(); | |
| if ($utf16) { | |
| decode_error("missing low surrogate character in surrogate pair"); | |
| } | |
| utf8::decode($s) if($is_utf8); | |
| return $s; | |
| } | |
| elsif($ch eq '\\'){ | |
| next_chr(); | |
| if(exists $escapes{$ch}){ | |
| $s .= $escapes{$ch}; | |
| } | |
| elsif($ch eq 'u'){ # UNICODE handling | |
| my $u = ''; | |
| for(1..4){ | |
| $ch = next_chr(); | |
| last OUTER if($ch !~ /[0-9a-fA-F]/); | |
| $u .= $ch; | |
| } | |
| # U+D800 - U+DBFF | |
| if ($u =~ /^[dD][89abAB][0-9a-fA-F]{2}/) { # UTF-16 high surrogate? | |
| $utf16 = $u; | |
| } | |
| # U+DC00 - U+DFFF | |
| elsif ($u =~ /^[dD][c-fC-F][0-9a-fA-F]{2}/) { # UTF-16 low surrogate? | |
| unless (defined $utf16) { | |
| decode_error("missing high surrogate character in surrogate pair"); | |
| } | |
| $is_utf8 = 1; | |
| $s .= JSON_PP_decode_surrogates($utf16, $u) || next; | |
| $utf16 = undef; | |
| } | |
| else { | |
| if (defined $utf16) { | |
| decode_error("surrogate pair expected"); | |
| } | |
| if ( ( my $hex = hex( $u ) ) > 127 ) { | |
| $is_utf8 = 1; | |
| $s .= JSON_PP_decode_unicode($u) || next; | |
| } | |
| else { | |
| $s .= chr $hex; | |
| } | |
| } | |
| } | |
| else{ | |
| unless ($loose) { | |
| $at -= 2; | |
| decode_error('illegal backslash escape sequence in string'); | |
| } | |
| $s .= $ch; | |
| } | |
| } | |
| else{ | |
| if ( ord $ch > 127 ) { | |
| if ( $utf8 ) { | |
| unless( $ch = is_valid_utf8($ch) ) { | |
| $at -= 1; | |
| decode_error("malformed UTF-8 character in JSON string"); | |
| } | |
| else { | |
| $at += $utf8_len - 1; | |
| } | |
| } | |
| else { | |
| utf8::encode( $ch ); | |
| } | |
| $is_utf8 = 1; | |
| } | |
| if (!$loose) { | |
| if ($ch =~ /[\x00-\x1f\x22\x5c]/) { # '/' ok | |
| $at--; | |
| decode_error('invalid character encountered while parsing JSON string'); | |
| } | |
| } | |
| $s .= $ch; | |
| } | |
| } | |
| } | |
| decode_error("unexpected end of string while parsing JSON string"); | |
| } | |
| sub white { | |
| while( defined $ch ){ | |
| if($ch le ' '){ | |
| next_chr(); | |
| } | |
| elsif($ch eq '/'){ | |
| next_chr(); | |
| if(defined $ch and $ch eq '/'){ | |
| 1 while(defined(next_chr()) and $ch ne "\n" and $ch ne "\r"); | |
| } | |
| elsif(defined $ch and $ch eq '*'){ | |
| next_chr(); | |
| while(1){ | |
| if(defined $ch){ | |
| if($ch eq '*'){ | |
| if(defined(next_chr()) and $ch eq '/'){ | |
| next_chr(); | |
| last; | |
| } | |
| } | |
| else{ | |
| next_chr(); | |
| } | |
| } | |
| else{ | |
| decode_error("Unterminated comment"); | |
| } | |
| } | |
| next; | |
| } | |
| else{ | |
| $at--; | |
| decode_error("malformed JSON string, neither array, object, number, string or atom"); | |
| } | |
| } | |
| else{ | |
| if ($relaxed and $ch eq '#') { # correctly? | |
| pos($text) = $at; | |
| $text =~ /\G([^\n]*(?:\r\n|\r|\n|$))/g; | |
| $at = pos($text); | |
| next_chr; | |
| next; | |
| } | |
| last; | |
| } | |
| } | |
| } | |
| sub array { | |
| my $a = $_[0] || []; # you can use this code to use another array ref object. | |
| decode_error('json text or perl structure exceeds maximum nesting level (max_depth set too low?)') | |
| if (++$depth > $max_depth); | |
| next_chr(); | |
| white(); | |
| if(defined $ch and $ch eq ']'){ | |
| --$depth; | |
| next_chr(); | |
| return $a; | |
| } | |
| else { | |
| while(defined($ch)){ | |
| push @$a, value(); | |
| white(); | |
| if (!defined $ch) { | |
| last; | |
| } | |
| if($ch eq ']'){ | |
| --$depth; | |
| next_chr(); | |
| return $a; | |
| } | |
| if($ch ne ','){ | |
| last; | |
| } | |
| next_chr(); | |
| white(); | |
| if ($relaxed and $ch eq ']') { | |
| --$depth; | |
| next_chr(); | |
| return $a; | |
| } | |
| } | |
| } | |
| decode_error(", or ] expected while parsing array"); | |
| } | |
| sub object { | |
| my $o = $_[0] || {}; # you can use this code to use another hash ref object. | |
| my $k; | |
| decode_error('json text or perl structure exceeds maximum nesting level (max_depth set too low?)') | |
| if (++$depth > $max_depth); | |
| next_chr(); | |
| white(); | |
| if(defined $ch and $ch eq '}'){ | |
| --$depth; | |
| next_chr(); | |
| if ($F_HOOK) { | |
| return _json_object_hook($o); | |
| } | |
| return $o; | |
| } | |
| else { | |
| while (defined $ch) { | |
| $k = ($allow_barekey and $ch ne '"' and $ch ne "'") ? bareKey() : string(); | |
| white(); | |
| if(!defined $ch or $ch ne ':'){ | |
| $at--; | |
| decode_error("':' expected"); | |
| } | |
| next_chr(); | |
| $o->{$k} = value(); | |
| white(); | |
| last if (!defined $ch); | |
| if($ch eq '}'){ | |
| --$depth; | |
| next_chr(); | |
| if ($F_HOOK) { | |
| return _json_object_hook($o); | |
| } | |
| return $o; | |
| } | |
| if($ch ne ','){ | |
| last; | |
| } | |
| next_chr(); | |
| white(); | |
| if ($relaxed and $ch eq '}') { | |
| --$depth; | |
| next_chr(); | |
| if ($F_HOOK) { | |
| return _json_object_hook($o); | |
| } | |
| return $o; | |
| } | |
| } | |
| } | |
| $at--; | |
| decode_error(", or } expected while parsing object/hash"); | |
| } | |
| sub bareKey { # doesn't strictly follow Standard ECMA-262 3rd Edition | |
| my $key; | |
| while($ch =~ /[^\x00-\x23\x25-\x2F\x3A-\x40\x5B-\x5E\x60\x7B-\x7F]/){ | |
| $key .= $ch; | |
| next_chr(); | |
| } | |
| return $key; | |
| } | |
| sub word { | |
| my $word = substr($text,$at-1,4); | |
| if($word eq 'true'){ | |
| $at += 3; | |
| next_chr; | |
| return $JSON::PP::true; | |
| } | |
| elsif($word eq 'null'){ | |
| $at += 3; | |
| next_chr; | |
| return undef; | |
| } | |
| elsif($word eq 'fals'){ | |
| $at += 3; | |
| if(substr($text,$at,1) eq 'e'){ | |
| $at++; | |
| next_chr; | |
| return $JSON::PP::false; | |
| } | |
| } | |
| $at--; # for decode_error report | |
| decode_error("'null' expected") if ($word =~ /^n/); | |
| decode_error("'true' expected") if ($word =~ /^t/); | |
| decode_error("'false' expected") if ($word =~ /^f/); | |
| decode_error("malformed JSON string, neither array, object, number, string or atom"); | |
| } | |
| sub number { | |
| my $n = ''; | |
| my $v; | |
| # According to RFC4627, hex or oct digits are invalid. | |
| if($ch eq '0'){ | |
| my $peek = substr($text,$at,1); | |
| my $hex = $peek =~ /[xX]/; # 0 or 1 | |
| if($hex){ | |
| decode_error("malformed number (leading zero must not be followed by another digit)"); | |
| ($n) = ( substr($text, $at+1) =~ /^([0-9a-fA-F]+)/); | |
| } | |
| else{ # oct | |
| ($n) = ( substr($text, $at) =~ /^([0-7]+)/); | |
| if (defined $n and length $n > 1) { | |
| decode_error("malformed number (leading zero must not be followed by another digit)"); | |
| } | |
| } | |
| if(defined $n and length($n)){ | |
| if (!$hex and length($n) == 1) { | |
| decode_error("malformed number (leading zero must not be followed by another digit)"); | |
| } | |
| $at += length($n) + $hex; | |
| next_chr; | |
| return $hex ? hex($n) : oct($n); | |
| } | |
| } | |
| if($ch eq '-'){ | |
| $n = '-'; | |
| next_chr; | |
| if (!defined $ch or $ch !~ /\d/) { | |
| decode_error("malformed number (no digits after initial minus)"); | |
| } | |
| } | |
| while(defined $ch and $ch =~ /\d/){ | |
| $n .= $ch; | |
| next_chr; | |
| } | |
| if(defined $ch and $ch eq '.'){ | |
| $n .= '.'; | |
| next_chr; | |
| if (!defined $ch or $ch !~ /\d/) { | |
| decode_error("malformed number (no digits after decimal point)"); | |
| } | |
| else { | |
| $n .= $ch; | |
| } | |
| while(defined(next_chr) and $ch =~ /\d/){ | |
| $n .= $ch; | |
| } | |
| } | |
| if(defined $ch and ($ch eq 'e' or $ch eq 'E')){ | |
| $n .= $ch; | |
| next_chr; | |
| if(defined($ch) and ($ch eq '+' or $ch eq '-')){ | |
| $n .= $ch; | |
| next_chr; | |
| if (!defined $ch or $ch =~ /\D/) { | |
| decode_error("malformed number (no digits after exp sign)"); | |
| } | |
| $n .= $ch; | |
| } | |
| elsif(defined($ch) and $ch =~ /\d/){ | |
| $n .= $ch; | |
| } | |
| else { | |
| decode_error("malformed number (no digits after exp sign)"); | |
| } | |
| while(defined(next_chr) and $ch =~ /\d/){ | |
| $n .= $ch; | |
| } | |
| } | |
| $v .= $n; | |
| if ($v !~ /[.eE]/ and length $v > $max_intsize) { | |
| if ($allow_bigint) { # from Adam Sussman | |
| require Math::BigInt; | |
| return Math::BigInt->new($v); | |
| } | |
| else { | |
| return "$v"; | |
| } | |
| } | |
| elsif ($allow_bigint) { | |
| require Math::BigFloat; | |
| return Math::BigFloat->new($v); | |
| } | |
| return 0+$v; | |
| } | |
| sub is_valid_utf8 { | |
| $utf8_len = $_[0] =~ /[\x00-\x7F]/ ? 1 | |
| : $_[0] =~ /[\xC2-\xDF]/ ? 2 | |
| : $_[0] =~ /[\xE0-\xEF]/ ? 3 | |
| : $_[0] =~ /[\xF0-\xF4]/ ? 4 | |
| : 0 | |
| ; | |
| return unless $utf8_len; | |
| my $is_valid_utf8 = substr($text, $at - 1, $utf8_len); | |
| return ( $is_valid_utf8 =~ /^(?: | |
| [\x00-\x7F] | |
| |[\xC2-\xDF][\x80-\xBF] | |
| |[\xE0][\xA0-\xBF][\x80-\xBF] | |
| |[\xE1-\xEC][\x80-\xBF][\x80-\xBF] | |
| |[\xED][\x80-\x9F][\x80-\xBF] | |
| |[\xEE-\xEF][\x80-\xBF][\x80-\xBF] | |
| |[\xF0][\x90-\xBF][\x80-\xBF][\x80-\xBF] | |
| |[\xF1-\xF3][\x80-\xBF][\x80-\xBF][\x80-\xBF] | |
| |[\xF4][\x80-\x8F][\x80-\xBF][\x80-\xBF] | |
| )$/x ) ? $is_valid_utf8 : ''; | |
| } | |
| sub decode_error { | |
| my $error = shift; | |
| my $no_rep = shift; | |
| my $str = defined $text ? substr($text, $at) : ''; | |
| my $mess = ''; | |
| my $type = $] >= 5.008 ? 'U*' | |
| : $] < 5.006 ? 'C*' | |
| : utf8::is_utf8( $str ) ? 'U*' # 5.6 | |
| : 'C*' | |
| ; | |
| for my $c ( unpack( $type, $str ) ) { # emulate pv_uni_display() ? | |
| $mess .= $c == 0x07 ? '\a' | |
| : $c == 0x09 ? '\t' | |
| : $c == 0x0a ? '\n' | |
| : $c == 0x0d ? '\r' | |
| : $c == 0x0c ? '\f' | |
| : $c < 0x20 ? sprintf('\x{%x}', $c) | |
| : $c == 0x5c ? '\\\\' | |
| : $c < 0x80 ? chr($c) | |
| : sprintf('\x{%x}', $c) | |
| ; | |
| if ( length $mess >= 20 ) { | |
| $mess .= '...'; | |
| last; | |
| } | |
| } | |
| unless ( length $mess ) { | |
| $mess = '(end of string)'; | |
| } | |
| Carp::croak ( | |
| $no_rep ? "$error" : "$error, at character offset $at (before \"$mess\")" | |
| ); | |
| } | |
| sub _json_object_hook { | |
| my $o = $_[0]; | |
| my @ks = keys %{$o}; | |
| if ( $cb_sk_object and @ks == 1 and exists $cb_sk_object->{ $ks[0] } and ref $cb_sk_object->{ $ks[0] } ) { | |
| my @val = $cb_sk_object->{ $ks[0] }->( $o->{$ks[0]} ); | |
| if (@val == 1) { | |
| return $val[0]; | |
| } | |
| } | |
| my @val = $cb_object->($o) if ($cb_object); | |
| if (@val == 0 or @val > 1) { | |
| return $o; | |
| } | |
| else { | |
| return $val[0]; | |
| } | |
| } | |
| sub PP_decode_box { | |
| { | |
| text => $text, | |
| at => $at, | |
| ch => $ch, | |
| len => $len, | |
| depth => $depth, | |
| encoding => $encoding, | |
| is_valid_utf8 => $is_valid_utf8, | |
| }; | |
| } | |
| } # PARSE | |
| sub _decode_surrogates { # from perlunicode | |
| my $uni = 0x10000 + (hex($_[0]) - 0xD800) * 0x400 + (hex($_[1]) - 0xDC00); | |
| my $un = pack('U*', $uni); | |
| utf8::encode( $un ); | |
| return $un; | |
| } | |
| sub _decode_unicode { | |
| my $un = pack('U', hex shift); | |
| utf8::encode( $un ); | |
| return $un; | |
| } | |
| # | |
| # Setup for various Perl versions (the code from JSON::PP58) | |
| # | |
| BEGIN { | |
| unless ( defined &utf8::is_utf8 ) { | |
| require Encode; | |
| *utf8::is_utf8 = *Encode::is_utf8; | |
| } | |
| if ( $] >= 5.008 ) { | |
| *JSON::PP::JSON_PP_encode_ascii = \&_encode_ascii; | |
| *JSON::PP::JSON_PP_encode_latin1 = \&_encode_latin1; | |
| *JSON::PP::JSON_PP_decode_surrogates = \&_decode_surrogates; | |
| *JSON::PP::JSON_PP_decode_unicode = \&_decode_unicode; | |
| } | |
| if ($] >= 5.008 and $] < 5.008003) { # join() in 5.8.0 - 5.8.2 is broken. | |
| package # hide from PAUSE | |
| JSON::PP; | |
| require subs; | |
| subs->import('join'); | |
| eval q| | |
| sub join { | |
| return '' if (@_ < 2); | |
| my $j = shift; | |
| my $str = shift; | |
| for (@_) { $str .= $j . $_; } | |
| return $str; | |
| } | |
| |; | |
| } | |
| sub JSON::PP::incr_parse { | |
| local $Carp::CarpLevel = 1; | |
| ( $_[0]->{_incr_parser} ||= JSON::PP::IncrParser->new )->incr_parse( @_ ); | |
| } | |
| sub JSON::PP::incr_skip { | |
| ( $_[0]->{_incr_parser} ||= JSON::PP::IncrParser->new )->incr_skip; | |
| } | |
| sub JSON::PP::incr_reset { | |
| ( $_[0]->{_incr_parser} ||= JSON::PP::IncrParser->new )->incr_reset; | |
| } | |
| eval q{ | |
| sub JSON::PP::incr_text : lvalue { | |
| $_[0]->{_incr_parser} ||= JSON::PP::IncrParser->new; | |
| if ( $_[0]->{_incr_parser}->{incr_parsing} ) { | |
| Carp::croak("incr_text can not be called when the incremental parser already started parsing"); | |
| } | |
| $_[0]->{_incr_parser}->{incr_text}; | |
| } | |
| } if ( $] >= 5.006 ); | |
| } # Setup for various Perl versions (the code from JSON::PP58) | |
| ############################### | |
| # Utilities | |
| # | |
| BEGIN { | |
| eval 'require Scalar::Util'; | |
| unless($@){ | |
| *JSON::PP::blessed = \&Scalar::Util::blessed; | |
| *JSON::PP::reftype = \&Scalar::Util::reftype; | |
| *JSON::PP::refaddr = \&Scalar::Util::refaddr; | |
| } | |
| else{ # This code is from Scalar::Util. | |
| # warn $@; | |
| eval 'sub UNIVERSAL::a_sub_not_likely_to_be_here { ref($_[0]) }'; | |
| *JSON::PP::blessed = sub { | |
| local($@, $SIG{__DIE__}, $SIG{__WARN__}); | |
| ref($_[0]) ? eval { $_[0]->a_sub_not_likely_to_be_here } : undef; | |
| }; | |
| my %tmap = qw( | |
| B::NULL SCALAR | |
| B::HV HASH | |
| B::AV ARRAY | |
| B::CV CODE | |
| B::IO IO | |
| B::GV GLOB | |
| B::REGEXP REGEXP | |
| ); | |
| *JSON::PP::reftype = sub { | |
| my $r = shift; | |
| return undef unless length(ref($r)); | |
| my $t = ref(B::svref_2object($r)); | |
| return | |
| exists $tmap{$t} ? $tmap{$t} | |
| : length(ref($$r)) ? 'REF' | |
| : 'SCALAR'; | |
| }; | |
| *JSON::PP::refaddr = sub { | |
| return undef unless length(ref($_[0])); | |
| my $addr; | |
| if(defined(my $pkg = blessed($_[0]))) { | |
| $addr .= bless $_[0], 'Scalar::Util::Fake'; | |
| bless $_[0], $pkg; | |
| } | |
| else { | |
| $addr .= $_[0] | |
| } | |
| $addr =~ /0x(\w+)/; | |
| local $^W; | |
| #no warnings 'portable'; | |
| hex($1); | |
| } | |
| } | |
| } | |
| # shamelessly copied and modified from JSON::XS code. | |
| unless ( $INC{'JSON/PP.pm'} ) { | |
| eval q| | |
| package | |
| JSON::PP::Boolean; | |
| use overload ( | |
| "0+" => sub { ${$_[0]} }, | |
| "++" => sub { $_[0] = ${$_[0]} + 1 }, | |
| "--" => sub { $_[0] = ${$_[0]} - 1 }, | |
| fallback => 1, | |
| ); | |
| |; | |
| } | |
| $JSON::PP::true = do { bless \(my $dummy = 1), "JSON::PP::Boolean" }; | |
| $JSON::PP::false = do { bless \(my $dummy = 0), "JSON::PP::Boolean" }; | |
| sub is_bool { defined $_[0] and UNIVERSAL::isa($_[0], "JSON::PP::Boolean"); } | |
| sub true { $JSON::PP::true } | |
| sub false { $JSON::PP::false } | |
| sub null { undef; } | |
| ############################### | |
| ############################### | |
| package # hide from PAUSE | |
| JSON::PP::IncrParser; | |
| use strict; | |
| use constant INCR_M_WS => 0; # initial whitespace skipping | |
| use constant INCR_M_STR => 1; # inside string | |
| use constant INCR_M_BS => 2; # inside backslash | |
| use constant INCR_M_JSON => 3; # outside anything, count nesting | |
| use constant INCR_M_C0 => 4; | |
| use constant INCR_M_C1 => 5; | |
| use vars qw($VERSION); | |
| $VERSION = '1.01'; | |
| my $unpack_format = $] < 5.006 ? 'C*' : 'U*'; | |
| sub new { | |
| my ( $class ) = @_; | |
| bless { | |
| incr_nest => 0, | |
| incr_text => undef, | |
| incr_parsing => 0, | |
| incr_p => 0, | |
| }, $class; | |
| } | |
| sub incr_parse { | |
| my ( $self, $coder, $text ) = @_; | |
| $self->{incr_text} = '' unless ( defined $self->{incr_text} ); | |
| if ( defined $text ) { | |
| if ( utf8::is_utf8( $text ) and !utf8::is_utf8( $self->{incr_text} ) ) { | |
| utf8::upgrade( $self->{incr_text} ) ; | |
| utf8::decode( $self->{incr_text} ) ; | |
| } | |
| $self->{incr_text} .= $text; | |
| } | |
| my $max_size = $coder->get_max_size; | |
| if ( defined wantarray ) { | |
| $self->{incr_mode} = INCR_M_WS unless defined $self->{incr_mode}; | |
| if ( wantarray ) { | |
| my @ret; | |
| $self->{incr_parsing} = 1; | |
| do { | |
| push @ret, $self->_incr_parse( $coder, $self->{incr_text} ); | |
| unless ( !$self->{incr_nest} and $self->{incr_mode} == INCR_M_JSON ) { | |
| $self->{incr_mode} = INCR_M_WS if $self->{incr_mode} != INCR_M_STR; | |
| } | |
| } until ( length $self->{incr_text} >= $self->{incr_p} ); | |
| $self->{incr_parsing} = 0; | |
| return @ret; | |
| } | |
| else { # in scalar context | |
| $self->{incr_parsing} = 1; | |
| my $obj = $self->_incr_parse( $coder, $self->{incr_text} ); | |
| $self->{incr_parsing} = 0 if defined $obj; # pointed by Martin J. Evans | |
| return $obj ? $obj : undef; # $obj is an empty string, parsing was completed. | |
| } | |
| } | |
| } | |
| sub _incr_parse { | |
| my ( $self, $coder, $text, $skip ) = @_; | |
| my $p = $self->{incr_p}; | |
| my $restore = $p; | |
| my @obj; | |
| my $len = length $text; | |
| if ( $self->{incr_mode} == INCR_M_WS ) { | |
| while ( $len > $p ) { | |
| my $s = substr( $text, $p, 1 ); | |
| $p++ and next if ( 0x20 >= unpack($unpack_format, $s) ); | |
| $self->{incr_mode} = INCR_M_JSON; | |
| last; | |
| } | |
| } | |
| while ( $len > $p ) { | |
| my $s = substr( $text, $p++, 1 ); | |
| if ( $s eq '"' ) { | |
| if (substr( $text, $p - 2, 1 ) eq '\\' ) { | |
| next; | |
| } | |
| if ( $self->{incr_mode} != INCR_M_STR ) { | |
| $self->{incr_mode} = INCR_M_STR; | |
| } | |
| else { | |
| $self->{incr_mode} = INCR_M_JSON; | |
| unless ( $self->{incr_nest} ) { | |
| last; | |
| } | |
| } | |
| } | |
| if ( $self->{incr_mode} == INCR_M_JSON ) { | |
| if ( $s eq '[' or $s eq '{' ) { | |
| if ( ++$self->{incr_nest} > $coder->get_max_depth ) { | |
| Carp::croak('json text or perl structure exceeds maximum nesting level (max_depth set too low?)'); | |
| } | |
| } | |
| elsif ( $s eq ']' or $s eq '}' ) { | |
| last if ( --$self->{incr_nest} <= 0 ); | |
| } | |
| elsif ( $s eq '#' ) { | |
| while ( $len > $p ) { | |
| last if substr( $text, $p++, 1 ) eq "\n"; | |
| } | |
| } | |
| } | |
| } | |
| $self->{incr_p} = $p; | |
| return if ( $self->{incr_mode} == INCR_M_STR and not $self->{incr_nest} ); | |
| return if ( $self->{incr_mode} == INCR_M_JSON and $self->{incr_nest} > 0 ); | |
| return '' unless ( length substr( $self->{incr_text}, 0, $p ) ); | |
| local $Carp::CarpLevel = 2; | |
| $self->{incr_p} = $restore; | |
| $self->{incr_c} = $p; | |
| my ( $obj, $tail ) = $coder->PP_decode_json( substr( $self->{incr_text}, 0, $p ), 0x10000001 ); | |
| $self->{incr_text} = substr( $self->{incr_text}, $p ); | |
| $self->{incr_p} = 0; | |
| return $obj || ''; | |
| } | |
| sub incr_text { | |
| if ( $_[0]->{incr_parsing} ) { | |
| Carp::croak("incr_text can not be called when the incremental parser already started parsing"); | |
| } | |
| $_[0]->{incr_text}; | |
| } | |
| sub incr_skip { | |
| my $self = shift; | |
| $self->{incr_text} = substr( $self->{incr_text}, $self->{incr_c} ); | |
| $self->{incr_p} = 0; | |
| } | |
| sub incr_reset { | |
| my $self = shift; | |
| $self->{incr_text} = undef; | |
| $self->{incr_p} = 0; | |
| $self->{incr_mode} = 0; | |
| $self->{incr_nest} = 0; | |
| $self->{incr_parsing} = 0; | |
| } | |
| ############################### | |
| 1; | |
| __END__ | |
| =pod | |
| =head1 NAME | |
| JSON::PP - JSON::XS compatible pure-Perl module. | |
| =head1 SYNOPSIS | |
| use JSON::PP; | |
| # exported functions, they croak on error | |
| # and expect/generate UTF-8 | |
| $utf8_encoded_json_text = encode_json $perl_hash_or_arrayref; | |
| $perl_hash_or_arrayref = decode_json $utf8_encoded_json_text; | |
| # OO-interface | |
| $coder = JSON::PP->new->ascii->pretty->allow_nonref; | |
| $json_text = $json->encode( $perl_scalar ); | |
| $perl_scalar = $json->decode( $json_text ); | |
| $pretty_printed = $json->pretty->encode( $perl_scalar ); # pretty-printing | |
| # Note that JSON version 2.0 and above will automatically use | |
| # JSON::XS or JSON::PP, so you should be able to just: | |
| use JSON; | |
| =head1 VERSION | |
| 2.27200 | |
| L<JSON::XS> 2.27 (~2.30) compatible. | |
| =head1 DESCRIPTION | |
| This module is L<JSON::XS> compatible pure Perl module. | |
| (Perl 5.8 or later is recommended) | |
| JSON::XS is the fastest and most proper JSON module on CPAN. | |
| It is written by Marc Lehmann in C, so must be compiled and | |
| installed in the used environment. | |
| JSON::PP is a pure-Perl module and has compatibility to JSON::XS. | |
| =head2 FEATURES | |
| =over | |
| =item * correct unicode handling | |
| This module knows how to handle Unicode (depending on Perl version). | |
| See to L<JSON::XS/A FEW NOTES ON UNICODE AND PERL> and | |
| L<UNICODE HANDLING ON PERLS>. | |
| =item * round-trip integrity | |
| When you serialise a perl data structure using only data types | |
| supported by JSON and Perl, the deserialised data structure is | |
| identical on the Perl level. (e.g. the string "2.0" doesn't suddenly | |
| become "2" just because it looks like a number). There I<are> minor | |
| exceptions to this, read the MAPPING section below to learn about | |
| those. | |
| =item * strict checking of JSON correctness | |
| There is no guessing, no generating of illegal JSON texts by default, | |
| and only JSON is accepted as input by default (the latter is a | |
| security feature). But when some options are set, loose checking | |
| features are available. | |
| =back | |
| =head1 FUNCTIONAL INTERFACE | |
| Some documents are copied and modified from L<JSON::XS/FUNCTIONAL INTERFACE>. | |
| =head2 encode_json | |
| $json_text = encode_json $perl_scalar | |
| Converts the given Perl data structure to a UTF-8 encoded, binary string. | |
| This function call is functionally identical to: | |
| $json_text = JSON::PP->new->utf8->encode($perl_scalar) | |
| =head2 decode_json | |
| $perl_scalar = decode_json $json_text | |
| The opposite of C<encode_json>: expects an UTF-8 (binary) string and tries | |
| to parse that as an UTF-8 encoded JSON text, returning the resulting | |
| reference. | |
| This function call is functionally identical to: | |
| $perl_scalar = JSON::PP->new->utf8->decode($json_text) | |
| =head2 JSON::PP::is_bool | |
| $is_boolean = JSON::PP::is_bool($scalar) | |
| Returns true if the passed scalar represents either JSON::PP::true or | |
| JSON::PP::false, two constants that act like C<1> and C<0> respectively | |
| and are also used to represent JSON C<true> and C<false> in Perl strings. | |
| =head2 JSON::PP::true | |
| Returns JSON true value which is blessed object. | |
| It C<isa> JSON::PP::Boolean object. | |
| =head2 JSON::PP::false | |
| Returns JSON false value which is blessed object. | |
| It C<isa> JSON::PP::Boolean object. | |
| =head2 JSON::PP::null | |
| Returns C<undef>. | |
| See L<MAPPING>, below, for more information on how JSON values are mapped to | |
| Perl. | |
| =head1 HOW DO I DECODE A DATA FROM OUTER AND ENCODE TO OUTER | |
| This section supposes that your perl version is 5.8 or later. | |
| If you know a JSON text from an outer world - a network, a file content, and so on, | |
| is encoded in UTF-8, you should use C<decode_json> or C<JSON> module object | |
| with C<utf8> enable. And the decoded result will contain UNICODE characters. | |
| # from network | |
| my $json = JSON::PP->new->utf8; | |
| my $json_text = CGI->new->param( 'json_data' ); | |
| my $perl_scalar = $json->decode( $json_text ); | |
| # from file content | |
| local $/; | |
| open( my $fh, '<', 'json.data' ); | |
| $json_text = <$fh>; | |
| $perl_scalar = decode_json( $json_text ); | |
| If an outer data is not encoded in UTF-8, firstly you should C<decode> it. | |
| use Encode; | |
| local $/; | |
| open( my $fh, '<', 'json.data' ); | |
| my $encoding = 'cp932'; | |
| my $unicode_json_text = decode( $encoding, <$fh> ); # UNICODE | |
| # or you can write the below code. | |
| # | |
| # open( my $fh, "<:encoding($encoding)", 'json.data' ); | |
| # $unicode_json_text = <$fh>; | |
| In this case, C<$unicode_json_text> is of course UNICODE string. | |
| So you B<cannot> use C<decode_json> nor C<JSON> module object with C<utf8> enable. | |
| Instead of them, you use C<JSON> module object with C<utf8> disable. | |
| $perl_scalar = $json->utf8(0)->decode( $unicode_json_text ); | |
| Or C<encode 'utf8'> and C<decode_json>: | |
| $perl_scalar = decode_json( encode( 'utf8', $unicode_json_text ) ); | |
| # this way is not efficient. | |
| And now, you want to convert your C<$perl_scalar> into JSON data and | |
| send it to an outer world - a network or a file content, and so on. | |
| Your data usually contains UNICODE strings and you want the converted data to be encoded | |
| in UTF-8, you should use C<encode_json> or C<JSON> module object with C<utf8> enable. | |
| print encode_json( $perl_scalar ); # to a network? file? or display? | |
| # or | |
| print $json->utf8->encode( $perl_scalar ); | |
| If C<$perl_scalar> does not contain UNICODE but C<$encoding>-encoded strings | |
| for some reason, then its characters are regarded as B<latin1> for perl | |
| (because it does not concern with your $encoding). | |
| You B<cannot> use C<encode_json> nor C<JSON> module object with C<utf8> enable. | |
| Instead of them, you use C<JSON> module object with C<utf8> disable. | |
| Note that the resulted text is a UNICODE string but no problem to print it. | |
| # $perl_scalar contains $encoding encoded string values | |
| $unicode_json_text = $json->utf8(0)->encode( $perl_scalar ); | |
| # $unicode_json_text consists of characters less than 0x100 | |
| print $unicode_json_text; | |
| Or C<decode $encoding> all string values and C<encode_json>: | |
| $perl_scalar->{ foo } = decode( $encoding, $perl_scalar->{ foo } ); | |
| # ... do it to each string values, then encode_json | |
| $json_text = encode_json( $perl_scalar ); | |
| This method is a proper way but probably not efficient. | |
| See to L<Encode>, L<perluniintro>. | |
| =head1 METHODS | |
| Basically, check to L<JSON> or L<JSON::XS>. | |
| =head2 new | |
| $json = JSON::PP->new | |
| Returns a new JSON::PP object that can be used to de/encode JSON | |
| strings. | |
| All boolean flags described below are by default I<disabled>. | |
| The mutators for flags all return the JSON object again and thus calls can | |
| be chained: | |
| my $json = JSON::PP->new->utf8->space_after->encode({a => [1,2]}) | |
| => {"a": [1, 2]} | |
| =head2 ascii | |
| $json = $json->ascii([$enable]) | |
| $enabled = $json->get_ascii | |
| If $enable is true (or missing), then the encode method will not generate characters outside | |
| the code range 0..127. Any Unicode characters outside that range will be escaped using either | |
| a single \uXXXX or a double \uHHHH\uLLLLL escape sequence, as per RFC4627. | |
| (See to L<JSON::XS/OBJECT-ORIENTED INTERFACE>). | |
| In Perl 5.005, there is no character having high value (more than 255). | |
| See to L<UNICODE HANDLING ON PERLS>. | |
| If $enable is false, then the encode method will not escape Unicode characters unless | |
| required by the JSON syntax or other flags. This results in a faster and more compact format. | |
| JSON::PP->new->ascii(1)->encode([chr 0x10401]) | |
| => ["\ud801\udc01"] | |
| =head2 latin1 | |
| $json = $json->latin1([$enable]) | |
| $enabled = $json->get_latin1 | |
| If $enable is true (or missing), then the encode method will encode the resulting JSON | |
| text as latin1 (or iso-8859-1), escaping any characters outside the code range 0..255. | |
| If $enable is false, then the encode method will not escape Unicode characters | |
| unless required by the JSON syntax or other flags. | |
| JSON::XS->new->latin1->encode (["\x{89}\x{abc}"] | |
| => ["\x{89}\\u0abc"] # (perl syntax, U+abc escaped, U+89 not) | |
| See to L<UNICODE HANDLING ON PERLS>. | |
| =head2 utf8 | |
| $json = $json->utf8([$enable]) | |
| $enabled = $json->get_utf8 | |
| If $enable is true (or missing), then the encode method will encode the JSON result | |
| into UTF-8, as required by many protocols, while the decode method expects to be handled | |
| an UTF-8-encoded string. Please note that UTF-8-encoded strings do not contain any | |
| characters outside the range 0..255, they are thus useful for bytewise/binary I/O. | |
| (In Perl 5.005, any character outside the range 0..255 does not exist. | |
| See to L<UNICODE HANDLING ON PERLS>.) | |
| In future versions, enabling this option might enable autodetection of the UTF-16 and UTF-32 | |
| encoding families, as described in RFC4627. | |
| If $enable is false, then the encode method will return the JSON string as a (non-encoded) | |
| Unicode string, while decode expects thus a Unicode string. Any decoding or encoding | |
| (e.g. to UTF-8 or UTF-16) needs to be done yourself, e.g. using the Encode module. | |
| Example, output UTF-16BE-encoded JSON: | |
| use Encode; | |
| $jsontext = encode "UTF-16BE", JSON::PP->new->encode ($object); | |
| Example, decode UTF-32LE-encoded JSON: | |
| use Encode; | |
| $object = JSON::PP->new->decode (decode "UTF-32LE", $jsontext); | |
| =head2 pretty | |
| $json = $json->pretty([$enable]) | |
| This enables (or disables) all of the C<indent>, C<space_before> and | |
| C<space_after> flags in one call to generate the most readable | |
| (or most compact) form possible. | |
| Equivalent to: | |
| $json->indent->space_before->space_after | |
| =head2 indent | |
| $json = $json->indent([$enable]) | |
| $enabled = $json->get_indent | |
| The default indent space length is three. | |
| You can use C<indent_length> to change the length. | |
| =head2 space_before | |
| $json = $json->space_before([$enable]) | |
| $enabled = $json->get_space_before | |
| If C<$enable> is true (or missing), then the C<encode> method will add an extra | |
| optional space before the C<:> separating keys from values in JSON objects. | |
| If C<$enable> is false, then the C<encode> method will not add any extra | |
| space at those places. | |
| This setting has no effect when decoding JSON texts. | |
| Example, space_before enabled, space_after and indent disabled: | |
| {"key" :"value"} | |
| =head2 space_after | |
| $json = $json->space_after([$enable]) | |
| $enabled = $json->get_space_after | |
| If C<$enable> is true (or missing), then the C<encode> method will add an extra | |
| optional space after the C<:> separating keys from values in JSON objects | |
| and extra whitespace after the C<,> separating key-value pairs and array | |
| members. | |
| If C<$enable> is false, then the C<encode> method will not add any extra | |
| space at those places. | |
| This setting has no effect when decoding JSON texts. | |
| Example, space_before and indent disabled, space_after enabled: | |
| {"key": "value"} | |
| =head2 relaxed | |
| $json = $json->relaxed([$enable]) | |
| $enabled = $json->get_relaxed | |
| If C<$enable> is true (or missing), then C<decode> will accept some | |
| extensions to normal JSON syntax (see below). C<encode> will not be | |
| affected in anyway. I<Be aware that this option makes you accept invalid | |
| JSON texts as if they were valid!>. I suggest only to use this option to | |
| parse application-specific files written by humans (configuration files, | |
| resource files etc.) | |
| If C<$enable> is false (the default), then C<decode> will only accept | |
| valid JSON texts. | |
| Currently accepted extensions are: | |
| =over 4 | |
| =item * list items can have an end-comma | |
| JSON I<separates> array elements and key-value pairs with commas. This | |
| can be annoying if you write JSON texts manually and want to be able to | |
| quickly append elements, so this extension accepts comma at the end of | |
| such items not just between them: | |
| [ | |
| 1, | |
| 2, <- this comma not normally allowed | |
| ] | |
| { | |
| "k1": "v1", | |
| "k2": "v2", <- this comma not normally allowed | |
| } | |
| =item * shell-style '#'-comments | |
| Whenever JSON allows whitespace, shell-style comments are additionally | |
| allowed. They are terminated by the first carriage-return or line-feed | |
| character, after which more white-space and comments are allowed. | |
| [ | |
| 1, # this comment not allowed in JSON | |
| # neither this one... | |
| ] | |
| =back | |
| =head2 canonical | |
| $json = $json->canonical([$enable]) | |
| $enabled = $json->get_canonical | |
| If C<$enable> is true (or missing), then the C<encode> method will output JSON objects | |
| by sorting their keys. This is adding a comparatively high overhead. | |
| If C<$enable> is false, then the C<encode> method will output key-value | |
| pairs in the order Perl stores them (which will likely change between runs | |
| of the same script). | |
| This option is useful if you want the same data structure to be encoded as | |
| the same JSON text (given the same overall settings). If it is disabled, | |
| the same hash might be encoded differently even if contains the same data, | |
| as key-value pairs have no inherent ordering in Perl. | |
| This setting has no effect when decoding JSON texts. | |
| If you want your own sorting routine, you can give a code reference | |
| or a subroutine name to C<sort_by>. See to C<JSON::PP OWN METHODS>. | |
| =head2 allow_nonref | |
| $json = $json->allow_nonref([$enable]) | |
| $enabled = $json->get_allow_nonref | |
| If C<$enable> is true (or missing), then the C<encode> method can convert a | |
| non-reference into its corresponding string, number or null JSON value, | |
| which is an extension to RFC4627. Likewise, C<decode> will accept those JSON | |
| values instead of croaking. | |
| If C<$enable> is false, then the C<encode> method will croak if it isn't | |
| passed an arrayref or hashref, as JSON texts must either be an object | |
| or array. Likewise, C<decode> will croak if given something that is not a | |
| JSON object or array. | |
| JSON::PP->new->allow_nonref->encode ("Hello, World!") | |
| => "Hello, World!" | |
| =head2 allow_unknown | |
| $json = $json->allow_unknown ([$enable]) | |
| $enabled = $json->get_allow_unknown | |
| If $enable is true (or missing), then "encode" will *not* throw an | |
| exception when it encounters values it cannot represent in JSON (for | |
| example, filehandles) but instead will encode a JSON "null" value. | |
| Note that blessed objects are not included here and are handled | |
| separately by c<allow_nonref>. | |
| If $enable is false (the default), then "encode" will throw an | |
| exception when it encounters anything it cannot encode as JSON. | |
| This option does not affect "decode" in any way, and it is | |
| recommended to leave it off unless you know your communications | |
| partner. | |
| =head2 allow_blessed | |
| $json = $json->allow_blessed([$enable]) | |
| $enabled = $json->get_allow_blessed | |
| If C<$enable> is true (or missing), then the C<encode> method will not | |
| barf when it encounters a blessed reference. Instead, the value of the | |
| B<convert_blessed> option will decide whether C<null> (C<convert_blessed> | |
| disabled or no C<TO_JSON> method found) or a representation of the | |
| object (C<convert_blessed> enabled and C<TO_JSON> method found) is being | |
| encoded. Has no effect on C<decode>. | |
| If C<$enable> is false (the default), then C<encode> will throw an | |
| exception when it encounters a blessed object. | |
| =head2 convert_blessed | |
| $json = $json->convert_blessed([$enable]) | |
| $enabled = $json->get_convert_blessed | |
| If C<$enable> is true (or missing), then C<encode>, upon encountering a | |
| blessed object, will check for the availability of the C<TO_JSON> method | |
| on the object's class. If found, it will be called in scalar context | |
| and the resulting scalar will be encoded instead of the object. If no | |
| C<TO_JSON> method is found, the value of C<allow_blessed> will decide what | |
| to do. | |
| The C<TO_JSON> method may safely call die if it wants. If C<TO_JSON> | |
| returns other blessed objects, those will be handled in the same | |
| way. C<TO_JSON> must take care of not causing an endless recursion cycle | |
| (== crash) in this case. The name of C<TO_JSON> was chosen because other | |
| methods called by the Perl core (== not by the user of the object) are | |
| usually in upper case letters and to avoid collisions with the C<to_json> | |
| function or method. | |
| This setting does not yet influence C<decode> in any way. | |
| If C<$enable> is false, then the C<allow_blessed> setting will decide what | |
| to do when a blessed object is found. | |
| =head2 filter_json_object | |
| $json = $json->filter_json_object([$coderef]) | |
| When C<$coderef> is specified, it will be called from C<decode> each | |
| time it decodes a JSON object. The only argument passed to the coderef | |
| is a reference to the newly-created hash. If the code references returns | |
| a single scalar (which need not be a reference), this value | |
| (i.e. a copy of that scalar to avoid aliasing) is inserted into the | |
| deserialised data structure. If it returns an empty list | |
| (NOTE: I<not> C<undef>, which is a valid scalar), the original deserialised | |
| hash will be inserted. This setting can slow down decoding considerably. | |
| When C<$coderef> is omitted or undefined, any existing callback will | |
| be removed and C<decode> will not change the deserialised hash in any | |
| way. | |
| Example, convert all JSON objects into the integer 5: | |
| my $js = JSON::PP->new->filter_json_object (sub { 5 }); | |
| # returns [5] | |
| $js->decode ('[{}]'); # the given subroutine takes a hash reference. | |
| # throw an exception because allow_nonref is not enabled | |
| # so a lone 5 is not allowed. | |
| $js->decode ('{"a":1, "b":2}'); | |
| =head2 filter_json_single_key_object | |
| $json = $json->filter_json_single_key_object($key [=> $coderef]) | |
| Works remotely similar to C<filter_json_object>, but is only called for | |
| JSON objects having a single key named C<$key>. | |
| This C<$coderef> is called before the one specified via | |
| C<filter_json_object>, if any. It gets passed the single value in the JSON | |
| object. If it returns a single value, it will be inserted into the data | |
| structure. If it returns nothing (not even C<undef> but the empty list), | |
| the callback from C<filter_json_object> will be called next, as if no | |
| single-key callback were specified. | |
| If C<$coderef> is omitted or undefined, the corresponding callback will be | |
| disabled. There can only ever be one callback for a given key. | |
| As this callback gets called less often then the C<filter_json_object> | |
| one, decoding speed will not usually suffer as much. Therefore, single-key | |
| objects make excellent targets to serialise Perl objects into, especially | |
| as single-key JSON objects are as close to the type-tagged value concept | |
| as JSON gets (it's basically an ID/VALUE tuple). Of course, JSON does not | |
| support this in any way, so you need to make sure your data never looks | |
| like a serialised Perl hash. | |
| Typical names for the single object key are C<__class_whatever__>, or | |
| C<$__dollars_are_rarely_used__$> or C<}ugly_brace_placement>, or even | |
| things like C<__class_md5sum(classname)__>, to reduce the risk of clashing | |
| with real hashes. | |
| Example, decode JSON objects of the form C<< { "__widget__" => <id> } >> | |
| into the corresponding C<< $WIDGET{<id>} >> object: | |
| # return whatever is in $WIDGET{5}: | |
| JSON::PP | |
| ->new | |
| ->filter_json_single_key_object (__widget__ => sub { | |
| $WIDGET{ $_[0] } | |
| }) | |
| ->decode ('{"__widget__": 5') | |
| # this can be used with a TO_JSON method in some "widget" class | |
| # for serialisation to json: | |
| sub WidgetBase::TO_JSON { | |
| my ($self) = @_; | |
| unless ($self->{id}) { | |
| $self->{id} = ..get..some..id..; | |
| $WIDGET{$self->{id}} = $self; | |
| } | |
| { __widget__ => $self->{id} } | |
| } | |
| =head2 shrink | |
| $json = $json->shrink([$enable]) | |
| $enabled = $json->get_shrink | |
| In JSON::XS, this flag resizes strings generated by either | |
| C<encode> or C<decode> to their minimum size possible. | |
| It will also try to downgrade any strings to octet-form if possible. | |
| In JSON::PP, it is noop about resizing strings but tries | |
| C<utf8::downgrade> to the returned string by C<encode>. | |
| See to L<utf8>. | |
| See to L<JSON::XS/OBJECT-ORIENTED INTERFACE> | |
| =head2 max_depth | |
| $json = $json->max_depth([$maximum_nesting_depth]) | |
| $max_depth = $json->get_max_depth | |
| Sets the maximum nesting level (default C<512>) accepted while encoding | |
| or decoding. If a higher nesting level is detected in JSON text or a Perl | |
| data structure, then the encoder and decoder will stop and croak at that | |
| point. | |
| Nesting level is defined by number of hash- or arrayrefs that the encoder | |
| needs to traverse to reach a given point or the number of C<{> or C<[> | |
| characters without their matching closing parenthesis crossed to reach a | |
| given character in a string. | |
| If no argument is given, the highest possible setting will be used, which | |
| is rarely useful. | |
| See L<JSON::XS/SSECURITY CONSIDERATIONS> for more info on why this is useful. | |
| When a large value (100 or more) was set and it de/encodes a deep nested object/text, | |
| it may raise a warning 'Deep recursion on subroutine' at the perl runtime phase. | |
| =head2 max_size | |
| $json = $json->max_size([$maximum_string_size]) | |
| $max_size = $json->get_max_size | |
| Set the maximum length a JSON text may have (in bytes) where decoding is | |
| being attempted. The default is C<0>, meaning no limit. When C<decode> | |
| is called on a string that is longer then this many bytes, it will not | |
| attempt to decode the string but throw an exception. This setting has no | |
| effect on C<encode> (yet). | |
| If no argument is given, the limit check will be deactivated (same as when | |
| C<0> is specified). | |
| See L<JSON::XS/SECURITY CONSIDERATIONS> for more info on why this is useful. | |
| =head2 encode | |
| $json_text = $json->encode($perl_scalar) | |
| Converts the given Perl data structure (a simple scalar or a reference | |
| to a hash or array) to its JSON representation. Simple scalars will be | |
| converted into JSON string or number sequences, while references to arrays | |
| become JSON arrays and references to hashes become JSON objects. Undefined | |
| Perl values (e.g. C<undef>) become JSON C<null> values. | |
| References to the integers C<0> and C<1> are converted into C<true> and C<false>. | |
| =head2 decode | |
| $perl_scalar = $json->decode($json_text) | |
| The opposite of C<encode>: expects a JSON text and tries to parse it, | |
| returning the resulting simple scalar or reference. Croaks on error. | |
| JSON numbers and strings become simple Perl scalars. JSON arrays become | |
| Perl arrayrefs and JSON objects become Perl hashrefs. C<true> becomes | |
| C<1> (C<JSON::true>), C<false> becomes C<0> (C<JSON::false>) and | |
| C<null> becomes C<undef>. | |
| =head2 decode_prefix | |
| ($perl_scalar, $characters) = $json->decode_prefix($json_text) | |
| This works like the C<decode> method, but instead of raising an exception | |
| when there is trailing garbage after the first JSON object, it will | |
| silently stop parsing there and return the number of characters consumed | |
| so far. | |
| JSON->new->decode_prefix ("[1] the tail") | |
| => ([], 3) | |
| =head1 INCREMENTAL PARSING | |
| Most of this section are copied and modified from L<JSON::XS/INCREMENTAL PARSING>. | |
| In some cases, there is the need for incremental parsing of JSON texts. | |
| This module does allow you to parse a JSON stream incrementally. | |
| It does so by accumulating text until it has a full JSON object, which | |
| it then can decode. This process is similar to using C<decode_prefix> | |
| to see if a full JSON object is available, but is much more efficient | |
| (and can be implemented with a minimum of method calls). | |
| This module will only attempt to parse the JSON text once it is sure it | |
| has enough text to get a decisive result, using a very simple but | |
| truly incremental parser. This means that it sometimes won't stop as | |
| early as the full parser, for example, it doesn't detect parenthesis | |
| mismatches. The only thing it guarantees is that it starts decoding as | |
| soon as a syntactically valid JSON text has been seen. This means you need | |
| to set resource limits (e.g. C<max_size>) to ensure the parser will stop | |
| parsing in the presence if syntax errors. | |
| The following methods implement this incremental parser. | |
| =head2 incr_parse | |
| $json->incr_parse( [$string] ) # void context | |
| $obj_or_undef = $json->incr_parse( [$string] ) # scalar context | |
| @obj_or_empty = $json->incr_parse( [$string] ) # list context | |
| This is the central parsing function. It can both append new text and | |
| extract objects from the stream accumulated so far (both of these | |
| functions are optional). | |
| If C<$string> is given, then this string is appended to the already | |
| existing JSON fragment stored in the C<$json> object. | |
| After that, if the function is called in void context, it will simply | |
| return without doing anything further. This can be used to add more text | |
| in as many chunks as you want. | |
| If the method is called in scalar context, then it will try to extract | |
| exactly I<one> JSON object. If that is successful, it will return this | |
| object, otherwise it will return C<undef>. If there is a parse error, | |
| this method will croak just as C<decode> would do (one can then use | |
| C<incr_skip> to skip the erroneous part). This is the most common way of | |
| using the method. | |
| And finally, in list context, it will try to extract as many objects | |
| from the stream as it can find and return them, or the empty list | |
| otherwise. For this to work, there must be no separators between the JSON | |
| objects or arrays, instead they must be concatenated back-to-back. If | |
| an error occurs, an exception will be raised as in the scalar context | |
| case. Note that in this case, any previously-parsed JSON texts will be | |
| lost. | |
| Example: Parse some JSON arrays/objects in a given string and return them. | |
| my @objs = JSON->new->incr_parse ("[5][7][1,2]"); | |
| =head2 incr_text | |
| $lvalue_string = $json->incr_text | |
| This method returns the currently stored JSON fragment as an lvalue, that | |
| is, you can manipulate it. This I<only> works when a preceding call to | |
| C<incr_parse> in I<scalar context> successfully returned an object. Under | |
| all other circumstances you must not call this function (I mean it. | |
| although in simple tests it might actually work, it I<will> fail under | |
| real world conditions). As a special exception, you can also call this | |
| method before having parsed anything. | |
| This function is useful in two cases: a) finding the trailing text after a | |
| JSON object or b) parsing multiple JSON objects separated by non-JSON text | |
| (such as commas). | |
| $json->incr_text =~ s/\s*,\s*//; | |
| In Perl 5.005, C<lvalue> attribute is not available. | |
| You must write codes like the below: | |
| $string = $json->incr_text; | |
| $string =~ s/\s*,\s*//; | |
| $json->incr_text( $string ); | |
| =head2 incr_skip | |
| $json->incr_skip | |
| This will reset the state of the incremental parser and will remove the | |
| parsed text from the input buffer. This is useful after C<incr_parse> | |
| died, in which case the input buffer and incremental parser state is left | |
| unchanged, to skip the text parsed so far and to reset the parse state. | |
| =head2 incr_reset | |
| $json->incr_reset | |
| This completely resets the incremental parser, that is, after this call, | |
| it will be as if the parser had never parsed anything. | |
| This is useful if you want to repeatedly parse JSON objects and want to | |
| ignore any trailing data, which means you have to reset the parser after | |
| each successful decode. | |
| See to L<JSON::XS/INCREMENTAL PARSING> for examples. | |
| =head1 JSON::PP OWN METHODS | |
| =head2 allow_singlequote | |
| $json = $json->allow_singlequote([$enable]) | |
| If C<$enable> is true (or missing), then C<decode> will accept | |
| JSON strings quoted by single quotations that are invalid JSON | |
| format. | |
| $json->allow_singlequote->decode({"foo":'bar'}); | |
| $json->allow_singlequote->decode({'foo':"bar"}); | |
| $json->allow_singlequote->decode({'foo':'bar'}); | |
| As same as the C<relaxed> option, this option may be used to parse | |
| application-specific files written by humans. | |
| =head2 allow_barekey | |
| $json = $json->allow_barekey([$enable]) | |
| If C<$enable> is true (or missing), then C<decode> will accept | |
| bare keys of JSON object that are invalid JSON format. | |
| As same as the C<relaxed> option, this option may be used to parse | |
| application-specific files written by humans. | |
| $json->allow_barekey->decode('{foo:"bar"}'); | |
| =head2 allow_bignum | |
| $json = $json->allow_bignum([$enable]) | |
| If C<$enable> is true (or missing), then C<decode> will convert | |
| the big integer Perl cannot handle as integer into a L<Math::BigInt> | |
| object and convert a floating number (any) into a L<Math::BigFloat>. | |
| On the contrary, C<encode> converts C<Math::BigInt> objects and C<Math::BigFloat> | |
| objects into JSON numbers with C<allow_blessed> enable. | |
| $json->allow_nonref->allow_blessed->allow_bignum; | |
| $bigfloat = $json->decode('2.000000000000000000000000001'); | |
| print $json->encode($bigfloat); | |
| # => 2.000000000000000000000000001 | |
| See to L<JSON::XS/MAPPING> about the normal conversion of JSON number. | |
| =head2 loose | |
| $json = $json->loose([$enable]) | |
| The unescaped [\x00-\x1f\x22\x2f\x5c] strings are invalid in JSON strings | |
| and the module doesn't allow to C<decode> to these (except for \x2f). | |
| If C<$enable> is true (or missing), then C<decode> will accept these | |
| unescaped strings. | |
| $json->loose->decode(qq|["abc | |
| def"]|); | |
| See L<JSON::XS/SSECURITY CONSIDERATIONS>. | |
| =head2 escape_slash | |
| $json = $json->escape_slash([$enable]) | |
| According to JSON Grammar, I<slash> (U+002F) is escaped. But default | |
| JSON::PP (as same as JSON::XS) encodes strings without escaping slash. | |
| If C<$enable> is true (or missing), then C<encode> will escape slashes. | |
| =head2 indent_length | |
| $json = $json->indent_length($length) | |
| JSON::XS indent space length is 3 and cannot be changed. | |
| JSON::PP set the indent space length with the given $length. | |
| The default is 3. The acceptable range is 0 to 15. | |
| =head2 sort_by | |
| $json = $json->sort_by($function_name) | |
| $json = $json->sort_by($subroutine_ref) | |
| If $function_name or $subroutine_ref are set, its sort routine are used | |
| in encoding JSON objects. | |
| $js = $pc->sort_by(sub { $JSON::PP::a cmp $JSON::PP::b })->encode($obj); | |
| # is($js, q|{"a":1,"b":2,"c":3,"d":4,"e":5,"f":6,"g":7,"h":8,"i":9}|); | |
| $js = $pc->sort_by('own_sort')->encode($obj); | |
| # is($js, q|{"a":1,"b":2,"c":3,"d":4,"e":5,"f":6,"g":7,"h":8,"i":9}|); | |
| sub JSON::PP::own_sort { $JSON::PP::a cmp $JSON::PP::b } | |
| As the sorting routine runs in the JSON::PP scope, the given | |
| subroutine name and the special variables C<$a>, C<$b> will begin | |
| 'JSON::PP::'. | |
| If $integer is set, then the effect is same as C<canonical> on. | |
| =head1 INTERNAL | |
| For developers. | |
| =over | |
| =item PP_encode_box | |
| Returns | |
| { | |
| depth => $depth, | |
| indent_count => $indent_count, | |
| } | |
| =item PP_decode_box | |
| Returns | |
| { | |
| text => $text, | |
| at => $at, | |
| ch => $ch, | |
| len => $len, | |
| depth => $depth, | |
| encoding => $encoding, | |
| is_valid_utf8 => $is_valid_utf8, | |
| }; | |
| =back | |
| =head1 MAPPING | |
| This section is copied from JSON::XS and modified to C<JSON::PP>. | |
| JSON::XS and JSON::PP mapping mechanisms are almost equivalent. | |
| See to L<JSON::XS/MAPPING>. | |
| =head2 JSON -> PERL | |
| =over 4 | |
| =item object | |
| A JSON object becomes a reference to a hash in Perl. No ordering of object | |
| keys is preserved (JSON does not preserver object key ordering itself). | |
| =item array | |
| A JSON array becomes a reference to an array in Perl. | |
| =item string | |
| A JSON string becomes a string scalar in Perl - Unicode codepoints in JSON | |
| are represented by the same codepoints in the Perl string, so no manual | |
| decoding is necessary. | |
| =item number | |
| A JSON number becomes either an integer, numeric (floating point) or | |
| string scalar in perl, depending on its range and any fractional parts. On | |
| the Perl level, there is no difference between those as Perl handles all | |
| the conversion details, but an integer may take slightly less memory and | |
| might represent more values exactly than floating point numbers. | |
| If the number consists of digits only, C<JSON> will try to represent | |
| it as an integer value. If that fails, it will try to represent it as | |
| a numeric (floating point) value if that is possible without loss of | |
| precision. Otherwise it will preserve the number as a string value (in | |
| which case you lose roundtripping ability, as the JSON number will be | |
| re-encoded to a JSON string). | |
| Numbers containing a fractional or exponential part will always be | |
| represented as numeric (floating point) values, possibly at a loss of | |
| precision (in which case you might lose perfect roundtripping ability, but | |
| the JSON number will still be re-encoded as a JSON number). | |
| Note that precision is not accuracy - binary floating point values cannot | |
| represent most decimal fractions exactly, and when converting from and to | |
| floating point, C<JSON> only guarantees precision up to but not including | |
| the least significant bit. | |
| When C<allow_bignum> is enable, the big integers | |
| and the numeric can be optionally converted into L<Math::BigInt> and | |
| L<Math::BigFloat> objects. | |
| =item true, false | |
| These JSON atoms become C<JSON::PP::true> and C<JSON::PP::false>, | |
| respectively. They are overloaded to act almost exactly like the numbers | |
| C<1> and C<0>. You can check whether a scalar is a JSON boolean by using | |
| the C<JSON::is_bool> function. | |
| print JSON::PP::true . "\n"; | |
| => true | |
| print JSON::PP::true + 1; | |
| => 1 | |
| ok(JSON::true eq '1'); | |
| ok(JSON::true == 1); | |
| C<JSON> will install these missing overloading features to the backend modules. | |
| =item null | |
| A JSON null atom becomes C<undef> in Perl. | |
| C<JSON::PP::null> returns C<undef>. | |
| =back | |
| =head2 PERL -> JSON | |
| The mapping from Perl to JSON is slightly more difficult, as Perl is a | |
| truly typeless language, so we can only guess which JSON type is meant by | |
| a Perl value. | |
| =over 4 | |
| =item hash references | |
| Perl hash references become JSON objects. As there is no inherent ordering | |
| in hash keys (or JSON objects), they will usually be encoded in a | |
| pseudo-random order that can change between runs of the same program but | |
| stays generally the same within a single run of a program. C<JSON> | |
| optionally sort the hash keys (determined by the I<canonical> flag), so | |
| the same data structure will serialise to the same JSON text (given same | |
| settings and version of JSON::XS), but this incurs a runtime overhead | |
| and is only rarely useful, e.g. when you want to compare some JSON text | |
| against another for equality. | |
| =item array references | |
| Perl array references become JSON arrays. | |
| =item other references | |
| Other unblessed references are generally not allowed and will cause an | |
| exception to be thrown, except for references to the integers C<0> and | |
| C<1>, which get turned into C<false> and C<true> atoms in JSON. You can | |
| also use C<JSON::false> and C<JSON::true> to improve readability. | |
| to_json [\0,JSON::PP::true] # yields [false,true] | |
| =item JSON::PP::true, JSON::PP::false, JSON::PP::null | |
| These special values become JSON true and JSON false values, | |
| respectively. You can also use C<\1> and C<\0> directly if you want. | |
| JSON::PP::null returns C<undef>. | |
| =item blessed objects | |
| Blessed objects are not directly representable in JSON. See the | |
| C<allow_blessed> and C<convert_blessed> methods on various options on | |
| how to deal with this: basically, you can choose between throwing an | |
| exception, encoding the reference as if it weren't blessed, or provide | |
| your own serialiser method. | |
| See to L<convert_blessed>. | |
| =item simple scalars | |
| Simple Perl scalars (any scalar that is not a reference) are the most | |
| difficult objects to encode: JSON::XS and JSON::PP will encode undefined scalars as | |
| JSON C<null> values, scalars that have last been used in a string context | |
| before encoding as JSON strings, and anything else as number value: | |
| # dump as number | |
| encode_json [2] # yields [2] | |
| encode_json [-3.0e17] # yields [-3e+17] | |
| my $value = 5; encode_json [$value] # yields [5] | |
| # used as string, so dump as string | |
| print $value; | |
| encode_json [$value] # yields ["5"] | |
| # undef becomes null | |
| encode_json [undef] # yields [null] | |
| You can force the type to be a string by stringifying it: | |
| my $x = 3.1; # some variable containing a number | |
| "$x"; # stringified | |
| $x .= ""; # another, more awkward way to stringify | |
| print $x; # perl does it for you, too, quite often | |
| You can force the type to be a number by numifying it: | |
| my $x = "3"; # some variable containing a string | |
| $x += 0; # numify it, ensuring it will be dumped as a number | |
| $x *= 1; # same thing, the choice is yours. | |
| You can not currently force the type in other, less obscure, ways. | |
| Note that numerical precision has the same meaning as under Perl (so | |
| binary to decimal conversion follows the same rules as in Perl, which | |
| can differ to other languages). Also, your perl interpreter might expose | |
| extensions to the floating point numbers of your platform, such as | |
| infinities or NaN's - these cannot be represented in JSON, and it is an | |
| error to pass those in. | |
| =item Big Number | |
| When C<allow_bignum> is enable, | |
| C<encode> converts C<Math::BigInt> objects and C<Math::BigFloat> | |
| objects into JSON numbers. | |
| =back | |
| =head1 UNICODE HANDLING ON PERLS | |
| If you do not know about Unicode on Perl well, | |
| please check L<JSON::XS/A FEW NOTES ON UNICODE AND PERL>. | |
| =head2 Perl 5.8 and later | |
| Perl can handle Unicode and the JSON::PP de/encode methods also work properly. | |
| $json->allow_nonref->encode(chr hex 3042); | |
| $json->allow_nonref->encode(chr hex 12345); | |
| Returns C<"\u3042"> and C<"\ud808\udf45"> respectively. | |
| $json->allow_nonref->decode('"\u3042"'); | |
| $json->allow_nonref->decode('"\ud808\udf45"'); | |
| Returns UTF-8 encoded strings with UTF8 flag, regarded as C<U+3042> and C<U+12345>. | |
| Note that the versions from Perl 5.8.0 to 5.8.2, Perl built-in C<join> was broken, | |
| so JSON::PP wraps the C<join> with a subroutine. Thus JSON::PP works slow in the versions. | |
| =head2 Perl 5.6 | |
| Perl can handle Unicode and the JSON::PP de/encode methods also work. | |
| =head2 Perl 5.005 | |
| Perl 5.005 is a byte semantics world -- all strings are sequences of bytes. | |
| That means the unicode handling is not available. | |
| In encoding, | |
| $json->allow_nonref->encode(chr hex 3042); # hex 3042 is 12354. | |
| $json->allow_nonref->encode(chr hex 12345); # hex 12345 is 74565. | |
| Returns C<B> and C<E>, as C<chr> takes a value more than 255, it treats | |
| as C<$value % 256>, so the above codes are equivalent to : | |
| $json->allow_nonref->encode(chr 66); | |
| $json->allow_nonref->encode(chr 69); | |
| In decoding, | |
| $json->decode('"\u00e3\u0081\u0082"'); | |
| The returned is a byte sequence C<0xE3 0x81 0x82> for UTF-8 encoded | |
| japanese character (C<HIRAGANA LETTER A>). | |
| And if it is represented in Unicode code point, C<U+3042>. | |
| Next, | |
| $json->decode('"\u3042"'); | |
| We ordinary expect the returned value is a Unicode character C<U+3042>. | |
| But here is 5.005 world. This is C<0xE3 0x81 0x82>. | |
| $json->decode('"\ud808\udf45"'); | |
| This is not a character C<U+12345> but bytes - C<0xf0 0x92 0x8d 0x85>. | |
| =head1 TODO | |
| =over | |
| =item speed | |
| =item memory saving | |
| =back | |
| =head1 SEE ALSO | |
| Most of the document are copied and modified from JSON::XS doc. | |
| L<JSON::XS> | |
| RFC4627 (L<http://www.ietf.org/rfc/rfc4627.txt>) | |
| =head1 AUTHOR | |
| Makamaka Hannyaharamitu, E<lt>makamaka[at]cpan.orgE<gt> | |
| =head1 COPYRIGHT AND LICENSE | |
| Copyright 2007-2012 by Makamaka Hannyaharamitu | |
| This library is free software; you can redistribute it and/or modify | |
| it under the same terms as Perl itself. | |
| =cut | |