1package # This is JSON::backportPP
2    JSON::PP;
3
4# JSON-2.0
5
6use 5.005;
7use strict;
8use base qw(Exporter);
9use overload ();
10
11use Carp ();
12use B ();
13#use Devel::Peek;
14
15$JSON::PP::VERSION = '2.27200';
16
17@JSON::PP::EXPORT = qw(encode_json decode_json from_json to_json);
18
19# instead of hash-access, i tried index-access for speed.
20# but this method is not faster than what i expected. so it will be changed.
21
22use constant P_ASCII                => 0;
23use constant P_LATIN1               => 1;
24use constant P_UTF8                 => 2;
25use constant P_INDENT               => 3;
26use constant P_CANONICAL            => 4;
27use constant P_SPACE_BEFORE         => 5;
28use constant P_SPACE_AFTER          => 6;
29use constant P_ALLOW_NONREF         => 7;
30use constant P_SHRINK               => 8;
31use constant P_ALLOW_BLESSED        => 9;
32use constant P_CONVERT_BLESSED      => 10;
33use constant P_RELAXED              => 11;
34
35use constant P_LOOSE                => 12;
36use constant P_ALLOW_BIGNUM         => 13;
37use constant P_ALLOW_BAREKEY        => 14;
38use constant P_ALLOW_SINGLEQUOTE    => 15;
39use constant P_ESCAPE_SLASH         => 16;
40use constant P_AS_NONBLESSED        => 17;
41
42use constant P_ALLOW_UNKNOWN        => 18;
43
44use constant OLD_PERL => $] < 5.008 ? 1 : 0;
45
46BEGIN {
47    my @xs_compati_bit_properties = qw(
48            latin1 ascii utf8 indent canonical space_before space_after allow_nonref shrink
49            allow_blessed convert_blessed relaxed allow_unknown
50    );
51    my @pp_bit_properties = qw(
52            allow_singlequote allow_bignum loose
53            allow_barekey escape_slash as_nonblessed
54    );
55
56    # Perl version check, Unicode handling is enable?
57    # Helper module sets @JSON::PP::_properties.
58    if ($] < 5.008 ) {
59        my $helper = $] >= 5.006 ? 'JSON::backportPP::Compat5006' : 'JSON::backportPP::Compat5005';
60        eval qq| require $helper |;
61        if ($@) { Carp::croak $@; }
62    }
63
64    for my $name (@xs_compati_bit_properties, @pp_bit_properties) {
65        my $flag_name = 'P_' . uc($name);
66
67        eval qq/
68            sub $name {
69                my \$enable = defined \$_[1] ? \$_[1] : 1;
70
71                if (\$enable) {
72                    \$_[0]->{PROPS}->[$flag_name] = 1;
73                }
74                else {
75                    \$_[0]->{PROPS}->[$flag_name] = 0;
76                }
77
78                \$_[0];
79            }
80
81            sub get_$name {
82                \$_[0]->{PROPS}->[$flag_name] ? 1 : '';
83            }
84        /;
85    }
86
87}
88
89
90
91# Functions
92
93my %encode_allow_method
94     = map {($_ => 1)} qw/utf8 pretty allow_nonref latin1 self_encode escape_slash
95                          allow_blessed convert_blessed indent indent_length allow_bignum
96                          as_nonblessed
97                        /;
98my %decode_allow_method
99     = map {($_ => 1)} qw/utf8 allow_nonref loose allow_singlequote allow_bignum
100                          allow_barekey max_size relaxed/;
101
102
103my $JSON; # cache
104
105sub encode_json ($) { # encode
106    ($JSON ||= __PACKAGE__->new->utf8)->encode(@_);
107}
108
109
110sub decode_json { # decode
111    ($JSON ||= __PACKAGE__->new->utf8)->decode(@_);
112}
113
114# Obsoleted
115
116sub to_json($) {
117   Carp::croak ("JSON::PP::to_json has been renamed to encode_json.");
118}
119
120
121sub from_json($) {
122   Carp::croak ("JSON::PP::from_json has been renamed to decode_json.");
123}
124
125
126# Methods
127
128sub new {
129    my $class = shift;
130    my $self  = {
131        max_depth   => 512,
132        max_size    => 0,
133        indent      => 0,
134        FLAGS       => 0,
135        fallback      => sub { encode_error('Invalid value. JSON can only reference.') },
136        indent_length => 3,
137    };
138
139    bless $self, $class;
140}
141
142
143sub encode {
144    return $_[0]->PP_encode_json($_[1]);
145}
146
147
148sub decode {
149    return $_[0]->PP_decode_json($_[1], 0x00000000);
150}
151
152
153sub decode_prefix {
154    return $_[0]->PP_decode_json($_[1], 0x00000001);
155}
156
157
158# accessor
159
160
161# pretty printing
162
163sub pretty {
164    my ($self, $v) = @_;
165    my $enable = defined $v ? $v : 1;
166
167    if ($enable) { # indent_length(3) for JSON::XS compatibility
168        $self->indent(1)->indent_length(3)->space_before(1)->space_after(1);
169    }
170    else {
171        $self->indent(0)->space_before(0)->space_after(0);
172    }
173
174    $self;
175}
176
177# etc
178
179sub max_depth {
180    my $max  = defined $_[1] ? $_[1] : 0x80000000;
181    $_[0]->{max_depth} = $max;
182    $_[0];
183}
184
185
186sub get_max_depth { $_[0]->{max_depth}; }
187
188
189sub max_size {
190    my $max  = defined $_[1] ? $_[1] : 0;
191    $_[0]->{max_size} = $max;
192    $_[0];
193}
194
195
196sub get_max_size { $_[0]->{max_size}; }
197
198
199sub filter_json_object {
200    $_[0]->{cb_object} = defined $_[1] ? $_[1] : 0;
201    $_[0]->{F_HOOK} = ($_[0]->{cb_object} or $_[0]->{cb_sk_object}) ? 1 : 0;
202    $_[0];
203}
204
205sub filter_json_single_key_object {
206    if (@_ > 1) {
207        $_[0]->{cb_sk_object}->{$_[1]} = $_[2];
208    }
209    $_[0]->{F_HOOK} = ($_[0]->{cb_object} or $_[0]->{cb_sk_object}) ? 1 : 0;
210    $_[0];
211}
212
213sub indent_length {
214    if (!defined $_[1] or $_[1] > 15 or $_[1] < 0) {
215        Carp::carp "The acceptable range of indent_length() is 0 to 15.";
216    }
217    else {
218        $_[0]->{indent_length} = $_[1];
219    }
220    $_[0];
221}
222
223sub get_indent_length {
224    $_[0]->{indent_length};
225}
226
227sub sort_by {
228    $_[0]->{sort_by} = defined $_[1] ? $_[1] : 1;
229    $_[0];
230}
231
232sub allow_bigint {
233    Carp::carp("allow_bigint() is obsoleted. use allow_bignum() insted.");
234}
235
236###############################
237
238###
239### Perl => JSON
240###
241
242
243{ # Convert
244
245    my $max_depth;
246    my $indent;
247    my $ascii;
248    my $latin1;
249    my $utf8;
250    my $space_before;
251    my $space_after;
252    my $canonical;
253    my $allow_blessed;
254    my $convert_blessed;
255
256    my $indent_length;
257    my $escape_slash;
258    my $bignum;
259    my $as_nonblessed;
260
261    my $depth;
262    my $indent_count;
263    my $keysort;
264
265
266    sub PP_encode_json {
267        my $self = shift;
268        my $obj  = shift;
269
270        $indent_count = 0;
271        $depth        = 0;
272
273        my $idx = $self->{PROPS};
274
275        ($ascii, $latin1, $utf8, $indent, $canonical, $space_before, $space_after, $allow_blessed,
276            $convert_blessed, $escape_slash, $bignum, $as_nonblessed)
277         = @{$idx}[P_ASCII .. P_SPACE_AFTER, P_ALLOW_BLESSED, P_CONVERT_BLESSED,
278                    P_ESCAPE_SLASH, P_ALLOW_BIGNUM, P_AS_NONBLESSED];
279
280        ($max_depth, $indent_length) = @{$self}{qw/max_depth indent_length/};
281
282        $keysort = $canonical ? sub { $a cmp $b } : undef;
283
284        if ($self->{sort_by}) {
285            $keysort = ref($self->{sort_by}) eq 'CODE' ? $self->{sort_by}
286                     : $self->{sort_by} =~ /\D+/       ? $self->{sort_by}
287                     : sub { $a cmp $b };
288        }
289
290        encode_error("hash- or arrayref expected (not a simple scalar, use allow_nonref to allow this)")
291             if(!ref $obj and !$idx->[ P_ALLOW_NONREF ]);
292
293        my $str  = $self->object_to_json($obj);
294
295        $str .= "\n" if ( $indent ); # JSON::XS 2.26 compatible
296
297        unless ($ascii or $latin1 or $utf8) {
298            utf8::upgrade($str);
299        }
300
301        if ($idx->[ P_SHRINK ]) {
302            utf8::downgrade($str, 1);
303        }
304
305        return $str;
306    }
307
308
309    sub object_to_json {
310        my ($self, $obj) = @_;
311        my $type = ref($obj);
312
313        if($type eq 'HASH'){
314            return $self->hash_to_json($obj);
315        }
316        elsif($type eq 'ARRAY'){
317            return $self->array_to_json($obj);
318        }
319        elsif ($type) { # blessed object?
320            if (blessed($obj)) {
321
322                return $self->value_to_json($obj) if ( $obj->isa('JSON::PP::Boolean') );
323
324                if ( $convert_blessed and $obj->can('TO_JSON') ) {
325                    my $result = $obj->TO_JSON();
326                    if ( defined $result and ref( $result ) ) {
327                        if ( refaddr( $obj ) eq refaddr( $result ) ) {
328                            encode_error( sprintf(
329                                "%s::TO_JSON method returned same object as was passed instead of a new one",
330                                ref $obj
331                            ) );
332                        }
333                    }
334
335                    return $self->object_to_json( $result );
336                }
337
338                return "$obj" if ( $bignum and _is_bignum($obj) );
339                return $self->blessed_to_json($obj) if ($allow_blessed and $as_nonblessed); # will be removed.
340
341                encode_error( sprintf("encountered object '%s', but neither allow_blessed "
342                    . "nor convert_blessed settings are enabled", $obj)
343                ) unless ($allow_blessed);
344
345                return 'null';
346            }
347            else {
348                return $self->value_to_json($obj);
349            }
350        }
351        else{
352            return $self->value_to_json($obj);
353        }
354    }
355
356
357    sub hash_to_json {
358        my ($self, $obj) = @_;
359        my @res;
360
361        encode_error("json text or perl structure exceeds maximum nesting level (max_depth set too low?)")
362                                         if (++$depth > $max_depth);
363
364        my ($pre, $post) = $indent ? $self->_up_indent() : ('', '');
365        my $del = ($space_before ? ' ' : '') . ':' . ($space_after ? ' ' : '');
366
367        for my $k ( _sort( $obj ) ) {
368            if ( OLD_PERL ) { utf8::decode($k) } # key for Perl 5.6 / be optimized
369            push @res, string_to_json( $self, $k )
370                          .  $del
371                          . ( $self->object_to_json( $obj->{$k} ) || $self->value_to_json( $obj->{$k} ) );
372        }
373
374        --$depth;
375        $self->_down_indent() if ($indent);
376
377        return   '{' . ( @res ? $pre : '' ) . ( @res ? join( ",$pre", @res ) . $post : '' )  . '}';
378    }
379
380
381    sub array_to_json {
382        my ($self, $obj) = @_;
383        my @res;
384
385        encode_error("json text or perl structure exceeds maximum nesting level (max_depth set too low?)")
386                                         if (++$depth > $max_depth);
387
388        my ($pre, $post) = $indent ? $self->_up_indent() : ('', '');
389
390        for my $v (@$obj){
391            push @res, $self->object_to_json($v) || $self->value_to_json($v);
392        }
393
394        --$depth;
395        $self->_down_indent() if ($indent);
396
397        return '[' . ( @res ? $pre : '' ) . ( @res ? join( ",$pre", @res ) . $post : '' ) . ']';
398    }
399
400
401    sub value_to_json {
402        my ($self, $value) = @_;
403
404        return 'null' if(!defined $value);
405
406        my $b_obj = B::svref_2object(\$value);  # for round trip problem
407        my $flags = $b_obj->FLAGS;
408
409        return $value # as is
410            if $flags & ( B::SVp_IOK | B::SVp_NOK ) and !( $flags & B::SVp_POK ); # SvTYPE is IV or NV?
411
412        my $type = ref($value);
413
414        if(!$type){
415            return string_to_json($self, $value);
416        }
417        elsif( blessed($value) and  $value->isa('JSON::PP::Boolean') ){
418            return $$value == 1 ? 'true' : 'false';
419        }
420        elsif ($type) {
421            if ((overload::StrVal($value) =~ /=(\w+)/)[0]) {
422                return $self->value_to_json("$value");
423            }
424
425            if ($type eq 'SCALAR' and defined $$value) {
426                return   $$value eq '1' ? 'true'
427                       : $$value eq '0' ? 'false'
428                       : $self->{PROPS}->[ P_ALLOW_UNKNOWN ] ? 'null'
429                       : encode_error("cannot encode reference to scalar");
430            }
431
432             if ( $self->{PROPS}->[ P_ALLOW_UNKNOWN ] ) {
433                 return 'null';
434             }
435             else {
436                 if ( $type eq 'SCALAR' or $type eq 'REF' ) {
437                    encode_error("cannot encode reference to scalar");
438                 }
439                 else {
440                    encode_error("encountered $value, but JSON can only represent references to arrays or hashes");
441                 }
442             }
443
444        }
445        else {
446            return $self->{fallback}->($value)
447                 if ($self->{fallback} and ref($self->{fallback}) eq 'CODE');
448            return 'null';
449        }
450
451    }
452
453
454    my %esc = (
455        "\n" => '\n',
456        "\r" => '\r',
457        "\t" => '\t',
458        "\f" => '\f',
459        "\b" => '\b',
460        "\"" => '\"',
461        "\\" => '\\\\',
462        "\'" => '\\\'',
463    );
464
465
466    sub string_to_json {
467        my ($self, $arg) = @_;
468
469        $arg =~ s/([\x22\x5c\n\r\t\f\b])/$esc{$1}/g;
470        $arg =~ s/\//\\\//g if ($escape_slash);
471        $arg =~ s/([\x00-\x08\x0b\x0e-\x1f])/'\\u00' . unpack('H2', $1)/eg;
472
473        if ($ascii) {
474            $arg = JSON_PP_encode_ascii($arg);
475        }
476
477        if ($latin1) {
478            $arg = JSON_PP_encode_latin1($arg);
479        }
480
481        if ($utf8) {
482            utf8::encode($arg);
483        }
484
485        return '"' . $arg . '"';
486    }
487
488
489    sub blessed_to_json {
490        my $reftype = reftype($_[1]) || '';
491        if ($reftype eq 'HASH') {
492            return $_[0]->hash_to_json($_[1]);
493        }
494        elsif ($reftype eq 'ARRAY') {
495            return $_[0]->array_to_json($_[1]);
496        }
497        else {
498            return 'null';
499        }
500    }
501
502
503    sub encode_error {
504        my $error  = shift;
505        Carp::croak "$error";
506    }
507
508
509    sub _sort {
510        defined $keysort ? (sort $keysort (keys %{$_[0]})) : keys %{$_[0]};
511    }
512
513
514    sub _up_indent {
515        my $self  = shift;
516        my $space = ' ' x $indent_length;
517
518        my ($pre,$post) = ('','');
519
520        $post = "\n" . $space x $indent_count;
521
522        $indent_count++;
523
524        $pre = "\n" . $space x $indent_count;
525
526        return ($pre,$post);
527    }
528
529
530    sub _down_indent { $indent_count--; }
531
532
533    sub PP_encode_box {
534        {
535            depth        => $depth,
536            indent_count => $indent_count,
537        };
538    }
539
540} # Convert
541
542
543sub _encode_ascii {
544    join('',
545        map {
546            $_ <= 127 ?
547                chr($_) :
548            $_ <= 65535 ?
549                sprintf('\u%04x', $_) : sprintf('\u%x\u%x', _encode_surrogates($_));
550        } unpack('U*', $_[0])
551    );
552}
553
554
555sub _encode_latin1 {
556    join('',
557        map {
558            $_ <= 255 ?
559                chr($_) :
560            $_ <= 65535 ?
561                sprintf('\u%04x', $_) : sprintf('\u%x\u%x', _encode_surrogates($_));
562        } unpack('U*', $_[0])
563    );
564}
565
566
567sub _encode_surrogates { # from perlunicode
568    my $uni = $_[0] - 0x10000;
569    return ($uni / 0x400 + 0xD800, $uni % 0x400 + 0xDC00);
570}
571
572
573sub _is_bignum {
574    $_[0]->isa('Math::BigInt') or $_[0]->isa('Math::BigFloat');
575}
576
577
578
579#
580# JSON => Perl
581#
582
583my $max_intsize;
584
585BEGIN {
586    my $checkint = 1111;
587    for my $d (5..64) {
588        $checkint .= 1;
589        my $int   = eval qq| $checkint |;
590        if ($int =~ /[eE]/) {
591            $max_intsize = $d - 1;
592            last;
593        }
594    }
595}
596
597{ # PARSE
598
599    my %escapes = ( #  by Jeremy Muhlich <jmuhlich [at] bitflood.org>
600        b    => "\x8",
601        t    => "\x9",
602        n    => "\xA",
603        f    => "\xC",
604        r    => "\xD",
605        '\\' => '\\',
606        '"'  => '"',
607        '/'  => '/',
608    );
609
610    my $text; # json data
611    my $at;   # offset
612    my $ch;   # 1chracter
613    my $len;  # text length (changed according to UTF8 or NON UTF8)
614    # INTERNAL
615    my $depth;          # nest counter
616    my $encoding;       # json text encoding
617    my $is_valid_utf8;  # temp variable
618    my $utf8_len;       # utf8 byte length
619    # FLAGS
620    my $utf8;           # must be utf8
621    my $max_depth;      # max nest nubmer of objects and arrays
622    my $max_size;
623    my $relaxed;
624    my $cb_object;
625    my $cb_sk_object;
626
627    my $F_HOOK;
628
629    my $allow_bigint;   # using Math::BigInt
630    my $singlequote;    # loosely quoting
631    my $loose;          #
632    my $allow_barekey;  # bareKey
633
634    # $opt flag
635    # 0x00000001 .... decode_prefix
636    # 0x10000000 .... incr_parse
637
638    sub PP_decode_json {
639        my ($self, $opt); # $opt is an effective flag during this decode_json.
640
641        ($self, $text, $opt) = @_;
642
643        ($at, $ch, $depth) = (0, '', 0);
644
645        if ( !defined $text or ref $text ) {
646            decode_error("malformed JSON string, neither array, object, number, string or atom");
647        }
648
649        my $idx = $self->{PROPS};
650
651        ($utf8, $relaxed, $loose, $allow_bigint, $allow_barekey, $singlequote)
652            = @{$idx}[P_UTF8, P_RELAXED, P_LOOSE .. P_ALLOW_SINGLEQUOTE];
653
654        if ( $utf8 ) {
655            utf8::downgrade( $text, 1 ) or Carp::croak("Wide character in subroutine entry");
656        }
657        else {
658            utf8::upgrade( $text );
659        }
660
661        $len = length $text;
662
663        ($max_depth, $max_size, $cb_object, $cb_sk_object, $F_HOOK)
664             = @{$self}{qw/max_depth  max_size cb_object cb_sk_object F_HOOK/};
665
666        if ($max_size > 1) {
667            use bytes;
668            my $bytes = length $text;
669            decode_error(
670                sprintf("attempted decode of JSON text of %s bytes size, but max_size is set to %s"
671                    , $bytes, $max_size), 1
672            ) if ($bytes > $max_size);
673        }
674
675        # Currently no effect
676        # should use regexp
677        my @octets = unpack('C4', $text);
678        $encoding =   ( $octets[0] and  $octets[1]) ? 'UTF-8'
679                    : (!$octets[0] and  $octets[1]) ? 'UTF-16BE'
680                    : (!$octets[0] and !$octets[1]) ? 'UTF-32BE'
681                    : ( $octets[2]                ) ? 'UTF-16LE'
682                    : (!$octets[2]                ) ? 'UTF-32LE'
683                    : 'unknown';
684
685        white(); # remove head white space
686
687        my $valid_start = defined $ch; # Is there a first character for JSON structure?
688
689        my $result = value();
690
691        return undef if ( !$result && ( $opt & 0x10000000 ) ); # for incr_parse
692
693        decode_error("malformed JSON string, neither array, object, number, string or atom") unless $valid_start;
694
695        if ( !$idx->[ P_ALLOW_NONREF ] and !ref $result ) {
696                decode_error(
697                'JSON text must be an object or array (but found number, string, true, false or null,'
698                       . ' use allow_nonref to allow this)', 1);
699        }
700
701        Carp::croak('something wrong.') if $len < $at; # we won't arrive here.
702
703        my $consumed = defined $ch ? $at - 1 : $at; # consumed JSON text length
704
705        white(); # remove tail white space
706
707        if ( $ch ) {
708            return ( $result, $consumed ) if ($opt & 0x00000001); # all right if decode_prefix
709            decode_error("garbage after JSON object");
710        }
711
712        ( $opt & 0x00000001 ) ? ( $result, $consumed ) : $result;
713    }
714
715
716    sub next_chr {
717        return $ch = undef if($at >= $len);
718        $ch = substr($text, $at++, 1);
719    }
720
721
722    sub value {
723        white();
724        return          if(!defined $ch);
725        return object() if($ch eq '{');
726        return array()  if($ch eq '[');
727        return string() if($ch eq '"' or ($singlequote and $ch eq "'"));
728        return number() if($ch =~ /[0-9]/ or $ch eq '-');
729        return word();
730    }
731
732    sub string {
733        my ($i, $s, $t, $u);
734        my $utf16;
735        my $is_utf8;
736
737        ($is_valid_utf8, $utf8_len) = ('', 0);
738
739        $s = ''; # basically UTF8 flag on
740
741        if($ch eq '"' or ($singlequote and $ch eq "'")){
742            my $boundChar = $ch;
743
744            OUTER: while( defined(next_chr()) ){
745
746                if($ch eq $boundChar){
747                    next_chr();
748
749                    if ($utf16) {
750                        decode_error("missing low surrogate character in surrogate pair");
751                    }
752
753                    utf8::decode($s) if($is_utf8);
754
755                    return $s;
756                }
757                elsif($ch eq '\\'){
758                    next_chr();
759                    if(exists $escapes{$ch}){
760                        $s .= $escapes{$ch};
761                    }
762                    elsif($ch eq 'u'){ # UNICODE handling
763                        my $u = '';
764
765                        for(1..4){
766                            $ch = next_chr();
767                            last OUTER if($ch !~ /[0-9a-fA-F]/);
768                            $u .= $ch;
769                        }
770
771                        # U+D800 - U+DBFF
772                        if ($u =~ /^[dD][89abAB][0-9a-fA-F]{2}/) { # UTF-16 high surrogate?
773                            $utf16 = $u;
774                        }
775                        # U+DC00 - U+DFFF
776                        elsif ($u =~ /^[dD][c-fC-F][0-9a-fA-F]{2}/) { # UTF-16 low surrogate?
777                            unless (defined $utf16) {
778                                decode_error("missing high surrogate character in surrogate pair");
779                            }
780                            $is_utf8 = 1;
781                            $s .= JSON_PP_decode_surrogates($utf16, $u) || next;
782                            $utf16 = undef;
783                        }
784                        else {
785                            if (defined $utf16) {
786                                decode_error("surrogate pair expected");
787                            }
788
789                            if ( ( my $hex = hex( $u ) ) > 127 ) {
790                                $is_utf8 = 1;
791                                $s .= JSON_PP_decode_unicode($u) || next;
792                            }
793                            else {
794                                $s .= chr $hex;
795                            }
796                        }
797
798                    }
799                    else{
800                        unless ($loose) {
801                            $at -= 2;
802                            decode_error('illegal backslash escape sequence in string');
803                        }
804                        $s .= $ch;
805                    }
806                }
807                else{
808
809                    if ( ord $ch  > 127 ) {
810                        if ( $utf8 ) {
811                            unless( $ch = is_valid_utf8($ch) ) {
812                                $at -= 1;
813                                decode_error("malformed UTF-8 character in JSON string");
814                            }
815                            else {
816                                $at += $utf8_len - 1;
817                            }
818                        }
819                        else {
820                            utf8::encode( $ch );
821                        }
822
823                        $is_utf8 = 1;
824                    }
825
826                    if (!$loose) {
827                        if ($ch =~ /[\x00-\x1f\x22\x5c]/)  { # '/' ok
828                            $at--;
829                            decode_error('invalid character encountered while parsing JSON string');
830                        }
831                    }
832
833                    $s .= $ch;
834                }
835            }
836        }
837
838        decode_error("unexpected end of string while parsing JSON string");
839    }
840
841
842    sub white {
843        while( defined $ch  ){
844            if($ch le ' '){
845                next_chr();
846            }
847            elsif($ch eq '/'){
848                next_chr();
849                if(defined $ch and $ch eq '/'){
850                    1 while(defined(next_chr()) and $ch ne "\n" and $ch ne "\r");
851                }
852                elsif(defined $ch and $ch eq '*'){
853                    next_chr();
854                    while(1){
855                        if(defined $ch){
856                            if($ch eq '*'){
857                                if(defined(next_chr()) and $ch eq '/'){
858                                    next_chr();
859                                    last;
860                                }
861                            }
862                            else{
863                                next_chr();
864                            }
865                        }
866                        else{
867                            decode_error("Unterminated comment");
868                        }
869                    }
870                    next;
871                }
872                else{
873                    $at--;
874                    decode_error("malformed JSON string, neither array, object, number, string or atom");
875                }
876            }
877            else{
878                if ($relaxed and $ch eq '#') { # correctly?
879                    pos($text) = $at;
880                    $text =~ /\G([^\n]*(?:\r\n|\r|\n|$))/g;
881                    $at = pos($text);
882                    next_chr;
883                    next;
884                }
885
886                last;
887            }
888        }
889    }
890
891
892    sub array {
893        my $a  = $_[0] || []; # you can use this code to use another array ref object.
894
895        decode_error('json text or perl structure exceeds maximum nesting level (max_depth set too low?)')
896                                                    if (++$depth > $max_depth);
897
898        next_chr();
899        white();
900
901        if(defined $ch and $ch eq ']'){
902            --$depth;
903            next_chr();
904            return $a;
905        }
906        else {
907            while(defined($ch)){
908                push @$a, value();
909
910                white();
911
912                if (!defined $ch) {
913                    last;
914                }
915
916                if($ch eq ']'){
917                    --$depth;
918                    next_chr();
919                    return $a;
920                }
921
922                if($ch ne ','){
923                    last;
924                }
925
926                next_chr();
927                white();
928
929                if ($relaxed and $ch eq ']') {
930                    --$depth;
931                    next_chr();
932                    return $a;
933                }
934
935            }
936        }
937
938        decode_error(", or ] expected while parsing array");
939    }
940
941
942    sub object {
943        my $o = $_[0] || {}; # you can use this code to use another hash ref object.
944        my $k;
945
946        decode_error('json text or perl structure exceeds maximum nesting level (max_depth set too low?)')
947                                                if (++$depth > $max_depth);
948        next_chr();
949        white();
950
951        if(defined $ch and $ch eq '}'){
952            --$depth;
953            next_chr();
954            if ($F_HOOK) {
955                return _json_object_hook($o);
956            }
957            return $o;
958        }
959        else {
960            while (defined $ch) {
961                $k = ($allow_barekey and $ch ne '"' and $ch ne "'") ? bareKey() : string();
962                white();
963
964                if(!defined $ch or $ch ne ':'){
965                    $at--;
966                    decode_error("':' expected");
967                }
968
969                next_chr();
970                $o->{$k} = value();
971                white();
972
973                last if (!defined $ch);
974
975                if($ch eq '}'){
976                    --$depth;
977                    next_chr();
978                    if ($F_HOOK) {
979                        return _json_object_hook($o);
980                    }
981                    return $o;
982                }
983
984                if($ch ne ','){
985                    last;
986                }
987
988                next_chr();
989                white();
990
991                if ($relaxed and $ch eq '}') {
992                    --$depth;
993                    next_chr();
994                    if ($F_HOOK) {
995                        return _json_object_hook($o);
996                    }
997                    return $o;
998                }
999
1000            }
1001
1002        }
1003
1004        $at--;
1005        decode_error(", or } expected while parsing object/hash");
1006    }
1007
1008
1009    sub bareKey { # doesn't strictly follow Standard ECMA-262 3rd Edition
1010        my $key;
1011        while($ch =~ /[^\x00-\x23\x25-\x2F\x3A-\x40\x5B-\x5E\x60\x7B-\x7F]/){
1012            $key .= $ch;
1013            next_chr();
1014        }
1015        return $key;
1016    }
1017
1018
1019    sub word {
1020        my $word =  substr($text,$at-1,4);
1021
1022        if($word eq 'true'){
1023            $at += 3;
1024            next_chr;
1025            return $JSON::PP::true;
1026        }
1027        elsif($word eq 'null'){
1028            $at += 3;
1029            next_chr;
1030            return undef;
1031        }
1032        elsif($word eq 'fals'){
1033            $at += 3;
1034            if(substr($text,$at,1) eq 'e'){
1035                $at++;
1036                next_chr;
1037                return $JSON::PP::false;
1038            }
1039        }
1040
1041        $at--; # for decode_error report
1042
1043        decode_error("'null' expected")  if ($word =~ /^n/);
1044        decode_error("'true' expected")  if ($word =~ /^t/);
1045        decode_error("'false' expected") if ($word =~ /^f/);
1046        decode_error("malformed JSON string, neither array, object, number, string or atom");
1047    }
1048
1049
1050    sub number {
1051        my $n    = '';
1052        my $v;
1053
1054        # According to RFC4627, hex or oct digts are invalid.
1055        if($ch eq '0'){
1056            my $peek = substr($text,$at,1);
1057            my $hex  = $peek =~ /[xX]/; # 0 or 1
1058
1059            if($hex){
1060                decode_error("malformed number (leading zero must not be followed by another digit)");
1061                ($n) = ( substr($text, $at+1) =~ /^([0-9a-fA-F]+)/);
1062            }
1063            else{ # oct
1064                ($n) = ( substr($text, $at) =~ /^([0-7]+)/);
1065                if (defined $n and length $n > 1) {
1066                    decode_error("malformed number (leading zero must not be followed by another digit)");
1067                }
1068            }
1069
1070            if(defined $n and length($n)){
1071                if (!$hex and length($n) == 1) {
1072                   decode_error("malformed number (leading zero must not be followed by another digit)");
1073                }
1074                $at += length($n) + $hex;
1075                next_chr;
1076                return $hex ? hex($n) : oct($n);
1077            }
1078        }
1079
1080        if($ch eq '-'){
1081            $n = '-';
1082            next_chr;
1083            if (!defined $ch or $ch !~ /\d/) {
1084                decode_error("malformed number (no digits after initial minus)");
1085            }
1086        }
1087
1088        while(defined $ch and $ch =~ /\d/){
1089            $n .= $ch;
1090            next_chr;
1091        }
1092
1093        if(defined $ch and $ch eq '.'){
1094            $n .= '.';
1095
1096            next_chr;
1097            if (!defined $ch or $ch !~ /\d/) {
1098                decode_error("malformed number (no digits after decimal point)");
1099            }
1100            else {
1101                $n .= $ch;
1102            }
1103
1104            while(defined(next_chr) and $ch =~ /\d/){
1105                $n .= $ch;
1106            }
1107        }
1108
1109        if(defined $ch and ($ch eq 'e' or $ch eq 'E')){
1110            $n .= $ch;
1111            next_chr;
1112
1113            if(defined($ch) and ($ch eq '+' or $ch eq '-')){
1114                $n .= $ch;
1115                next_chr;
1116                if (!defined $ch or $ch =~ /\D/) {
1117                    decode_error("malformed number (no digits after exp sign)");
1118                }
1119                $n .= $ch;
1120            }
1121            elsif(defined($ch) and $ch =~ /\d/){
1122                $n .= $ch;
1123            }
1124            else {
1125                decode_error("malformed number (no digits after exp sign)");
1126            }
1127
1128            while(defined(next_chr) and $ch =~ /\d/){
1129                $n .= $ch;
1130            }
1131
1132        }
1133
1134        $v .= $n;
1135
1136        if ($v !~ /[.eE]/ and length $v > $max_intsize) {
1137            if ($allow_bigint) { # from Adam Sussman
1138                require Math::BigInt;
1139                return Math::BigInt->new($v);
1140            }
1141            else {
1142                return "$v";
1143            }
1144        }
1145        elsif ($allow_bigint) {
1146            require Math::BigFloat;
1147            return Math::BigFloat->new($v);
1148        }
1149
1150        return 0+$v;
1151    }
1152
1153
1154    sub is_valid_utf8 {
1155
1156        $utf8_len = $_[0] =~ /[\x00-\x7F]/  ? 1
1157                  : $_[0] =~ /[\xC2-\xDF]/  ? 2
1158                  : $_[0] =~ /[\xE0-\xEF]/  ? 3
1159                  : $_[0] =~ /[\xF0-\xF4]/  ? 4
1160                  : 0
1161                  ;
1162
1163        return unless $utf8_len;
1164
1165        my $is_valid_utf8 = substr($text, $at - 1, $utf8_len);
1166
1167        return ( $is_valid_utf8 =~ /^(?:
1168             [\x00-\x7F]
1169            |[\xC2-\xDF][\x80-\xBF]
1170            |[\xE0][\xA0-\xBF][\x80-\xBF]
1171            |[\xE1-\xEC][\x80-\xBF][\x80-\xBF]
1172            |[\xED][\x80-\x9F][\x80-\xBF]
1173            |[\xEE-\xEF][\x80-\xBF][\x80-\xBF]
1174            |[\xF0][\x90-\xBF][\x80-\xBF][\x80-\xBF]
1175            |[\xF1-\xF3][\x80-\xBF][\x80-\xBF][\x80-\xBF]
1176            |[\xF4][\x80-\x8F][\x80-\xBF][\x80-\xBF]
1177        )$/x )  ? $is_valid_utf8 : '';
1178    }
1179
1180
1181    sub decode_error {
1182        my $error  = shift;
1183        my $no_rep = shift;
1184        my $str    = defined $text ? substr($text, $at) : '';
1185        my $mess   = '';
1186        my $type   = $] >= 5.008           ? 'U*'
1187                   : $] <  5.006           ? 'C*'
1188                   : utf8::is_utf8( $str ) ? 'U*' # 5.6
1189                   : 'C*'
1190                   ;
1191
1192        for my $c ( unpack( $type, $str ) ) { # emulate pv_uni_display() ?
1193            $mess .=  $c == 0x07 ? '\a'
1194                    : $c == 0x09 ? '\t'
1195                    : $c == 0x0a ? '\n'
1196                    : $c == 0x0d ? '\r'
1197                    : $c == 0x0c ? '\f'
1198                    : $c <  0x20 ? sprintf('\x{%x}', $c)
1199                    : $c == 0x5c ? '\\\\'
1200                    : $c <  0x80 ? chr($c)
1201                    : sprintf('\x{%x}', $c)
1202                    ;
1203            if ( length $mess >= 20 ) {
1204                $mess .= '...';
1205                last;
1206            }
1207        }
1208
1209        unless ( length $mess ) {
1210            $mess = '(end of string)';
1211        }
1212
1213        Carp::croak (
1214            $no_rep ? "$error" : "$error, at character offset $at (before \"$mess\")"
1215        );
1216
1217    }
1218
1219
1220    sub _json_object_hook {
1221        my $o    = $_[0];
1222        my @ks = keys %{$o};
1223
1224        if ( $cb_sk_object and @ks == 1 and exists $cb_sk_object->{ $ks[0] } and ref $cb_sk_object->{ $ks[0] } ) {
1225            my @val = $cb_sk_object->{ $ks[0] }->( $o->{$ks[0]} );
1226            if (@val == 1) {
1227                return $val[0];
1228            }
1229        }
1230
1231        my @val = $cb_object->($o) if ($cb_object);
1232        if (@val == 0 or @val > 1) {
1233            return $o;
1234        }
1235        else {
1236            return $val[0];
1237        }
1238    }
1239
1240
1241    sub PP_decode_box {
1242        {
1243            text    => $text,
1244            at      => $at,
1245            ch      => $ch,
1246            len     => $len,
1247            depth   => $depth,
1248            encoding      => $encoding,
1249            is_valid_utf8 => $is_valid_utf8,
1250        };
1251    }
1252
1253} # PARSE
1254
1255
1256sub _decode_surrogates { # from perlunicode
1257    my $uni = 0x10000 + (hex($_[0]) - 0xD800) * 0x400 + (hex($_[1]) - 0xDC00);
1258    my $un  = pack('U*', $uni);
1259    utf8::encode( $un );
1260    return $un;
1261}
1262
1263
1264sub _decode_unicode {
1265    my $un = pack('U', hex shift);
1266    utf8::encode( $un );
1267    return $un;
1268}
1269
1270#
1271# Setup for various Perl versions (the code from JSON::PP58)
1272#
1273
1274BEGIN {
1275
1276    unless ( defined &utf8::is_utf8 ) {
1277       require Encode;
1278       *utf8::is_utf8 = *Encode::is_utf8;
1279    }
1280
1281    if ( $] >= 5.008 ) {
1282        *JSON::PP::JSON_PP_encode_ascii      = \&_encode_ascii;
1283        *JSON::PP::JSON_PP_encode_latin1     = \&_encode_latin1;
1284        *JSON::PP::JSON_PP_decode_surrogates = \&_decode_surrogates;
1285        *JSON::PP::JSON_PP_decode_unicode    = \&_decode_unicode;
1286    }
1287
1288    if ($] >= 5.008 and $] < 5.008003) { # join() in 5.8.0 - 5.8.2 is broken.
1289        package JSON::PP;
1290        require subs;
1291        subs->import('join');
1292        eval q|
1293            sub join {
1294                return '' if (@_ < 2);
1295                my $j   = shift;
1296                my $str = shift;
1297                for (@_) { $str .= $j . $_; }
1298                return $str;
1299            }
1300        |;
1301    }
1302
1303
1304    sub JSON::PP::incr_parse {
1305        local $Carp::CarpLevel = 1;
1306        ( $_[0]->{_incr_parser} ||= JSON::PP::IncrParser->new )->incr_parse( @_ );
1307    }
1308
1309
1310    sub JSON::PP::incr_skip {
1311        ( $_[0]->{_incr_parser} ||= JSON::PP::IncrParser->new )->incr_skip;
1312    }
1313
1314
1315    sub JSON::PP::incr_reset {
1316        ( $_[0]->{_incr_parser} ||= JSON::PP::IncrParser->new )->incr_reset;
1317    }
1318
1319    eval q{
1320        sub JSON::PP::incr_text : lvalue {
1321            $_[0]->{_incr_parser} ||= JSON::PP::IncrParser->new;
1322
1323            if ( $_[0]->{_incr_parser}->{incr_parsing} ) {
1324                Carp::croak("incr_text can not be called when the incremental parser already started parsing");
1325            }
1326            $_[0]->{_incr_parser}->{incr_text};
1327        }
1328    } if ( $] >= 5.006 );
1329
1330} # Setup for various Perl versions (the code from JSON::PP58)
1331
1332
1333###############################
1334# Utilities
1335#
1336
1337BEGIN {
1338    eval 'require Scalar::Util';
1339    unless($@){
1340        *JSON::PP::blessed = \&Scalar::Util::blessed;
1341        *JSON::PP::reftype = \&Scalar::Util::reftype;
1342        *JSON::PP::refaddr = \&Scalar::Util::refaddr;
1343    }
1344    else{ # This code is from Sclar::Util.
1345        # warn $@;
1346        eval 'sub UNIVERSAL::a_sub_not_likely_to_be_here { ref($_[0]) }';
1347        *JSON::PP::blessed = sub {
1348            local($@, $SIG{__DIE__}, $SIG{__WARN__});
1349            ref($_[0]) ? eval { $_[0]->a_sub_not_likely_to_be_here } : undef;
1350        };
1351        my %tmap = qw(
1352            B::NULL   SCALAR
1353            B::HV     HASH
1354            B::AV     ARRAY
1355            B::CV     CODE
1356            B::IO     IO
1357            B::GV     GLOB
1358            B::REGEXP REGEXP
1359        );
1360        *JSON::PP::reftype = sub {
1361            my $r = shift;
1362
1363            return undef unless length(ref($r));
1364
1365            my $t = ref(B::svref_2object($r));
1366
1367            return
1368                exists $tmap{$t} ? $tmap{$t}
1369              : length(ref($$r)) ? 'REF'
1370              :                    'SCALAR';
1371        };
1372        *JSON::PP::refaddr = sub {
1373          return undef unless length(ref($_[0]));
1374
1375          my $addr;
1376          if(defined(my $pkg = blessed($_[0]))) {
1377            $addr .= bless $_[0], 'Scalar::Util::Fake';
1378            bless $_[0], $pkg;
1379          }
1380          else {
1381            $addr .= $_[0]
1382          }
1383
1384          $addr =~ /0x(\w+)/;
1385          local $^W;
1386          #no warnings 'portable';
1387          hex($1);
1388        }
1389    }
1390}
1391
1392
1393# shamely copied and modified from JSON::XS code.
1394
1395$JSON::PP::true  = do { bless \(my $dummy = 1), "JSON::backportPP::Boolean" };
1396$JSON::PP::false = do { bless \(my $dummy = 0), "JSON::backportPP::Boolean" };
1397
1398sub is_bool { defined $_[0] and UNIVERSAL::isa($_[0], "JSON::PP::Boolean"); }
1399
1400sub true  { $JSON::PP::true  }
1401sub false { $JSON::PP::false }
1402sub null  { undef; }
1403
1404###############################
1405
1406package JSON::backportPP::Boolean;
1407
1408@JSON::backportPP::Boolean::ISA = ('JSON::PP::Boolean');
1409use overload (
1410   "0+"     => sub { ${$_[0]} },
1411   "++"     => sub { $_[0] = ${$_[0]} + 1 },
1412   "--"     => sub { $_[0] = ${$_[0]} - 1 },
1413   fallback => 1,
1414);
1415
1416
1417###############################
1418
1419package
1420    JSON::PP::IncrParser;
1421
1422use strict;
1423
1424use constant INCR_M_WS   => 0; # initial whitespace skipping
1425use constant INCR_M_STR  => 1; # inside string
1426use constant INCR_M_BS   => 2; # inside backslash
1427use constant INCR_M_JSON => 3; # outside anything, count nesting
1428use constant INCR_M_C0   => 4;
1429use constant INCR_M_C1   => 5;
1430
1431$JSON::PP::IncrParser::VERSION = '1.01';
1432
1433my $unpack_format = $] < 5.006 ? 'C*' : 'U*';
1434
1435sub new {
1436    my ( $class ) = @_;
1437
1438    bless {
1439        incr_nest    => 0,
1440        incr_text    => undef,
1441        incr_parsing => 0,
1442        incr_p       => 0,
1443    }, $class;
1444}
1445
1446
1447sub incr_parse {
1448    my ( $self, $coder, $text ) = @_;
1449
1450    $self->{incr_text} = '' unless ( defined $self->{incr_text} );
1451
1452    if ( defined $text ) {
1453        if ( utf8::is_utf8( $text ) and !utf8::is_utf8( $self->{incr_text} ) ) {
1454            utf8::upgrade( $self->{incr_text} ) ;
1455            utf8::decode( $self->{incr_text} ) ;
1456        }
1457        $self->{incr_text} .= $text;
1458    }
1459
1460
1461    my $max_size = $coder->get_max_size;
1462
1463    if ( defined wantarray ) {
1464
1465        $self->{incr_mode} = INCR_M_WS unless defined $self->{incr_mode};
1466
1467        if ( wantarray ) {
1468            my @ret;
1469
1470            $self->{incr_parsing} = 1;
1471
1472            do {
1473                push @ret, $self->_incr_parse( $coder, $self->{incr_text} );
1474
1475                unless ( !$self->{incr_nest} and $self->{incr_mode} == INCR_M_JSON ) {
1476                    $self->{incr_mode} = INCR_M_WS if $self->{incr_mode} != INCR_M_STR;
1477                }
1478
1479            } until ( length $self->{incr_text} >= $self->{incr_p} );
1480
1481            $self->{incr_parsing} = 0;
1482
1483            return @ret;
1484        }
1485        else { # in scalar context
1486            $self->{incr_parsing} = 1;
1487            my $obj = $self->_incr_parse( $coder, $self->{incr_text} );
1488            $self->{incr_parsing} = 0 if defined $obj; # pointed by Martin J. Evans
1489            return $obj ? $obj : undef; # $obj is an empty string, parsing was completed.
1490        }
1491
1492    }
1493
1494}
1495
1496
1497sub _incr_parse {
1498    my ( $self, $coder, $text, $skip ) = @_;
1499    my $p = $self->{incr_p};
1500    my $restore = $p;
1501
1502    my @obj;
1503    my $len = length $text;
1504
1505    if ( $self->{incr_mode} == INCR_M_WS ) {
1506        while ( $len > $p ) {
1507            my $s = substr( $text, $p, 1 );
1508            $p++ and next if ( 0x20 >= unpack($unpack_format, $s) );
1509            $self->{incr_mode} = INCR_M_JSON;
1510            last;
1511       }
1512    }
1513
1514    while ( $len > $p ) {
1515        my $s = substr( $text, $p++, 1 );
1516
1517        if ( $s eq '"' ) {
1518            if (substr( $text, $p - 2, 1 ) eq '\\' ) {
1519                next;
1520            }
1521
1522            if ( $self->{incr_mode} != INCR_M_STR  ) {
1523                $self->{incr_mode} = INCR_M_STR;
1524            }
1525            else {
1526                $self->{incr_mode} = INCR_M_JSON;
1527                unless ( $self->{incr_nest} ) {
1528                    last;
1529                }
1530            }
1531        }
1532
1533        if ( $self->{incr_mode} == INCR_M_JSON ) {
1534
1535            if ( $s eq '[' or $s eq '{' ) {
1536                if ( ++$self->{incr_nest} > $coder->get_max_depth ) {
1537                    Carp::croak('json text or perl structure exceeds maximum nesting level (max_depth set too low?)');
1538                }
1539            }
1540            elsif ( $s eq ']' or $s eq '}' ) {
1541                last if ( --$self->{incr_nest} <= 0 );
1542            }
1543            elsif ( $s eq '#' ) {
1544                while ( $len > $p ) {
1545                    last if substr( $text, $p++, 1 ) eq "\n";
1546                }
1547            }
1548
1549        }
1550
1551    }
1552
1553    $self->{incr_p} = $p;
1554
1555    return if ( $self->{incr_mode} == INCR_M_STR and not $self->{incr_nest} );
1556    return if ( $self->{incr_mode} == INCR_M_JSON and $self->{incr_nest} > 0 );
1557
1558    return '' unless ( length substr( $self->{incr_text}, 0, $p ) );
1559
1560    local $Carp::CarpLevel = 2;
1561
1562    $self->{incr_p} = $restore;
1563    $self->{incr_c} = $p;
1564
1565    my ( $obj, $tail ) = $coder->PP_decode_json( substr( $self->{incr_text}, 0, $p ), 0x10000001 );
1566
1567    $self->{incr_text} = substr( $self->{incr_text}, $p );
1568    $self->{incr_p} = 0;
1569
1570    return $obj or '';
1571}
1572
1573
1574sub incr_text {
1575    if ( $_[0]->{incr_parsing} ) {
1576        Carp::croak("incr_text can not be called when the incremental parser already started parsing");
1577    }
1578    $_[0]->{incr_text};
1579}
1580
1581
1582sub incr_skip {
1583    my $self  = shift;
1584    $self->{incr_text} = substr( $self->{incr_text}, $self->{incr_c} );
1585    $self->{incr_p} = 0;
1586}
1587
1588
1589sub incr_reset {
1590    my $self = shift;
1591    $self->{incr_text}    = undef;
1592    $self->{incr_p}       = 0;
1593    $self->{incr_mode}    = 0;
1594    $self->{incr_nest}    = 0;
1595    $self->{incr_parsing} = 0;
1596}
1597
1598###############################
1599
1600
16011;
1602__END__
1603=pod
1604
1605=head1 NAME
1606
1607JSON::PP - JSON::XS compatible pure-Perl module.
1608
1609=head1 SYNOPSIS
1610
1611 use JSON::PP;
1612
1613 # exported functions, they croak on error
1614 # and expect/generate UTF-8
1615
1616 $utf8_encoded_json_text = encode_json $perl_hash_or_arrayref;
1617 $perl_hash_or_arrayref  = decode_json $utf8_encoded_json_text;
1618
1619 # OO-interface
1620
1621 $coder = JSON::PP->new->ascii->pretty->allow_nonref;
1622
1623 $json_text   = $json->encode( $perl_scalar );
1624 $perl_scalar = $json->decode( $json_text );
1625
1626 $pretty_printed = $json->pretty->encode( $perl_scalar ); # pretty-printing
1627
1628 # Note that JSON version 2.0 and above will automatically use
1629 # JSON::XS or JSON::PP, so you should be able to just:
1630
1631 use JSON;
1632
1633
1634=head1 VERSION
1635
1636    2.27200
1637
1638L<JSON::XS> 2.27 (~2.30) compatible.
1639
1640=head1 DESCRIPTION
1641
1642This module is L<JSON::XS> compatible pure Perl module.
1643(Perl 5.8 or later is recommended)
1644
1645JSON::XS is the fastest and most proper JSON module on CPAN.
1646It is written by Marc Lehmann in C, so must be compiled and
1647installed in the used environment.
1648
1649JSON::PP is a pure-Perl module and has compatibility to JSON::XS.
1650
1651
1652=head2 FEATURES
1653
1654=over
1655
1656=item * correct unicode handling
1657
1658This module knows how to handle Unicode (depending on Perl version).
1659
1660See to L<JSON::XS/A FEW NOTES ON UNICODE AND PERL> and L<UNICODE HANDLING ON PERLS>.
1661
1662
1663=item * round-trip integrity
1664
1665When you serialise a perl data structure using only data types supported
1666by JSON and Perl, the deserialised data structure is identical on the Perl
1667level. (e.g. the string "2.0" doesn't suddenly become "2" just because
1668it looks like a number). There I<are> minor exceptions to this, read the
1669MAPPING section below to learn about those.
1670
1671
1672=item * strict checking of JSON correctness
1673
1674There is no guessing, no generating of illegal JSON texts by default,
1675and only JSON is accepted as input by default (the latter is a security feature).
1676But when some options are set, loose chcking features are available.
1677
1678=back
1679
1680=head1 FUNCTIONAL INTERFACE
1681
1682Some documents are copied and modified from L<JSON::XS/FUNCTIONAL INTERFACE>.
1683
1684=head2 encode_json
1685
1686    $json_text = encode_json $perl_scalar
1687
1688Converts the given Perl data structure to a UTF-8 encoded, binary string.
1689
1690This function call is functionally identical to:
1691
1692    $json_text = JSON::PP->new->utf8->encode($perl_scalar)
1693
1694=head2 decode_json
1695
1696    $perl_scalar = decode_json $json_text
1697
1698The opposite of C<encode_json>: expects an UTF-8 (binary) string and tries
1699to parse that as an UTF-8 encoded JSON text, returning the resulting
1700reference.
1701
1702This function call is functionally identical to:
1703
1704    $perl_scalar = JSON::PP->new->utf8->decode($json_text)
1705
1706=head2 JSON::PP::is_bool
1707
1708    $is_boolean = JSON::PP::is_bool($scalar)
1709
1710Returns true if the passed scalar represents either JSON::PP::true or
1711JSON::PP::false, two constants that act like C<1> and C<0> respectively
1712and are also used to represent JSON C<true> and C<false> in Perl strings.
1713
1714=head2 JSON::PP::true
1715
1716Returns JSON true value which is blessed object.
1717It C<isa> JSON::PP::Boolean object.
1718
1719=head2 JSON::PP::false
1720
1721Returns JSON false value which is blessed object.
1722It C<isa> JSON::PP::Boolean object.
1723
1724=head2 JSON::PP::null
1725
1726Returns C<undef>.
1727
1728See L<MAPPING>, below, for more information on how JSON values are mapped to
1729Perl.
1730
1731
1732=head1 HOW DO I DECODE A DATA FROM OUTER AND ENCODE TO OUTER
1733
1734This section supposes that your perl vresion is 5.8 or later.
1735
1736If you know a JSON text from an outer world - a network, a file content, and so on,
1737is encoded in UTF-8, you should use C<decode_json> or C<JSON> module object
1738with C<utf8> enable. And the decoded result will contain UNICODE characters.
1739
1740  # from network
1741  my $json        = JSON::PP->new->utf8;
1742  my $json_text   = CGI->new->param( 'json_data' );
1743  my $perl_scalar = $json->decode( $json_text );
1744
1745  # from file content
1746  local $/;
1747  open( my $fh, '<', 'json.data' );
1748  $json_text   = <$fh>;
1749  $perl_scalar = decode_json( $json_text );
1750
1751If an outer data is not encoded in UTF-8, firstly you should C<decode> it.
1752
1753  use Encode;
1754  local $/;
1755  open( my $fh, '<', 'json.data' );
1756  my $encoding = 'cp932';
1757  my $unicode_json_text = decode( $encoding, <$fh> ); # UNICODE
1758
1759  # or you can write the below code.
1760  #
1761  # open( my $fh, "<:encoding($encoding)", 'json.data' );
1762  # $unicode_json_text = <$fh>;
1763
1764In this case, C<$unicode_json_text> is of course UNICODE string.
1765So you B<cannot> use C<decode_json> nor C<JSON> module object with C<utf8> enable.
1766Instead of them, you use C<JSON> module object with C<utf8> disable.
1767
1768  $perl_scalar = $json->utf8(0)->decode( $unicode_json_text );
1769
1770Or C<encode 'utf8'> and C<decode_json>:
1771
1772  $perl_scalar = decode_json( encode( 'utf8', $unicode_json_text ) );
1773  # this way is not efficient.
1774
1775And now, you want to convert your C<$perl_scalar> into JSON data and
1776send it to an outer world - a network or a file content, and so on.
1777
1778Your data usually contains UNICODE strings and you want the converted data to be encoded
1779in UTF-8, you should use C<encode_json> or C<JSON> module object with C<utf8> enable.
1780
1781  print encode_json( $perl_scalar ); # to a network? file? or display?
1782  # or
1783  print $json->utf8->encode( $perl_scalar );
1784
1785If C<$perl_scalar> does not contain UNICODE but C<$encoding>-encoded strings
1786for some reason, then its characters are regarded as B<latin1> for perl
1787(because it does not concern with your $encoding).
1788You B<cannot> use C<encode_json> nor C<JSON> module object with C<utf8> enable.
1789Instead of them, you use C<JSON> module object with C<utf8> disable.
1790Note that the resulted text is a UNICODE string but no problem to print it.
1791
1792  # $perl_scalar contains $encoding encoded string values
1793  $unicode_json_text = $json->utf8(0)->encode( $perl_scalar );
1794  # $unicode_json_text consists of characters less than 0x100
1795  print $unicode_json_text;
1796
1797Or C<decode $encoding> all string values and C<encode_json>:
1798
1799  $perl_scalar->{ foo } = decode( $encoding, $perl_scalar->{ foo } );
1800  # ... do it to each string values, then encode_json
1801  $json_text = encode_json( $perl_scalar );
1802
1803This method is a proper way but probably not efficient.
1804
1805See to L<Encode>, L<perluniintro>.
1806
1807
1808=head1 METHODS
1809
1810Basically, check to L<JSON> or L<JSON::XS>.
1811
1812=head2 new
1813
1814    $json = JSON::PP->new
1815
1816Rturns a new JSON::PP object that can be used to de/encode JSON
1817strings.
1818
1819All boolean flags described below are by default I<disabled>.
1820
1821The mutators for flags all return the JSON object again and thus calls can
1822be chained:
1823
1824   my $json = JSON::PP->new->utf8->space_after->encode({a => [1,2]})
1825   => {"a": [1, 2]}
1826
1827=head2 ascii
1828
1829    $json = $json->ascii([$enable])
1830
1831    $enabled = $json->get_ascii
1832
1833If $enable is true (or missing), then the encode method will not generate characters outside
1834the code range 0..127. Any Unicode characters outside that range will be escaped using either
1835a single \uXXXX or a double \uHHHH\uLLLLL escape sequence, as per RFC4627.
1836(See to L<JSON::XS/OBJECT-ORIENTED INTERFACE>).
1837
1838In Perl 5.005, there is no character having high value (more than 255).
1839See to L<UNICODE HANDLING ON PERLS>.
1840
1841If $enable is false, then the encode method will not escape Unicode characters unless
1842required by the JSON syntax or other flags. This results in a faster and more compact format.
1843
1844  JSON::PP->new->ascii(1)->encode([chr 0x10401])
1845  => ["\ud801\udc01"]
1846
1847=head2 latin1
1848
1849    $json = $json->latin1([$enable])
1850
1851    $enabled = $json->get_latin1
1852
1853If $enable is true (or missing), then the encode method will encode the resulting JSON
1854text as latin1 (or iso-8859-1), escaping any characters outside the code range 0..255.
1855
1856If $enable is false, then the encode method will not escape Unicode characters
1857unless required by the JSON syntax or other flags.
1858
1859  JSON::XS->new->latin1->encode (["\x{89}\x{abc}"]
1860  => ["\x{89}\\u0abc"]    # (perl syntax, U+abc escaped, U+89 not)
1861
1862See to L<UNICODE HANDLING ON PERLS>.
1863
1864=head2 utf8
1865
1866    $json = $json->utf8([$enable])
1867
1868    $enabled = $json->get_utf8
1869
1870If $enable is true (or missing), then the encode method will encode the JSON result
1871into UTF-8, as required by many protocols, while the decode method expects to be handled
1872an UTF-8-encoded string. Please note that UTF-8-encoded strings do not contain any
1873characters outside the range 0..255, they are thus useful for bytewise/binary I/O.
1874
1875(In Perl 5.005, any character outside the range 0..255 does not exist.
1876See to L<UNICODE HANDLING ON PERLS>.)
1877
1878In future versions, enabling this option might enable autodetection of the UTF-16 and UTF-32
1879encoding families, as described in RFC4627.
1880
1881If $enable is false, then the encode method will return the JSON string as a (non-encoded)
1882Unicode string, while decode expects thus a Unicode string. Any decoding or encoding
1883(e.g. to UTF-8 or UTF-16) needs to be done yourself, e.g. using the Encode module.
1884
1885Example, output UTF-16BE-encoded JSON:
1886
1887  use Encode;
1888  $jsontext = encode "UTF-16BE", JSON::PP->new->encode ($object);
1889
1890Example, decode UTF-32LE-encoded JSON:
1891
1892  use Encode;
1893  $object = JSON::PP->new->decode (decode "UTF-32LE", $jsontext);
1894
1895
1896=head2 pretty
1897
1898    $json = $json->pretty([$enable])
1899
1900This enables (or disables) all of the C<indent>, C<space_before> and
1901C<space_after> flags in one call to generate the most readable
1902(or most compact) form possible.
1903
1904Equivalent to:
1905
1906   $json->indent->space_before->space_after
1907
1908=head2 indent
1909
1910    $json = $json->indent([$enable])
1911
1912    $enabled = $json->get_indent
1913
1914The default indent space length is three.
1915You can use C<indent_length> to change the length.
1916
1917=head2 space_before
1918
1919    $json = $json->space_before([$enable])
1920
1921    $enabled = $json->get_space_before
1922
1923If C<$enable> is true (or missing), then the C<encode> method will add an extra
1924optional space before the C<:> separating keys from values in JSON objects.
1925
1926If C<$enable> is false, then the C<encode> method will not add any extra
1927space at those places.
1928
1929This setting has no effect when decoding JSON texts.
1930
1931Example, space_before enabled, space_after and indent disabled:
1932
1933   {"key" :"value"}
1934
1935=head2 space_after
1936
1937    $json = $json->space_after([$enable])
1938
1939    $enabled = $json->get_space_after
1940
1941If C<$enable> is true (or missing), then the C<encode> method will add an extra
1942optional space after the C<:> separating keys from values in JSON objects
1943and extra whitespace after the C<,> separating key-value pairs and array
1944members.
1945
1946If C<$enable> is false, then the C<encode> method will not add any extra
1947space at those places.
1948
1949This setting has no effect when decoding JSON texts.
1950
1951Example, space_before and indent disabled, space_after enabled:
1952
1953   {"key": "value"}
1954
1955=head2 relaxed
1956
1957    $json = $json->relaxed([$enable])
1958
1959    $enabled = $json->get_relaxed
1960
1961If C<$enable> is true (or missing), then C<decode> will accept some
1962extensions to normal JSON syntax (see below). C<encode> will not be
1963affected in anyway. I<Be aware that this option makes you accept invalid
1964JSON texts as if they were valid!>. I suggest only to use this option to
1965parse application-specific files written by humans (configuration files,
1966resource files etc.)
1967
1968If C<$enable> is false (the default), then C<decode> will only accept
1969valid JSON texts.
1970
1971Currently accepted extensions are:
1972
1973=over 4
1974
1975=item * list items can have an end-comma
1976
1977JSON I<separates> array elements and key-value pairs with commas. This
1978can be annoying if you write JSON texts manually and want to be able to
1979quickly append elements, so this extension accepts comma at the end of
1980such items not just between them:
1981
1982   [
1983      1,
1984      2, <- this comma not normally allowed
1985   ]
1986   {
1987      "k1": "v1",
1988      "k2": "v2", <- this comma not normally allowed
1989   }
1990
1991=item * shell-style '#'-comments
1992
1993Whenever JSON allows whitespace, shell-style comments are additionally
1994allowed. They are terminated by the first carriage-return or line-feed
1995character, after which more white-space and comments are allowed.
1996
1997  [
1998     1, # this comment not allowed in JSON
1999        # neither this one...
2000  ]
2001
2002=back
2003
2004=head2 canonical
2005
2006    $json = $json->canonical([$enable])
2007
2008    $enabled = $json->get_canonical
2009
2010If C<$enable> is true (or missing), then the C<encode> method will output JSON objects
2011by sorting their keys. This is adding a comparatively high overhead.
2012
2013If C<$enable> is false, then the C<encode> method will output key-value
2014pairs in the order Perl stores them (which will likely change between runs
2015of the same script).
2016
2017This option is useful if you want the same data structure to be encoded as
2018the same JSON text (given the same overall settings). If it is disabled,
2019the same hash might be encoded differently even if contains the same data,
2020as key-value pairs have no inherent ordering in Perl.
2021
2022This setting has no effect when decoding JSON texts.
2023
2024If you want your own sorting routine, you can give a code referece
2025or a subroutine name to C<sort_by>. See to C<JSON::PP OWN METHODS>.
2026
2027=head2 allow_nonref
2028
2029    $json = $json->allow_nonref([$enable])
2030
2031    $enabled = $json->get_allow_nonref
2032
2033If C<$enable> is true (or missing), then the C<encode> method can convert a
2034non-reference into its corresponding string, number or null JSON value,
2035which is an extension to RFC4627. Likewise, C<decode> will accept those JSON
2036values instead of croaking.
2037
2038If C<$enable> is false, then the C<encode> method will croak if it isn't
2039passed an arrayref or hashref, as JSON texts must either be an object
2040or array. Likewise, C<decode> will croak if given something that is not a
2041JSON object or array.
2042
2043   JSON::PP->new->allow_nonref->encode ("Hello, World!")
2044   => "Hello, World!"
2045
2046=head2 allow_unknown
2047
2048    $json = $json->allow_unknown ([$enable])
2049
2050    $enabled = $json->get_allow_unknown
2051
2052If $enable is true (or missing), then "encode" will *not* throw an
2053exception when it encounters values it cannot represent in JSON (for
2054example, filehandles) but instead will encode a JSON "null" value.
2055Note that blessed objects are not included here and are handled
2056separately by c<allow_nonref>.
2057
2058If $enable is false (the default), then "encode" will throw an
2059exception when it encounters anything it cannot encode as JSON.
2060
2061This option does not affect "decode" in any way, and it is
2062recommended to leave it off unless you know your communications
2063partner.
2064
2065=head2 allow_blessed
2066
2067    $json = $json->allow_blessed([$enable])
2068
2069    $enabled = $json->get_allow_blessed
2070
2071If C<$enable> is true (or missing), then the C<encode> method will not
2072barf when it encounters a blessed reference. Instead, the value of the
2073B<convert_blessed> option will decide whether C<null> (C<convert_blessed>
2074disabled or no C<TO_JSON> method found) or a representation of the
2075object (C<convert_blessed> enabled and C<TO_JSON> method found) is being
2076encoded. Has no effect on C<decode>.
2077
2078If C<$enable> is false (the default), then C<encode> will throw an
2079exception when it encounters a blessed object.
2080
2081=head2 convert_blessed
2082
2083    $json = $json->convert_blessed([$enable])
2084
2085    $enabled = $json->get_convert_blessed
2086
2087If C<$enable> is true (or missing), then C<encode>, upon encountering a
2088blessed object, will check for the availability of the C<TO_JSON> method
2089on the object's class. If found, it will be called in scalar context
2090and the resulting scalar will be encoded instead of the object. If no
2091C<TO_JSON> method is found, the value of C<allow_blessed> will decide what
2092to do.
2093
2094The C<TO_JSON> method may safely call die if it wants. If C<TO_JSON>
2095returns other blessed objects, those will be handled in the same
2096way. C<TO_JSON> must take care of not causing an endless recursion cycle
2097(== crash) in this case. The name of C<TO_JSON> was chosen because other
2098methods called by the Perl core (== not by the user of the object) are
2099usually in upper case letters and to avoid collisions with the C<to_json>
2100function or method.
2101
2102This setting does not yet influence C<decode> in any way.
2103
2104If C<$enable> is false, then the C<allow_blessed> setting will decide what
2105to do when a blessed object is found.
2106
2107=head2 filter_json_object
2108
2109    $json = $json->filter_json_object([$coderef])
2110
2111When C<$coderef> is specified, it will be called from C<decode> each
2112time it decodes a JSON object. The only argument passed to the coderef
2113is a reference to the newly-created hash. If the code references returns
2114a single scalar (which need not be a reference), this value
2115(i.e. a copy of that scalar to avoid aliasing) is inserted into the
2116deserialised data structure. If it returns an empty list
2117(NOTE: I<not> C<undef>, which is a valid scalar), the original deserialised
2118hash will be inserted. This setting can slow down decoding considerably.
2119
2120When C<$coderef> is omitted or undefined, any existing callback will
2121be removed and C<decode> will not change the deserialised hash in any
2122way.
2123
2124Example, convert all JSON objects into the integer 5:
2125
2126   my $js = JSON::PP->new->filter_json_object (sub { 5 });
2127   # returns [5]
2128   $js->decode ('[{}]'); # the given subroutine takes a hash reference.
2129   # throw an exception because allow_nonref is not enabled
2130   # so a lone 5 is not allowed.
2131   $js->decode ('{"a":1, "b":2}');
2132
2133=head2 filter_json_single_key_object
2134
2135    $json = $json->filter_json_single_key_object($key [=> $coderef])
2136
2137Works remotely similar to C<filter_json_object>, but is only called for
2138JSON objects having a single key named C<$key>.
2139
2140This C<$coderef> is called before the one specified via
2141C<filter_json_object>, if any. It gets passed the single value in the JSON
2142object. If it returns a single value, it will be inserted into the data
2143structure. If it returns nothing (not even C<undef> but the empty list),
2144the callback from C<filter_json_object> will be called next, as if no
2145single-key callback were specified.
2146
2147If C<$coderef> is omitted or undefined, the corresponding callback will be
2148disabled. There can only ever be one callback for a given key.
2149
2150As this callback gets called less often then the C<filter_json_object>
2151one, decoding speed will not usually suffer as much. Therefore, single-key
2152objects make excellent targets to serialise Perl objects into, especially
2153as single-key JSON objects are as close to the type-tagged value concept
2154as JSON gets (it's basically an ID/VALUE tuple). Of course, JSON does not
2155support this in any way, so you need to make sure your data never looks
2156like a serialised Perl hash.
2157
2158Typical names for the single object key are C<__class_whatever__>, or
2159C<$__dollars_are_rarely_used__$> or C<}ugly_brace_placement>, or even
2160things like C<__class_md5sum(classname)__>, to reduce the risk of clashing
2161with real hashes.
2162
2163Example, decode JSON objects of the form C<< { "__widget__" => <id> } >>
2164into the corresponding C<< $WIDGET{<id>} >> object:
2165
2166   # return whatever is in $WIDGET{5}:
2167   JSON::PP
2168      ->new
2169      ->filter_json_single_key_object (__widget__ => sub {
2170            $WIDGET{ $_[0] }
2171         })
2172      ->decode ('{"__widget__": 5')
2173
2174   # this can be used with a TO_JSON method in some "widget" class
2175   # for serialisation to json:
2176   sub WidgetBase::TO_JSON {
2177      my ($self) = @_;
2178
2179      unless ($self->{id}) {
2180         $self->{id} = ..get..some..id..;
2181         $WIDGET{$self->{id}} = $self;
2182      }
2183
2184      { __widget__ => $self->{id} }
2185   }
2186
2187=head2 shrink
2188
2189    $json = $json->shrink([$enable])
2190
2191    $enabled = $json->get_shrink
2192
2193In JSON::XS, this flag resizes strings generated by either
2194C<encode> or C<decode> to their minimum size possible.
2195It will also try to downgrade any strings to octet-form if possible.
2196
2197In JSON::PP, it is noop about resizing strings but tries
2198C<utf8::downgrade> to the returned string by C<encode>.
2199See to L<utf8>.
2200
2201See to L<JSON::XS/OBJECT-ORIENTED INTERFACE>
2202
2203=head2 max_depth
2204
2205    $json = $json->max_depth([$maximum_nesting_depth])
2206
2207    $max_depth = $json->get_max_depth
2208
2209Sets the maximum nesting level (default C<512>) accepted while encoding
2210or decoding. If a higher nesting level is detected in JSON text or a Perl
2211data structure, then the encoder and decoder will stop and croak at that
2212point.
2213
2214Nesting level is defined by number of hash- or arrayrefs that the encoder
2215needs to traverse to reach a given point or the number of C<{> or C<[>
2216characters without their matching closing parenthesis crossed to reach a
2217given character in a string.
2218
2219If no argument is given, the highest possible setting will be used, which
2220is rarely useful.
2221
2222See L<JSON::XS/SSECURITY CONSIDERATIONS> for more info on why this is useful.
2223
2224When a large value (100 or more) was set and it de/encodes a deep nested object/text,
2225it may raise a warning 'Deep recursion on subroutin' at the perl runtime phase.
2226
2227=head2 max_size
2228
2229    $json = $json->max_size([$maximum_string_size])
2230
2231    $max_size = $json->get_max_size
2232
2233Set the maximum length a JSON text may have (in bytes) where decoding is
2234being attempted. The default is C<0>, meaning no limit. When C<decode>
2235is called on a string that is longer then this many bytes, it will not
2236attempt to decode the string but throw an exception. This setting has no
2237effect on C<encode> (yet).
2238
2239If no argument is given, the limit check will be deactivated (same as when
2240C<0> is specified).
2241
2242See L<JSON::XS/SSECURITY CONSIDERATIONS> for more info on why this is useful.
2243
2244=head2 encode
2245
2246    $json_text = $json->encode($perl_scalar)
2247
2248Converts the given Perl data structure (a simple scalar or a reference
2249to a hash or array) to its JSON representation. Simple scalars will be
2250converted into JSON string or number sequences, while references to arrays
2251become JSON arrays and references to hashes become JSON objects. Undefined
2252Perl values (e.g. C<undef>) become JSON C<null> values.
2253References to the integers C<0> and C<1> are converted into C<true> and C<false>.
2254
2255=head2 decode
2256
2257    $perl_scalar = $json->decode($json_text)
2258
2259The opposite of C<encode>: expects a JSON text and tries to parse it,
2260returning the resulting simple scalar or reference. Croaks on error.
2261
2262JSON numbers and strings become simple Perl scalars. JSON arrays become
2263Perl arrayrefs and JSON objects become Perl hashrefs. C<true> becomes
2264C<1> (C<JSON::true>), C<false> becomes C<0> (C<JSON::false>) and
2265C<null> becomes C<undef>.
2266
2267=head2 decode_prefix
2268
2269    ($perl_scalar, $characters) = $json->decode_prefix($json_text)
2270
2271This works like the C<decode> method, but instead of raising an exception
2272when there is trailing garbage after the first JSON object, it will
2273silently stop parsing there and return the number of characters consumed
2274so far.
2275
2276   JSON->new->decode_prefix ("[1] the tail")
2277   => ([], 3)
2278
2279=head1 INCREMENTAL PARSING
2280
2281Most of this section are copied and modified from L<JSON::XS/INCREMENTAL PARSING>.
2282
2283In some cases, there is the need for incremental parsing of JSON texts.
2284This module does allow you to parse a JSON stream incrementally.
2285It does so by accumulating text until it has a full JSON object, which
2286it then can decode. This process is similar to using C<decode_prefix>
2287to see if a full JSON object is available, but is much more efficient
2288(and can be implemented with a minimum of method calls).
2289
2290This module will only attempt to parse the JSON text once it is sure it
2291has enough text to get a decisive result, using a very simple but
2292truly incremental parser. This means that it sometimes won't stop as
2293early as the full parser, for example, it doesn't detect parenthese
2294mismatches. The only thing it guarantees is that it starts decoding as
2295soon as a syntactically valid JSON text has been seen. This means you need
2296to set resource limits (e.g. C<max_size>) to ensure the parser will stop
2297parsing in the presence if syntax errors.
2298
2299The following methods implement this incremental parser.
2300
2301=head2 incr_parse
2302
2303    $json->incr_parse( [$string] ) # void context
2304
2305    $obj_or_undef = $json->incr_parse( [$string] ) # scalar context
2306
2307    @obj_or_empty = $json->incr_parse( [$string] ) # list context
2308
2309This is the central parsing function. It can both append new text and
2310extract objects from the stream accumulated so far (both of these
2311functions are optional).
2312
2313If C<$string> is given, then this string is appended to the already
2314existing JSON fragment stored in the C<$json> object.
2315
2316After that, if the function is called in void context, it will simply
2317return without doing anything further. This can be used to add more text
2318in as many chunks as you want.
2319
2320If the method is called in scalar context, then it will try to extract
2321exactly I<one> JSON object. If that is successful, it will return this
2322object, otherwise it will return C<undef>. If there is a parse error,
2323this method will croak just as C<decode> would do (one can then use
2324C<incr_skip> to skip the errornous part). This is the most common way of
2325using the method.
2326
2327And finally, in list context, it will try to extract as many objects
2328from the stream as it can find and return them, or the empty list
2329otherwise. For this to work, there must be no separators between the JSON
2330objects or arrays, instead they must be concatenated back-to-back. If
2331an error occurs, an exception will be raised as in the scalar context
2332case. Note that in this case, any previously-parsed JSON texts will be
2333lost.
2334
2335Example: Parse some JSON arrays/objects in a given string and return them.
2336
2337    my @objs = JSON->new->incr_parse ("[5][7][1,2]");
2338
2339=head2 incr_text
2340
2341    $lvalue_string = $json->incr_text
2342
2343This method returns the currently stored JSON fragment as an lvalue, that
2344is, you can manipulate it. This I<only> works when a preceding call to
2345C<incr_parse> in I<scalar context> successfully returned an object. Under
2346all other circumstances you must not call this function (I mean it.
2347although in simple tests it might actually work, it I<will> fail under
2348real world conditions). As a special exception, you can also call this
2349method before having parsed anything.
2350
2351This function is useful in two cases: a) finding the trailing text after a
2352JSON object or b) parsing multiple JSON objects separated by non-JSON text
2353(such as commas).
2354
2355    $json->incr_text =~ s/\s*,\s*//;
2356
2357In Perl 5.005, C<lvalue> attribute is not available.
2358You must write codes like the below:
2359
2360    $string = $json->incr_text;
2361    $string =~ s/\s*,\s*//;
2362    $json->incr_text( $string );
2363
2364=head2 incr_skip
2365
2366    $json->incr_skip
2367
2368This will reset the state of the incremental parser and will remove the
2369parsed text from the input buffer. This is useful after C<incr_parse>
2370died, in which case the input buffer and incremental parser state is left
2371unchanged, to skip the text parsed so far and to reset the parse state.
2372
2373=head2 incr_reset
2374
2375    $json->incr_reset
2376
2377This completely resets the incremental parser, that is, after this call,
2378it will be as if the parser had never parsed anything.
2379
2380This is useful if you want ot repeatedly parse JSON objects and want to
2381ignore any trailing data, which means you have to reset the parser after
2382each successful decode.
2383
2384See to L<JSON::XS/INCREMENTAL PARSING> for examples.
2385
2386
2387=head1 JSON::PP OWN METHODS
2388
2389=head2 allow_singlequote
2390
2391    $json = $json->allow_singlequote([$enable])
2392
2393If C<$enable> is true (or missing), then C<decode> will accept
2394JSON strings quoted by single quotations that are invalid JSON
2395format.
2396
2397    $json->allow_singlequote->decode({"foo":'bar'});
2398    $json->allow_singlequote->decode({'foo':"bar"});
2399    $json->allow_singlequote->decode({'foo':'bar'});
2400
2401As same as the C<relaxed> option, this option may be used to parse
2402application-specific files written by humans.
2403
2404
2405=head2 allow_barekey
2406
2407    $json = $json->allow_barekey([$enable])
2408
2409If C<$enable> is true (or missing), then C<decode> will accept
2410bare keys of JSON object that are invalid JSON format.
2411
2412As same as the C<relaxed> option, this option may be used to parse
2413application-specific files written by humans.
2414
2415    $json->allow_barekey->decode('{foo:"bar"}');
2416
2417=head2 allow_bignum
2418
2419    $json = $json->allow_bignum([$enable])
2420
2421If C<$enable> is true (or missing), then C<decode> will convert
2422the big integer Perl cannot handle as integer into a L<Math::BigInt>
2423object and convert a floating number (any) into a L<Math::BigFloat>.
2424
2425On the contary, C<encode> converts C<Math::BigInt> objects and C<Math::BigFloat>
2426objects into JSON numbers with C<allow_blessed> enable.
2427
2428   $json->allow_nonref->allow_blessed->allow_bignum;
2429   $bigfloat = $json->decode('2.000000000000000000000000001');
2430   print $json->encode($bigfloat);
2431   # => 2.000000000000000000000000001
2432
2433See to L<JSON::XS/MAPPING> aboout the normal conversion of JSON number.
2434
2435=head2 loose
2436
2437    $json = $json->loose([$enable])
2438
2439The unescaped [\x00-\x1f\x22\x2f\x5c] strings are invalid in JSON strings
2440and the module doesn't allow to C<decode> to these (except for \x2f).
2441If C<$enable> is true (or missing), then C<decode>  will accept these
2442unescaped strings.
2443
2444    $json->loose->decode(qq|["abc
2445                                   def"]|);
2446
2447See L<JSON::XS/SSECURITY CONSIDERATIONS>.
2448
2449=head2 escape_slash
2450
2451    $json = $json->escape_slash([$enable])
2452
2453According to JSON Grammar, I<slash> (U+002F) is escaped. But default
2454JSON::PP (as same as JSON::XS) encodes strings without escaping slash.
2455
2456If C<$enable> is true (or missing), then C<encode> will escape slashes.
2457
2458=head2 indent_length
2459
2460    $json = $json->indent_length($length)
2461
2462JSON::XS indent space length is 3 and cannot be changed.
2463JSON::PP set the indent space length with the given $length.
2464The default is 3. The acceptable range is 0 to 15.
2465
2466=head2 sort_by
2467
2468    $json = $json->sort_by($function_name)
2469    $json = $json->sort_by($subroutine_ref)
2470
2471If $function_name or $subroutine_ref are set, its sort routine are used
2472in encoding JSON objects.
2473
2474   $js = $pc->sort_by(sub { $JSON::PP::a cmp $JSON::PP::b })->encode($obj);
2475   # is($js, q|{"a":1,"b":2,"c":3,"d":4,"e":5,"f":6,"g":7,"h":8,"i":9}|);
2476
2477   $js = $pc->sort_by('own_sort')->encode($obj);
2478   # is($js, q|{"a":1,"b":2,"c":3,"d":4,"e":5,"f":6,"g":7,"h":8,"i":9}|);
2479
2480   sub JSON::PP::own_sort { $JSON::PP::a cmp $JSON::PP::b }
2481
2482As the sorting routine runs in the JSON::PP scope, the given
2483subroutine name and the special variables C<$a>, C<$b> will begin
2484'JSON::PP::'.
2485
2486If $integer is set, then the effect is same as C<canonical> on.
2487
2488=head1 INTERNAL
2489
2490For developers.
2491
2492=over
2493
2494=item PP_encode_box
2495
2496Returns
2497
2498        {
2499            depth        => $depth,
2500            indent_count => $indent_count,
2501        }
2502
2503
2504=item PP_decode_box
2505
2506Returns
2507
2508        {
2509            text    => $text,
2510            at      => $at,
2511            ch      => $ch,
2512            len     => $len,
2513            depth   => $depth,
2514            encoding      => $encoding,
2515            is_valid_utf8 => $is_valid_utf8,
2516        };
2517
2518=back
2519
2520=head1 MAPPING
2521
2522This section is copied from JSON::XS and modified to C<JSON::PP>.
2523JSON::XS and JSON::PP mapping mechanisms are almost equivalent.
2524
2525See to L<JSON::XS/MAPPING>.
2526
2527=head2 JSON -> PERL
2528
2529=over 4
2530
2531=item object
2532
2533A JSON object becomes a reference to a hash in Perl. No ordering of object
2534keys is preserved (JSON does not preserver object key ordering itself).
2535
2536=item array
2537
2538A JSON array becomes a reference to an array in Perl.
2539
2540=item string
2541
2542A JSON string becomes a string scalar in Perl - Unicode codepoints in JSON
2543are represented by the same codepoints in the Perl string, so no manual
2544decoding is necessary.
2545
2546=item number
2547
2548A JSON number becomes either an integer, numeric (floating point) or
2549string scalar in perl, depending on its range and any fractional parts. On
2550the Perl level, there is no difference between those as Perl handles all
2551the conversion details, but an integer may take slightly less memory and
2552might represent more values exactly than floating point numbers.
2553
2554If the number consists of digits only, C<JSON> will try to represent
2555it as an integer value. If that fails, it will try to represent it as
2556a numeric (floating point) value if that is possible without loss of
2557precision. Otherwise it will preserve the number as a string value (in
2558which case you lose roundtripping ability, as the JSON number will be
2559re-encoded toa JSON string).
2560
2561Numbers containing a fractional or exponential part will always be
2562represented as numeric (floating point) values, possibly at a loss of
2563precision (in which case you might lose perfect roundtripping ability, but
2564the JSON number will still be re-encoded as a JSON number).
2565
2566Note that precision is not accuracy - binary floating point values cannot
2567represent most decimal fractions exactly, and when converting from and to
2568floating point, C<JSON> only guarantees precision up to but not including
2569the leats significant bit.
2570
2571When C<allow_bignum> is enable, the big integers
2572and the numeric can be optionally converted into L<Math::BigInt> and
2573L<Math::BigFloat> objects.
2574
2575=item true, false
2576
2577These JSON atoms become C<JSON::PP::true> and C<JSON::PP::false>,
2578respectively. They are overloaded to act almost exactly like the numbers
2579C<1> and C<0>. You can check wether a scalar is a JSON boolean by using
2580the C<JSON::is_bool> function.
2581
2582   print JSON::PP::true . "\n";
2583    => true
2584   print JSON::PP::true + 1;
2585    => 1
2586
2587   ok(JSON::true eq  '1');
2588   ok(JSON::true == 1);
2589
2590C<JSON> will install these missing overloading features to the backend modules.
2591
2592
2593=item null
2594
2595A JSON null atom becomes C<undef> in Perl.
2596
2597C<JSON::PP::null> returns C<unddef>.
2598
2599=back
2600
2601
2602=head2 PERL -> JSON
2603
2604The mapping from Perl to JSON is slightly more difficult, as Perl is a
2605truly typeless language, so we can only guess which JSON type is meant by
2606a Perl value.
2607
2608=over 4
2609
2610=item hash references
2611
2612Perl hash references become JSON objects. As there is no inherent ordering
2613in hash keys (or JSON objects), they will usually be encoded in a
2614pseudo-random order that can change between runs of the same program but
2615stays generally the same within a single run of a program. C<JSON>
2616optionally sort the hash keys (determined by the I<canonical> flag), so
2617the same datastructure will serialise to the same JSON text (given same
2618settings and version of JSON::XS), but this incurs a runtime overhead
2619and is only rarely useful, e.g. when you want to compare some JSON text
2620against another for equality.
2621
2622
2623=item array references
2624
2625Perl array references become JSON arrays.
2626
2627=item other references
2628
2629Other unblessed references are generally not allowed and will cause an
2630exception to be thrown, except for references to the integers C<0> and
2631C<1>, which get turned into C<false> and C<true> atoms in JSON. You can
2632also use C<JSON::false> and C<JSON::true> to improve readability.
2633
2634   to_json [\0,JSON::PP::true]      # yields [false,true]
2635
2636=item JSON::PP::true, JSON::PP::false, JSON::PP::null
2637
2638These special values become JSON true and JSON false values,
2639respectively. You can also use C<\1> and C<\0> directly if you want.
2640
2641JSON::PP::null returns C<undef>.
2642
2643=item blessed objects
2644
2645Blessed objects are not directly representable in JSON. See the
2646C<allow_blessed> and C<convert_blessed> methods on various options on
2647how to deal with this: basically, you can choose between throwing an
2648exception, encoding the reference as if it weren't blessed, or provide
2649your own serialiser method.
2650
2651See to L<convert_blessed>.
2652
2653=item simple scalars
2654
2655Simple Perl scalars (any scalar that is not a reference) are the most
2656difficult objects to encode: JSON::XS and JSON::PP will encode undefined scalars as
2657JSON C<null> values, scalars that have last been used in a string context
2658before encoding as JSON strings, and anything else as number value:
2659
2660   # dump as number
2661   encode_json [2]                      # yields [2]
2662   encode_json [-3.0e17]                # yields [-3e+17]
2663   my $value = 5; encode_json [$value]  # yields [5]
2664
2665   # used as string, so dump as string
2666   print $value;
2667   encode_json [$value]                 # yields ["5"]
2668
2669   # undef becomes null
2670   encode_json [undef]                  # yields [null]
2671
2672You can force the type to be a string by stringifying it:
2673
2674   my $x = 3.1; # some variable containing a number
2675   "$x";        # stringified
2676   $x .= "";    # another, more awkward way to stringify
2677   print $x;    # perl does it for you, too, quite often
2678
2679You can force the type to be a number by numifying it:
2680
2681   my $x = "3"; # some variable containing a string
2682   $x += 0;     # numify it, ensuring it will be dumped as a number
2683   $x *= 1;     # same thing, the choise is yours.
2684
2685You can not currently force the type in other, less obscure, ways.
2686
2687Note that numerical precision has the same meaning as under Perl (so
2688binary to decimal conversion follows the same rules as in Perl, which
2689can differ to other languages). Also, your perl interpreter might expose
2690extensions to the floating point numbers of your platform, such as
2691infinities or NaN's - these cannot be represented in JSON, and it is an
2692error to pass those in.
2693
2694=item Big Number
2695
2696When C<allow_bignum> is enable,
2697C<encode> converts C<Math::BigInt> objects and C<Math::BigFloat>
2698objects into JSON numbers.
2699
2700
2701=back
2702
2703=head1 UNICODE HANDLING ON PERLS
2704
2705If you do not know about Unicode on Perl well,
2706please check L<JSON::XS/A FEW NOTES ON UNICODE AND PERL>.
2707
2708=head2 Perl 5.8 and later
2709
2710Perl can handle Unicode and the JSON::PP de/encode methods also work properly.
2711
2712    $json->allow_nonref->encode(chr hex 3042);
2713    $json->allow_nonref->encode(chr hex 12345);
2714
2715Reuturns C<"\u3042"> and C<"\ud808\udf45"> respectively.
2716
2717    $json->allow_nonref->decode('"\u3042"');
2718    $json->allow_nonref->decode('"\ud808\udf45"');
2719
2720Returns UTF-8 encoded strings with UTF8 flag, regarded as C<U+3042> and C<U+12345>.
2721
2722Note that the versions from Perl 5.8.0 to 5.8.2, Perl built-in C<join> was broken,
2723so JSON::PP wraps the C<join> with a subroutine. Thus JSON::PP works slow in the versions.
2724
2725
2726=head2 Perl 5.6
2727
2728Perl can handle Unicode and the JSON::PP de/encode methods also work.
2729
2730=head2 Perl 5.005
2731
2732Perl 5.005 is a byte sementics world -- all strings are sequences of bytes.
2733That means the unicode handling is not available.
2734
2735In encoding,
2736
2737    $json->allow_nonref->encode(chr hex 3042);  # hex 3042 is 12354.
2738    $json->allow_nonref->encode(chr hex 12345); # hex 12345 is 74565.
2739
2740Returns C<B> and C<E>, as C<chr> takes a value more than 255, it treats
2741as C<$value % 256>, so the above codes are equivalent to :
2742
2743    $json->allow_nonref->encode(chr 66);
2744    $json->allow_nonref->encode(chr 69);
2745
2746In decoding,
2747
2748    $json->decode('"\u00e3\u0081\u0082"');
2749
2750The returned is a byte sequence C<0xE3 0x81 0x82> for UTF-8 encoded
2751japanese character (C<HIRAGANA LETTER A>).
2752And if it is represented in Unicode code point, C<U+3042>.
2753
2754Next,
2755
2756    $json->decode('"\u3042"');
2757
2758We ordinary expect the returned value is a Unicode character C<U+3042>.
2759But here is 5.005 world. This is C<0xE3 0x81 0x82>.
2760
2761    $json->decode('"\ud808\udf45"');
2762
2763This is not a character C<U+12345> but bytes - C<0xf0 0x92 0x8d 0x85>.
2764
2765
2766=head1 TODO
2767
2768=over
2769
2770=item speed
2771
2772=item memory saving
2773
2774=back
2775
2776
2777=head1 SEE ALSO
2778
2779Most of the document are copied and modified from JSON::XS doc.
2780
2781L<JSON::XS>
2782
2783RFC4627 (L<http://www.ietf.org/rfc/rfc4627.txt>)
2784
2785=head1 AUTHOR
2786
2787Makamaka Hannyaharamitu, E<lt>makamaka[at]cpan.orgE<gt>
2788
2789
2790=head1 COPYRIGHT AND LICENSE
2791
2792Copyright 2007-2011 by Makamaka Hannyaharamitu
2793
2794This library is free software; you can redistribute it and/or modify
2795it under the same terms as Perl itself.
2796
2797=cut
2798