package Mojo::JSON; use Mojo::Base -base; use B; use Exporter 'import'; use Mojo::Util; use Scalar::Util 'blessed'; has 'error'; our @EXPORT_OK = ('j'); # Literal names my $FALSE = bless \(my $false = 0), 'Mojo::JSON::_Bool'; my $TRUE = bless \(my $true = 1), 'Mojo::JSON::_Bool'; # Escaped special character map (with u2028 and u2029) my %ESCAPE = ( '"' => '"', '\\' => '\\', '/' => '/', 'b' => "\x08", 'f' => "\x0c", 'n' => "\x0a", 'r' => "\x0d", 't' => "\x09", 'u2028' => "\x{2028}", 'u2029' => "\x{2029}" ); my %REVERSE = map { $ESCAPE{$_} => "\\$_" } keys %ESCAPE; for (0x00 .. 0x1f, 0x7f) { $REVERSE{pack 'C', $_} //= sprintf '\u%.4X', $_ } # Unicode encoding detection my $UTF_PATTERNS = { 'UTF-32BE' => qr/^\x00{3}[^\x00]/, 'UTF-32LE' => qr/^[^\x00]\x00{3}/, 'UTF-16BE' => qr/^(?:\x00[^\x00]){2}/, 'UTF-16LE' => qr/^(?:[^\x00]\x00){2}/ }; my $WHITESPACE_RE = qr/[\x20\x09\x0a\x0d]*/; sub decode { my ($self, $bytes) = @_; # Clean start $self->error(undef); # Missing input $self->error('Missing or empty input') and return undef unless $bytes; # Remove BOM $bytes =~ s/^(?:\357\273\277|\377\376\0\0|\0\0\376\377|\376\377|\377\376)//g; # Wide characters $self->error('Wide character in input') and return undef unless utf8::downgrade($bytes, 1); # Detect and decode Unicode my $encoding = 'UTF-8'; $bytes =~ $UTF_PATTERNS->{$_} and $encoding = $_ for keys %$UTF_PATTERNS; $bytes = Mojo::Util::decode $encoding, $bytes; # Object or array my $res = eval { local $_ = $bytes; # Leading whitespace m/\G$WHITESPACE_RE/gc; # Array my $ref; if (m/\G\[/gc) { $ref = _decode_array() } # Object elsif (m/\G\{/gc) { $ref = _decode_object() } # Invalid character else { _exception('Expected array or object') } # Leftover data unless (m/\G$WHITESPACE_RE\z/gc) { my $got = ref $ref eq 'ARRAY' ? 'array' : 'object'; _exception("Unexpected data after $got"); } $ref; }; # Exception if (!$res && (my $e = $@)) { chomp $e; $self->error($e); } return $res; } sub encode { my ($self, $ref) = @_; return Mojo::Util::encode 'UTF-8', _encode_value($ref); } sub false {$FALSE} sub j { my $d = shift; return __PACKAGE__->new->encode($d) if ref $d eq 'ARRAY' || ref $d eq 'HASH'; return __PACKAGE__->new->decode($d); } sub true {$TRUE} sub _decode_array { my @array; until (m/\G$WHITESPACE_RE\]/gc) { # Value push @array, _decode_value(); # Separator redo if m/\G$WHITESPACE_RE,/gc; # End last if m/\G$WHITESPACE_RE\]/gc; # Invalid character _exception('Expected comma or right square bracket while parsing array'); } return \@array; } sub _decode_object { my %hash; until (m/\G$WHITESPACE_RE\}/gc) { # Quote m/\G$WHITESPACE_RE"/gc or _exception('Expected string while parsing object'); # Key my $key = _decode_string(); # Colon m/\G$WHITESPACE_RE:/gc or _exception('Expected colon while parsing object'); # Value $hash{$key} = _decode_value(); # Separator redo if m/\G$WHITESPACE_RE,/gc; # End last if m/\G$WHITESPACE_RE\}/gc; # Invalid character _exception('Expected comma or right curly bracket while parsing object'); } return \%hash; } sub _decode_string { my $pos = pos; # Extract string with escaped characters m!\G((?:(?:[^\x00-\x1f\\"]|\\(?:["\\/bfnrt]|u[0-9a-fA-F]{4})){0,32766})*)!gc; my $str = $1; # Invalid character unless (m/\G"/gc) { _exception('Unexpected character or invalid escape while parsing string') if m/\G[\x00-\x1f\\]/; _exception('Unterminated string'); } # Unescape popular characters if (index($str, '\\u') < 0) { $str =~ s!\\(["\\/bfnrt])!$ESCAPE{$1}!gs; return $str; } # Unescape everything else my $buffer = ''; while ($str =~ m/\G([^\\]*)\\(?:([^u])|u(.{4}))/gc) { $buffer .= $1; # Popular character if ($2) { $buffer .= $ESCAPE{$2} } # Escaped else { my $ord = hex $3; # Surrogate pair if (($ord & 0xf800) == 0xd800) { # High surrogate ($ord & 0xfc00) == 0xd800 or pos($_) = $pos + pos($str), _exception('Missing high-surrogate'); # Low surrogate $str =~ m/\G\\u([Dd][C-Fc-f]..)/gc or pos($_) = $pos + pos($str), _exception('Missing low-surrogate'); $ord = 0x10000 + ($ord - 0xd800) * 0x400 + (hex($1) - 0xdc00); } # Character $buffer .= pack 'U', $ord; } } # The rest return $buffer . substr $str, pos($str), length($str); } sub _decode_value { # Leading whitespace m/\G$WHITESPACE_RE/gc; # String return _decode_string() if m/\G"/gc; # Array return _decode_array() if m/\G\[/gc; # Object return _decode_object() if m/\G\{/gc; # Number return 0 + $1 if m/\G([-]?(?:0|[1-9][0-9]*)(?:\.[0-9]*)?(?:[eE][+-]?[0-9]+)?)/gc; # True return $TRUE if m/\Gtrue/gc; # False return $FALSE if m/\Gfalse/gc; # Null return undef if m/\Gnull/gc; # Invalid character _exception('Expected string, array, object, number, boolean or null'); } sub _encode_array { my $array = shift; return '[' . join(',', map { _encode_value($_) } @$array) . ']'; } sub _encode_object { my $object = shift; my @pairs = map { _encode_string($_) . ':' . _encode_value($object->{$_}) } keys %$object; return '{' . join(',', @pairs) . '}'; } sub _encode_string { my $str = shift; $str =~ s!([\x00-\x1f\x7f\x{2028}\x{2029}\\"/\b\f\n\r\t])!$REVERSE{$1}!gs; return "\"$str\""; } sub _encode_value { my $value = shift; # Reference if (my $ref = ref $value) { # Array return _encode_array($value) if $ref eq 'ARRAY'; # Object return _encode_object($value) if $ref eq 'HASH'; # True or false return $$value ? 'true' : 'false' if $ref eq 'SCALAR'; return $value ? 'true' : 'false' if $ref eq 'Mojo::JSON::_Bool'; # Blessed reference with TO_JSON method if (blessed $value && (my $sub = $value->can('TO_JSON'))) { return _encode_value($value->$sub); } } # Null return 'null' unless defined $value; # Number my $flags = B::svref_2object(\$value)->FLAGS; return 0 + $value if $flags & (B::SVp_IOK | B::SVp_NOK) && $value * 0 == 0; # String return _encode_string($value); } sub _exception { # Leading whitespace m/\G$WHITESPACE_RE/gc; # Context my $context = 'Malformed JSON: ' . shift; if (m/\G\z/gc) { $context .= ' before end of data' } else { my @lines = split /\n/, substr($_, 0, pos); $context .= ' at line ' . @lines . ', offset ' . length(pop @lines || ''); } die "$context\n"; } # Emulate boolean type package Mojo::JSON::_Bool; use overload '0+' => sub { ${$_[0]} }, '""' => sub { ${$_[0]} }, fallback => 1; 1; =encoding utf8 =head1 NAME Mojo::JSON - Minimalistic JSON =head1 SYNOPSIS # Encode and decode JSON use Mojo::JSON; my $json = Mojo::JSON->new; my $bytes = $json->encode({foo => [1, 2], bar => 'hello!', baz => \1}); my $hash = $json->decode($bytes); # Check for errors my $json = Mojo::JSON->new; if (defined(my $hash = $json->decode($bytes))) { say $hash->{message} } else { say 'Error: ', $json->error } # Use the alternative interface use Mojo::JSON 'j'; my $bytes = j({foo => [1, 2], bar => 'hello!', baz => \1}); my $hash = j($bytes); =head1 DESCRIPTION L is a minimalistic and relaxed implementation of RFC 4627. While it is possibly the fastest pure-Perl JSON parser available, you should not use it for validation. It supports normal Perl data types like C, C reference, C reference and will try to call the C method on blessed references, or stringify them if it doesn't exist. Differentiating between strings and numbers in Perl is hard, depending on how it has been used, a C can be both at the same time. Since numeric comparisons on strings are very unlikely to happen intentionally, the numeric value always gets priority, so any C that has been used in numeric context is considered a number. [1, -2, 3] -> [1, -2, 3] {"foo": "bar"} -> {foo => 'bar'} Literal names will be translated to and from L constants or a similar native Perl value. true -> Mojo::JSON->true false -> Mojo::JSON->false null -> undef In addition C references will be used to generate booleans, based on if their values are true or false. \1 -> true \0 -> false Decoding UTF-16 (LE/BE) and UTF-32 (LE/BE) will be handled transparently, encoding will only generate UTF-8. The two Unicode whitespace characters C and C will always be escaped to make JSONP easier. =head1 FUNCTIONS L implements the following functions. =head2 j my $bytes = j([1, 2, 3]); my $bytes = j({foo => 'bar'}); my $array = j($bytes); my $hash = j($bytes); Encode Perl data structure or decode JSON and return C if decoding fails. =head1 ATTRIBUTES L implements the following attributes. =head2 error my $err = $json->error; $json = $json->error('Parser error'); Parser errors. =head1 METHODS L inherits all methods from L and implements the following new ones. =head2 decode my $array = $json->decode($bytes); my $hash = $json->decode($bytes); Decode JSON to Perl data structure and return C if decoding fails. =head2 encode my $bytes = $json->encode([1, 2, 3]); my $bytes = $json->encode({foo => 'bar'}); Encode Perl data structure to JSON. =head2 false my $false = Mojo::JSON->false; my $false = $json->false; False value, used because Perl has no native equivalent. =head2 true my $true = Mojo::JSON->true; my $true = $json->true; True value, used because Perl has no native equivalent. =head1 SEE ALSO L, L, L. =cut