2011-10-21 18:16:16 -07:00
|
|
|
%% The MIT License
|
|
|
|
|
|
|
|
%% Copyright (c) 2010 Alisdair Sullivan <alisdairsullivan@yahoo.ca>
|
|
|
|
|
|
|
|
%% Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
%% of this software and associated documentation files (the "Software"), to deal
|
|
|
|
%% in the Software without restriction, including without limitation the rights
|
|
|
|
%% to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
%% copies of the Software, and to permit persons to whom the Software is
|
|
|
|
%% furnished to do so, subject to the following conditions:
|
|
|
|
|
|
|
|
%% The above copyright notice and this permission notice shall be included in
|
|
|
|
%% all copies or substantial portions of the Software.
|
|
|
|
|
|
|
|
%% THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
%% IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
%% FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
%% AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
%% LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
%% OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
%% THE SOFTWARE.
|
|
|
|
|
|
|
|
|
|
|
|
-module(jsx_decoder).
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
-export([decoder/3]).
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
|
2012-01-31 20:56:08 -08:00
|
|
|
%% build a decoder: the returned fun takes a chunk of json and begins parsing
%% it at start/4 with an empty stack. Handler:init(State) and
%% jsx_utils:parse_opts(Opts) are evaluated each time the fun is invoked
-spec decoder(Handler::module(), State::any(), Opts::jsx:opts()) -> jsx:decoder().

decoder(Handler, State, Opts) ->
    fun(JSON) ->
        Callbacks = {Handler, Handler:init(State)},
        start(JSON, Callbacks, [], jsx_utils:parse_opts(Opts))
    end.
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
|
2012-03-06 19:59:49 -08:00
|
|
|
-include("jsx_opts.hrl").
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
|
2011-08-31 18:52:01 -07:00
|
|
|
%% byte values of the characters the decoder dispatches on, spelled as
%% character literals

%% whitespace
-define(space, $\s).
-define(tab, $\t).
-define(cr, $\r).
-define(newline, $\n).

%% object delimiters
-define(start_object, ${).
-define(end_object, $}).

%% array delimiters
-define(start_array, $[).
-define(end_array, $]).

%% kv separator, quotes and colon
-define(comma, $,).
-define(doublequote, $").
-define(singlequote, $').
-define(colon, $:).

%% string escape sequences
-define(escape, $\\).
-define(rsolidus, $\\).
-define(solidus, $/).
-define(formfeed, $\f).
-define(backspace, $\b).
-define(unicode, $u).

%% math
-define(zero, $0).
-define(decimalpoint, $.).
-define(negative, $-).
-define(positive, $+).

%% comments
-define(star, $*).
|
|
|
|
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
%% some useful guards
|
|
|
|
%% true when Symbol is an ascii hexadecimal digit: 0-9, a-f or A-F.
%% the letter ranges stop at f/F; anything past that is not a hex digit.
%% the body is a single parenthesized orelse expression so the macro can be
%% combined with other guard tests (`?is_hex(A), ?is_hex(B)`) without its
%% alternatives leaking into the surrounding guard
-define(is_hex(Symbol),
    ((Symbol >= $a andalso Symbol =< $f) orelse
     (Symbol >= $A andalso Symbol =< $F) orelse
     (Symbol >= $0 andalso Symbol =< $9))
).
|
|
|
|
|
|
|
|
%% true when Symbol is one of the ascii digits 1 through 9.
%% parenthesized (like is_noncontrol) so the expansion stays a single
%% expression when negated or combined with other operators
-define(is_nonzero(Symbol),
    (Symbol >= $1 andalso Symbol =< $9)
).
|
|
|
|
|
|
|
|
%% true when Symbol is not below the space character
-define(is_noncontrol(Symbol), (?space =< Symbol)).
|
|
|
|
|
|
|
|
%% true when Symbol is a space, tab, carriage return or newline.
%% written as one parenthesized orelse expression rather than `;` separated
%% guard alternatives, so `?is_whitespace(S), Other` applies Other to every
%% alternative instead of only the last one
-define(is_whitespace(Symbol),
    (Symbol =:= ?space orelse
     Symbol =:= ?tab orelse
     Symbol =:= ?cr orelse
     Symbol =:= ?newline)
).
|
|
|
|
|
|
|
|
|
|
|
|
%% error, incomplete and event macros
|
|
|
|
%% raise badarg, attaching Args to the exception. only defined when no error
%% macro is already in scope
-ifndef(error).
-define(error(Args), erlang:error(badarg, Args)).
-endif.
|
|
|
|
|
|
|
|
|
|
|
|
%% build the `{incomplete, Fun}` result returned when input runs out.
%% Fun accepts either:
%%   end_stream - re-enter State with a single space appended to Rest and
%%                explicit_end switched off; if that still yields incomplete
%%                raise ?error, otherwise return whatever State returned
%%   a binary   - re-enter State with the new bytes appended to Rest
%% only defined when no incomplete macro is already in scope
-ifndef(incomplete).
-define(incomplete(State, Rest, Handler, Stack, Opts),
    {incomplete,
        fun
            (end_stream) ->
                case State(<<Rest/binary, " ">>, Handler, Stack, Opts#opts{explicit_end = false}) of
                    {incomplete, _} -> ?error([Rest, Handler, Stack, Opts]);
                    Events -> Events
                end;
            (Stream) when is_binary(Stream) ->
                State(<<Rest/binary, Stream/binary>>, Handler, Stack, Opts)
        end
    }
).
-endif.
|
|
|
|
|
|
|
|
|
2011-11-02 01:11:58 -07:00
|
|
|
%% character accumulators. a sequence is a list kept in reverse order:
%% new_seq starts one (empty or holding C), acc_seq pushes one or two items
%% onto the front, end_seq reverses the list and converts it to a binary
-define(new_seq(), []).
-define(new_seq(C), [C]).

-define(acc_seq(Seq, C), [C | Seq]).
-define(acc_seq(Seq, C, D), [C, D | Seq]).

-define(end_seq(Seq), unicode:characters_to_binary(lists:reverse(Seq))).
|
2011-09-19 23:06:37 -07:00
|
|
|
|
|
|
|
|
2012-04-06 08:35:40 -07:00
|
|
|
%% deliver an event, or a list of events in order, to the handler.
%% the handler is a {Module, ModuleState} pair; each single event is passed
%% to Module:handle_event/2 and the pair is returned with the updated state.
%% an empty list returns the handler untouched
handle_event([], Current, _Opts) ->
    Current;
handle_event([First | Remaining], Current, Opts) ->
    Next = handle_event(First, Current, Opts),
    handle_event(Remaining, Next, Opts);
handle_event(Event, {Mod, ModState}, _Opts) ->
    {Mod, Mod:handle_event(Event, ModState)}.
|
|
|
|
|
|
|
|
|
2012-04-04 20:46:41 -07:00
|
|
|
%% entry state. a leading 16#EF byte is treated as the possible start of a
%% utf8 byte order mark and checked by maybe_bom/4; empty input yields an
%% incomplete result that resumes here; anything else is parsed as a value
start(<<16#EF, More/binary>>, Handler, Stack, Opts) ->
    maybe_bom(More, Handler, Stack, Opts);
start(<<>>, Handler, Stack, Opts) ->
    ?incomplete(start, <<>>, Handler, Stack, Opts);
start(Input, Handler, Stack, Opts) ->
    value(Input, Handler, Stack, Opts).
|
|
|
|
|
|
|
|
|
|
|
|
%% second byte of the byte order mark: 16#BB moves on to definitely_bom/4,
%% empty input is incomplete, any other byte is an error
maybe_bom(<<16#BB, More/binary>>, Handler, Stack, Opts) ->
    definitely_bom(More, Handler, Stack, Opts);
maybe_bom(<<>>, Handler, Stack, Opts) ->
    ?incomplete(maybe_bom, <<>>, Handler, Stack, Opts);
maybe_bom(Input, Handler, Stack, Opts) ->
    ?error([Input, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
|
|
|
%% third byte of the byte order mark: 16#BF completes it and parsing
%% continues with value/4, empty input is incomplete, any other byte is an
%% error
definitely_bom(<<16#BF, More/binary>>, Handler, Stack, Opts) ->
    value(More, Handler, Stack, Opts);
definitely_bom(<<>>, Handler, Stack, Opts) ->
    ?incomplete(definitely_bom, <<>>, Handler, Stack, Opts);
definitely_bom(Input, Handler, Stack, Opts) ->
    ?error([Input, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-03-14 23:01:59 -07:00
|
|
|
%% value state: dispatch on the first byte of the input.
%%   quote           -> string/4 with a fresh accumulator pushed on the stack
%%                      (single quotes only when single_quoted_strings is set,
%%                      marked by a single_quote entry under the accumulator)
%%   t / f / n       -> tr/4, fa/4, nu/4 (defined outside this view)
%%   - / 0 / 1-9     -> negative/4, zero/4, integer/4 with the byte as the
%%                      start of a new accumulator
%%   { / [           -> emit start_object / start_array and enter object/4 or
%%                      array/4 with key / array pushed on the stack
%%   whitespace      -> skipped
%%   /               -> comment/4 when comments are enabled, remembering to
%%                      come back to value
%%   empty input     -> incomplete
%%   anything else   -> error
value(<<?doublequote, More/binary>>, Handler, Stack, Opts) ->
    string(More, Handler, [?new_seq() | Stack], Opts);
value(<<?singlequote, More/binary>>, Handler, Stack, #opts{single_quoted_strings = true} = Opts) ->
    string(More, Handler, [?new_seq(), single_quote | Stack], Opts);
value(<<$t, More/binary>>, Handler, Stack, Opts) ->
    tr(More, Handler, Stack, Opts);
value(<<$f, More/binary>>, Handler, Stack, Opts) ->
    fa(More, Handler, Stack, Opts);
value(<<$n, More/binary>>, Handler, Stack, Opts) ->
    nu(More, Handler, Stack, Opts);
value(<<?negative, More/binary>>, Handler, Stack, Opts) ->
    negative(More, Handler, [?new_seq($-) | Stack], Opts);
value(<<?zero, More/binary>>, Handler, Stack, Opts) ->
    zero(More, Handler, [?new_seq($0) | Stack], Opts);
value(<<Digit, More/binary>>, Handler, Stack, Opts) when ?is_nonzero(Digit) ->
    integer(More, Handler, [?new_seq(Digit) | Stack], Opts);
value(<<?start_object, More/binary>>, Handler, Stack, Opts) ->
    Opened = handle_event(start_object, Handler, Opts),
    object(More, Opened, [key | Stack], Opts);
value(<<?start_array, More/binary>>, Handler, Stack, Opts) ->
    Opened = handle_event(start_array, Handler, Opts),
    array(More, Opened, [array | Stack], Opts);
value(<<Blank, More/binary>>, Handler, Stack, Opts) when ?is_whitespace(Blank) ->
    value(More, Handler, Stack, Opts);
value(<<?solidus, More/binary>>, Handler, Stack, #opts{comments = true} = Opts) ->
    comment(More, Handler, [value | Stack], Opts);
value(<<>>, Handler, Stack, Opts) ->
    ?incomplete(value, <<>>, Handler, Stack, Opts);
value(Input, Handler, Stack, Opts) ->
    ?error([Input, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-03-14 23:01:59 -07:00
|
|
|
%% object state, entered right after an opening brace.
%% a quote starts a string with a fresh accumulator pushed on the stack
%% (single quotes only when single_quoted_strings is set); a closing brace
%% with key on top of the stack emits end_object and continues in
%% maybe_done/4; whitespace is skipped; a solidus starts a comment when
%% comments are enabled; empty input is incomplete; anything else is an error
object(<<?doublequote, More/binary>>, Handler, Stack, Opts) ->
    string(More, Handler, [?new_seq() | Stack], Opts);
object(<<?singlequote, More/binary>>, Handler, Stack, #opts{single_quoted_strings = true} = Opts) ->
    string(More, Handler, [?new_seq(), single_quote | Stack], Opts);
object(<<?end_object, More/binary>>, Handler, [key | Outer], Opts) ->
    Closed = handle_event(end_object, Handler, Opts),
    maybe_done(More, Closed, Outer, Opts);
object(<<Blank, More/binary>>, Handler, Stack, Opts) when ?is_whitespace(Blank) ->
    object(More, Handler, Stack, Opts);
object(<<?solidus, More/binary>>, Handler, Stack, #opts{comments = true} = Opts) ->
    comment(More, Handler, [object | Stack], Opts);
object(<<>>, Handler, Stack, Opts) ->
    ?incomplete(object, <<>>, Handler, Stack, Opts);
object(Input, Handler, Stack, Opts) ->
    ?error([Input, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2012-03-14 23:01:59 -07:00
|
|
|
%% array state, entered right after an opening bracket.
%% accepts everything value/4 accepts, dispatching to the same states, and
%% additionally a closing bracket: with array on top of the stack it emits
%% end_array and continues in maybe_done/4. a comment started here returns
%% to the array state; empty input is incomplete; anything else is an error
array(<<?doublequote, More/binary>>, Handler, Stack, Opts) ->
    string(More, Handler, [?new_seq() | Stack], Opts);
array(<<?singlequote, More/binary>>, Handler, Stack, #opts{single_quoted_strings = true} = Opts) ->
    string(More, Handler, [?new_seq(), single_quote | Stack], Opts);
array(<<$t, More/binary>>, Handler, Stack, Opts) ->
    tr(More, Handler, Stack, Opts);
array(<<$f, More/binary>>, Handler, Stack, Opts) ->
    fa(More, Handler, Stack, Opts);
array(<<$n, More/binary>>, Handler, Stack, Opts) ->
    nu(More, Handler, Stack, Opts);
array(<<?negative, More/binary>>, Handler, Stack, Opts) ->
    negative(More, Handler, [?new_seq($-) | Stack], Opts);
array(<<?zero, More/binary>>, Handler, Stack, Opts) ->
    zero(More, Handler, [?new_seq($0) | Stack], Opts);
array(<<Digit, More/binary>>, Handler, Stack, Opts) when ?is_nonzero(Digit) ->
    integer(More, Handler, [?new_seq(Digit) | Stack], Opts);
array(<<?start_object, More/binary>>, Handler, Stack, Opts) ->
    Opened = handle_event(start_object, Handler, Opts),
    object(More, Opened, [key | Stack], Opts);
array(<<?start_array, More/binary>>, Handler, Stack, Opts) ->
    Opened = handle_event(start_array, Handler, Opts),
    array(More, Opened, [array | Stack], Opts);
array(<<?end_array, More/binary>>, Handler, [array | Outer], Opts) ->
    Closed = handle_event(end_array, Handler, Opts),
    maybe_done(More, Closed, Outer, Opts);
array(<<Blank, More/binary>>, Handler, Stack, Opts) when ?is_whitespace(Blank) ->
    array(More, Handler, Stack, Opts);
array(<<?solidus, More/binary>>, Handler, Stack, #opts{comments = true} = Opts) ->
    comment(More, Handler, [array | Stack], Opts);
array(<<>>, Handler, Stack, Opts) ->
    ?incomplete(array, <<>>, Handler, Stack, Opts);
array(Input, Handler, Stack, Opts) ->
    ?error([Input, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
|
|
|
%% colon state, entered after an object key.
%% a colon with key on top of the stack swaps that entry for object and
%% parses the following value; whitespace is skipped; a solidus starts a
%% comment when comments are enabled; empty input is incomplete; anything
%% else is an error
colon(<<?colon, More/binary>>, Handler, [key | Outer], Opts) ->
    value(More, Handler, [object | Outer], Opts);
colon(<<Blank, More/binary>>, Handler, Stack, Opts) when ?is_whitespace(Blank) ->
    colon(More, Handler, Stack, Opts);
colon(<<?solidus, More/binary>>, Handler, Stack, #opts{comments = true} = Opts) ->
    comment(More, Handler, [colon | Stack], Opts);
colon(<<>>, Handler, Stack, Opts) ->
    ?incomplete(colon, <<>>, Handler, Stack, Opts);
colon(Input, Handler, Stack, Opts) ->
    ?error([Input, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-03-14 23:01:59 -07:00
|
|
|
%% key state: expects the opening quote of an object key.
%% a quote starts a string with a fresh accumulator pushed on the stack
%% (single quotes only when single_quoted_strings is set); whitespace is
%% skipped; a solidus starts a comment when comments are enabled; empty input
%% is incomplete; anything else is an error
key(<<?doublequote, More/binary>>, Handler, Stack, Opts) ->
    string(More, Handler, [?new_seq() | Stack], Opts);
key(<<?singlequote, More/binary>>, Handler, Stack, #opts{single_quoted_strings = true} = Opts) ->
    string(More, Handler, [?new_seq(), single_quote | Stack], Opts);
key(<<Blank, More/binary>>, Handler, Stack, Opts) when ?is_whitespace(Blank) ->
    key(More, Handler, Stack, Opts);
key(<<?solidus, More/binary>>, Handler, Stack, #opts{comments = true} = Opts) ->
    comment(More, Handler, [key | Stack], Opts);
key(<<>>, Handler, Stack, Opts) ->
    ?incomplete(key, <<>>, Handler, Stack, Opts);
key(Input, Handler, Stack, Opts) ->
    ?error([Input, Handler, Stack, Opts]).
|
2011-09-19 23:06:37 -07:00
|
|
|
|
|
|
|
|
|
|
|
%% string appends its output to the term at the top of the stack. for
%% efficiency the strings are built in reverse order and reversed before
%% being added to the output stream
|
2011-08-31 18:52:01 -07:00
|
|
|
%% when parsing strings, the naive detection of partial codepoints is
%% insufficient. partial_utf/1 answers whether a binary could be the start of
%% a multi byte utf8 sequence that has been cut short:
%%   - the empty binary
%%   - one byte in 16#c2..16#f4
%%   - a lead byte in 16#e0..16#f4 followed by one byte in 16#80..16#bf
%%   - a lead byte in 16#f0..16#f4 followed by two bytes in 16#80..16#bf
%% anything else (including longer input) is reported as not partial
partial_utf(<<>>) ->
    true;
partial_utf(<<Lead>>) ->
    Lead >= 16#c2 andalso Lead =< 16#f4;
partial_utf(<<Lead, C1>>) ->
    Lead >= 16#e0 andalso Lead =< 16#f4
        andalso C1 >= 16#80 andalso C1 =< 16#bf;
partial_utf(<<Lead, C1, C2>>) ->
    Lead >= 16#f0 andalso Lead =< 16#f4
        andalso C1 >= 16#80 andalso C1 =< 16#bf
        andalso C2 >= 16#80 andalso C2 =< 16#bf;
partial_utf(_) ->
    false.
|
|
|
|
|
2012-03-26 18:52:06 -07:00
|
|
|
|
|
|
|
%% string state: consume the contents of a quoted string one codepoint at a
%% time, pushing each onto the accumulator at the top of the stack.
%%
%% the ascii set is explicitly whitelisted, one clause per byte, for better
%% efficiency (the original author measured almost a 20% increase). the
%% identical clauses are stamped out by the macro below so the expanded code
%% is unchanged; the bytes that need special treatment (double quote, single
%% quote, solidus and reverse solidus) keep hand written clauses in their
%% numeric position
-define(string_ascii(Byte),
    string(<<Byte, Rest/binary>>, Handler, [Acc|Stack], Opts) ->
        string(Rest, Handler, [?acc_seq(Acc, Byte)|Stack], Opts)
).

?string_ascii(32);
?string_ascii(33);
%% a double quote ends a double quoted string. with key directly under the
%% accumulator the text is emitted as a key and parsing continues at colon/4;
%% inside a single quoted string it is an error; otherwise the text is
%% emitted as a string value
string(<<?doublequote, Rest/binary>>, Handler, S, Opts) ->
    case S of
        [Acc, key|Stack] ->
            Keyed = handle_event({key, ?end_seq(Acc)}, Handler, Opts),
            colon(Rest, Keyed, [key|Stack], Opts);
        [_Acc, single_quote|_Stack] ->
            ?error([<<?doublequote, Rest/binary>>, Handler, S, Opts]);
        [Acc|Stack] ->
            Valued = handle_event({string, ?end_seq(Acc)}, Handler, Opts),
            maybe_done(Rest, Valued, Stack, Opts)
    end;
?string_ascii(35);
?string_ascii(36);
?string_ascii(37);
?string_ascii(38);
%% a single quote only terminates the string when single quoted strings are
%% enabled and the string was opened with one (single_quote sits under the
%% accumulator); in every other case it is ordinary content
string(<<?singlequote, Rest/binary>>, Handler, [Acc|Stack], Opts) ->
    case Opts#opts.single_quoted_strings of
        false ->
            string(Rest, Handler, [?acc_seq(Acc, ?singlequote)|Stack], Opts);
        true ->
            case Stack of
                [single_quote, key|Outer] ->
                    Keyed = handle_event({key, ?end_seq(Acc)}, Handler, Opts),
                    colon(Rest, Keyed, [key|Outer], Opts);
                [single_quote|Outer] ->
                    Valued = handle_event({string, ?end_seq(Acc)}, Handler, Opts),
                    maybe_done(Rest, Valued, Outer, Opts);
                _ ->
                    Quote = maybe_replace(?singlequote, Opts),
                    string(Rest, Handler, [?acc_seq(Acc, Quote)|Stack], Opts)
            end
    end;
?string_ascii(40);
?string_ascii(41);
?string_ascii(42);
?string_ascii(43);
?string_ascii(44);
?string_ascii(45);
?string_ascii(46);
%% the solidus is passed through maybe_replace/2 before being accumulated
string(<<$/, Rest/binary>>, Handler, [Acc|Stack], Opts) ->
    Solidus = maybe_replace($/, Opts),
    string(Rest, Handler, [?acc_seq(Acc, Solidus)|Stack], Opts);
?string_ascii(48);
?string_ascii(49);
?string_ascii(50);
?string_ascii(51);
?string_ascii(52);
?string_ascii(53);
?string_ascii(54);
?string_ascii(55);
?string_ascii(56);
?string_ascii(57);
?string_ascii(58);
?string_ascii(59);
?string_ascii(60);
?string_ascii(61);
?string_ascii(62);
?string_ascii(63);
?string_ascii(64);
?string_ascii(65);
?string_ascii(66);
?string_ascii(67);
?string_ascii(68);
?string_ascii(69);
?string_ascii(70);
?string_ascii(71);
?string_ascii(72);
?string_ascii(73);
?string_ascii(74);
?string_ascii(75);
?string_ascii(76);
?string_ascii(77);
?string_ascii(78);
?string_ascii(79);
?string_ascii(80);
?string_ascii(81);
?string_ascii(82);
?string_ascii(83);
?string_ascii(84);
?string_ascii(85);
?string_ascii(86);
?string_ascii(87);
?string_ascii(88);
?string_ascii(89);
?string_ascii(90);
?string_ascii(91);
%% a reverse solidus hands over to escape/4 with the stack untouched
string(<<?rsolidus/utf8, Rest/binary>>, Handler, Stack, Opts) ->
    escape(Rest, Handler, Stack, Opts);
?string_ascii(93);
?string_ascii(94);
?string_ascii(95);
?string_ascii(96);
?string_ascii(97);
?string_ascii(98);
?string_ascii(99);
?string_ascii(100);
?string_ascii(101);
?string_ascii(102);
?string_ascii(103);
?string_ascii(104);
?string_ascii(105);
?string_ascii(106);
?string_ascii(107);
?string_ascii(108);
?string_ascii(109);
?string_ascii(110);
?string_ascii(111);
?string_ascii(112);
?string_ascii(113);
?string_ascii(114);
?string_ascii(115);
?string_ascii(116);
?string_ascii(117);
?string_ascii(118);
?string_ascii(119);
?string_ascii(120);
?string_ascii(121);
?string_ascii(122);
?string_ascii(123);
?string_ascii(124);
?string_ascii(125);
?string_ascii(126);
?string_ascii(127);
%% u+2028 and u+2029 are passed through maybe_replace/2
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp =:= 16#2028; Cp =:= 16#2029 ->
    string(Rest, Handler, [?acc_seq(Acc, maybe_replace(Cp, Opts))|Stack], Opts);
%% remaining codepoints accepted as is: everything from the space upwards,
%% leaving out u+d800..u+dfff, u+fdd0..u+fdef and the last two codepoints
%% (xfffe, xffff) of every plane
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#20, Cp < 16#d800 ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp > 16#dfff, Cp < 16#fdd0 ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp > 16#fdef, Cp < 16#fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#10000, Cp < 16#1fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#20000, Cp < 16#2fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#30000, Cp < 16#3fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#40000, Cp < 16#4fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#50000, Cp < 16#5fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#60000, Cp < 16#6fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#70000, Cp < 16#7fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#80000, Cp < 16#8fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#90000, Cp < 16#9fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#a0000, Cp < 16#afffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#b0000, Cp < 16#bfffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#c0000, Cp < 16#cfffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#d0000, Cp < 16#dfffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#e0000, Cp < 16#efffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#f0000, Cp < 16#ffffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when Cp >= 16#100000, Cp < 16#10fffe ->
    string(Rest, Handler, [?acc_seq(Acc, Cp)|Stack], Opts);
%% a well formed codepoint that none of the clauses above accepted: hand it to
%% noncharacter/4 when replaced_bad_utf8 is set, otherwise raise an error
string(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts) ->
    case Opts#opts.replaced_bad_utf8 of
        true ->
            noncharacter(<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts);
        false ->
            ?error([<<Cp/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts])
    end;
%% nothing matched. if the input could be a truncated utf8 sequence ask for
%% more input; otherwise treat it like a rejected codepoint
string(Input, Handler, Stack, Opts) ->
    case partial_utf(Input) of
        true ->
            ?incomplete(string, Input, Handler, Stack, Opts);
        false ->
            case Opts#opts.replaced_bad_utf8 of
                true -> noncharacter(Input, Handler, Stack, Opts);
                false -> ?error([Input, Handler, Stack, Opts])
            end
    end.
|
2012-03-29 21:43:55 -07:00
|
|
|
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
%% replaces one malformed utf8 sequence at the head of the input with u+fffd and
%% hands the remainder back to string (string dispatches here when the
%% replaced_bad_utf8 option is set). we don't need to guard against partial utf
%% here, because it's already taken care of in string
%%
%% surrogates. both trailing bytes must be continuation bytes (16#80..16#bf).
%% anything else falls through to the generic three byte clause below, which
%% only strips real continuation bytes, so a byte that is not part of the
%% sequence (the closing quote, for example) is never swallowed
noncharacter(<<237, X, Y, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when X >= 160, X =< 191, Y >= 128, Y =< 191 ->
    string(Rest, Handler, [?acc_seq(Acc, 16#fffd)|Stack], Opts);
%% u+fffe and u+ffff for R14BXX
noncharacter(<<239, 191, X, Rest/binary>>, Handler, [Acc|Stack], Opts)
        when X =:= 190; X =:= 191 ->
    string(Rest, Handler, [?acc_seq(Acc, 16#fffd)|Stack], Opts);
%% u+xfffe, u+xffff and other noncharacters
noncharacter(<<_/utf8, Rest/binary>>, Handler, [Acc|Stack], Opts) ->
    string(Rest, Handler, [?acc_seq(Acc, 16#fffd)|Stack], Opts);
%% overlong encodings and missing continuations of a 2 byte sequence. the
%% number pushed on the stack is the maximum count of continuation bytes that
%% strip_continuations may consume
noncharacter(<<X, Rest/binary>>, Handler, Stack, Opts) when X >= 192, X =< 223 ->
    strip_continuations(Rest, Handler, [1|Stack], Opts);
%% overlong encodings and missing continuations of a 3 byte sequence
noncharacter(<<X, Rest/binary>>, Handler, Stack, Opts) when X >= 224, X =< 239 ->
    strip_continuations(Rest, Handler, [2|Stack], Opts);
%% overlong encodings and missing continuations of a 4 byte sequence
noncharacter(<<X, Rest/binary>>, Handler, Stack, Opts) when X >= 240, X =< 247 ->
    strip_continuations(Rest, Handler, [3|Stack], Opts);
%% unexpected bytes, including orphan continuations
noncharacter(<<_, Rest/binary>>, Handler, [Acc|Stack], Opts) ->
    string(Rest, Handler, [?acc_seq(Acc, 16#fffd)|Stack], Opts);
%% nothing left to inspect, wait for more input
noncharacter(<<>>, Handler, Stack, Opts) ->
    ?incomplete(noncharacter, <<>>, Handler, Stack, Opts).
|
2011-11-23 20:54:10 -08:00
|
|
|
|
|
|
|
|
2012-03-28 19:34:49 -07:00
|
|
|
%% consumes the continuation bytes that trail a bad utf8 lead byte and then
%% emits a single u+fffd for the whole sequence. the head of the stack is a
%% budget: the maximum number of continuation bytes that may still be removed,
%% which protects against both too short and overlong sequences
%%
%% budget exhausted, emit the replacement and resume string
strip_continuations(Tail, Handler, [0, Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, 16#fffd)|Stack], Opts);
%% a continuation byte (16#80..16#bf), drop it and decrement the budget
strip_continuations(<<Byte, Tail/binary>>, Handler, [Budget|Stack], Opts)
        when Byte >= 16#80, Byte =< 16#bf ->
    strip_continuations(Tail, Handler, [Budget - 1|Stack], Opts);
%% incomplete
strip_continuations(<<>>, Handler, Stack, Opts) ->
    ?incomplete(strip_continuations, <<>>, Handler, Stack, Opts);
%% not a continuation byte, dispatch back to string
strip_continuations(Tail, Handler, [_Budget, Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, 16#fffd)|Stack], Opts).
|
2012-03-27 23:18:06 -07:00
|
|
|
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
%% handles the byte that follows a reverse solidus inside a string. the decoded
%% character is passed through maybe_replace before being accumulated, and
%% parsing then continues in string
escape(<<"b", Tail/binary>>, Handler, [Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace($\b, Opts))|Stack], Opts);
escape(<<"f", Tail/binary>>, Handler, [Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace($\f, Opts))|Stack], Opts);
escape(<<"n", Tail/binary>>, Handler, [Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace($\n, Opts))|Stack], Opts);
escape(<<"r", Tail/binary>>, Handler, [Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace($\r, Opts))|Stack], Opts);
escape(<<"t", Tail/binary>>, Handler, [Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace($\t, Opts))|Stack], Opts);
escape(<<?rsolidus, Tail/binary>>, Handler, [Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace($\\, Opts))|Stack], Opts);
escape(<<?solidus, Tail/binary>>, Handler, [Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace($/, Opts))|Stack], Opts);
escape(<<?doublequote, Tail/binary>>, Handler, [Buf|Stack], Opts) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace($\", Opts))|Stack], Opts);
%% an escaped single quote is only recognized when single quoted strings are
%% enabled
escape(<<?singlequote, Tail/binary>>, Handler, [Buf|Stack],
        Opts = #opts{single_quoted_strings=true}) ->
    string(Tail, Handler, [?acc_seq(Buf, maybe_replace(?singlequote, Opts))|Stack], Opts);
%% \uXXXX sequences get their own state
escape(<<"u", Tail/binary>>, Handler, Stack, Opts) ->
    escaped_unicode(Tail, Handler, Stack, Opts);
escape(<<>>, Handler, Stack, Opts) ->
    ?incomplete(escape, <<>>, Handler, Stack, Opts);
%% unknown escape with ignored_bad_escapes set: keep the reverse solidus
%% literally and let string process the following byte as ordinary input
escape(Other, Handler, [Buf|Stack], Opts = #opts{ignored_bad_escapes=true}) ->
    string(Other, Handler, [?acc_seq(Buf, ?rsolidus)|Stack], Opts);
escape(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
|
|
|
%% this code is ugly and unfortunate, but so is json's handling of escaped
%% unicode codepoint sequences.
%%
%% decodes the four hex digits that follow `\u`. a high surrogate is pushed on
%% the stack and completed by low_surrogate, a lone low surrogate is either
%% replaced by u+fffd (replaced_bad_utf8) or rejected, and any other value is
%% accumulated after passing through maybe_replace
escaped_unicode(<<A, B, C, D, Tail/binary>>, Handler, [Buf|Stack], Opts)
        when ?is_hex(A), ?is_hex(B), ?is_hex(C), ?is_hex(D) ->
    Codepoint = erlang:list_to_integer([A, B, C, D], 16),
    if
        %% high surrogate, dispatch to low surrogate
        Codepoint >= 16#d800, Codepoint =< 16#dbff ->
            low_surrogate(Tail, Handler, [Codepoint, Buf|Stack], Opts);
        %% low surrogate, illegal in this position
        Codepoint >= 16#dc00, Codepoint =< 16#dfff ->
            case Opts#opts.replaced_bad_utf8 of
                true ->
                    string(Tail, Handler, [?acc_seq(Buf, 16#fffd)|Stack], Opts);
                false ->
                    ?error([<<A, B, C, D, Tail/binary>>, Handler, [Buf|Stack], Opts])
            end;
        %% anything else
        true ->
            string(Tail, Handler, [?acc_seq(Buf, maybe_replace(Codepoint, Opts))|Stack], Opts)
    end;
%% fewer than four hex digits available: either the input is merely truncated
%% or it is malformed
escaped_unicode(Other, Handler, Stack, Opts) ->
    case is_partial_escape(Other) of
        true -> ?incomplete(escaped_unicode, Other, Handler, Stack, Opts);
        false -> ?error([Other, Handler, Stack, Opts])
    end.
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2012-03-27 14:44:02 -07:00
|
|
|
%% true when the binary consists of zero to three hex digits and nothing else,
%% i.e. it could still grow into the four digits of a `\uXXXX` escape
is_partial_escape(<<>>) ->
    true;
is_partial_escape(<<H1>>) when ?is_hex(H1) ->
    true;
is_partial_escape(<<H1, H2>>) when ?is_hex(H1), ?is_hex(H2) ->
    true;
is_partial_escape(<<H1, H2, H3>>) when ?is_hex(H1), ?is_hex(H2), ?is_hex(H3) ->
    true;
is_partial_escape(_Other) ->
    false.
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2012-03-27 14:44:02 -07:00
|
|
|
%% completes a surrogate pair. the head of the stack is the high surrogate that
%% escaped_unicode pushed (a value in 16#d800..16#dbff), followed by the string
%% accumulator
%%
%% a second `\uXXXX` escape follows the high surrogate
low_surrogate(<<?rsolidus, $u, A, B, C, D, Rest/binary>>, Handler, [High, Acc|Stack], Opts)
        when ?is_hex(A), ?is_hex(B), ?is_hex(C), ?is_hex(D) ->
    case erlang:list_to_integer([A, B, C, D], 16) of
        %% a proper low surrogate. combining it with a high surrogate always
        %% yields a codepoint of at least 16#10000, so the result can never
        %% land in the surrogate range and needs no further range check
        Low when Low >= 16#dc00, Low =< 16#dfff ->
            Codepoint = surrogate_to_codepoint(High, Low),
            string(Rest, Handler, [?acc_seq(Acc, Codepoint)|Stack], Opts)
        %% some other escaped codepoint: both halves are bad, so with
        %% replaced_bad_utf8 each is replaced by its own u+fffd
        ; _ ->
            case Opts#opts.replaced_bad_utf8 of
                true -> string(Rest, Handler, [?acc_seq(Acc, 16#fffd, 16#fffd)|Stack], Opts)
                ; false -> ?error([<<?rsolidus, $u, A, B, C, D, Rest/binary>>, Handler, [High, Acc|Stack], Opts])
            end
    end;
%% no complete escape follows: either the input is truncated (wait for more) or
%% the high surrogate is orphaned. an orphan is replaced by a single u+fffd and
%% the untouched input is handed back to string
low_surrogate(Bin, Handler, [High, Acc|Stack], Opts) ->
    case is_partial_low(Bin) of
        true -> ?incomplete(low_surrogate, Bin, Handler, [High, Acc|Stack], Opts)
        ; false ->
            case Opts#opts.replaced_bad_utf8 of
                true -> string(Bin, Handler, [?acc_seq(Acc, 16#fffd)|Stack], Opts)
                ; false -> ?error([Bin, Handler, [High, Acc|Stack], Opts])
            end
    end.
|
|
|
|
|
|
|
|
|
|
|
|
%% true when the binary is a proper prefix of a `\uXXXX` escape: nothing at
%% all, the reverse solidus, the reverse solidus plus `u`, or those followed by
%% one to three hex digits
is_partial_low(<<>>) ->
    true;
is_partial_low(<<?rsolidus>>) ->
    true;
is_partial_low(<<?rsolidus, $u>>) ->
    true;
is_partial_low(<<?rsolidus, $u, H1>>) when ?is_hex(H1) ->
    true;
is_partial_low(<<?rsolidus, $u, H1, H2>>) when ?is_hex(H1), ?is_hex(H2) ->
    true;
is_partial_low(<<?rsolidus, $u, H1, H2, H3>>) when ?is_hex(H1), ?is_hex(H2), ?is_hex(H3) ->
    true;
is_partial_low(_Other) ->
    false.
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
|
|
|
%% combines a utf16 surrogate pair into the codepoint it encodes. the formula
%% is the one given in the unicode spec: the offset of the high surrogate
%% supplies the upper ten bits, the offset of the low surrogate the lower ten,
%% and the result is shifted above the basic multilingual plane
surrogate_to_codepoint(High, Low) ->
    UpperBits = (High - 16#d800) * 16#400,
    LowerBits = Low - 16#dc00,
    UpperBits + LowerBits + 16#10000.
|
|
|
|
|
|
|
|
|
2012-03-31 20:38:51 -07:00
|
|
|
%% maps a decoded codepoint to the character list that is accumulated for it.
%% with dirty_strings every integer is passed through untouched. with
%% escaped_strings the json special characters are turned back into their
%% escape sequences. in every other case the codepoint is returned as a one
%% element list
maybe_replace(Char, #opts{dirty_strings=true}) when is_integer(Char) ->
    [Char];
maybe_replace($\b, #opts{escaped_strings=true}) ->
    "\\b";
maybe_replace($\t, #opts{escaped_strings=true}) ->
    "\\t";
maybe_replace($\n, #opts{escaped_strings=true}) ->
    "\\n";
maybe_replace($\f, #opts{escaped_strings=true}) ->
    "\\f";
maybe_replace($\r, #opts{escaped_strings=true}) ->
    "\\r";
maybe_replace($\", #opts{escaped_strings=true}) ->
    "\\\"";
%% single quotes are only escaped when single quoted strings are enabled
maybe_replace($', Opts = #opts{escaped_strings=true}) ->
    case Opts#opts.single_quoted_strings of
        true -> "\\'";
        false -> "'"
    end;
%% forward slashes are only escaped on request
maybe_replace($/, Opts = #opts{escaped_strings=true}) ->
    case Opts#opts.escaped_forward_slashes of
        true -> "\\/";
        false -> "/"
    end;
maybe_replace($\\, #opts{escaped_strings=true}) ->
    "\\\\";
%% u+2028 and u+2029 are escaped unless unescaped_jsonp is set
maybe_replace(Char, Opts = #opts{escaped_strings=true})
        when Char == 16#2028; Char == 16#2029 ->
    case Opts#opts.unescaped_jsonp of
        true -> [Char];
        false -> jsx_utils:json_escape_sequence(Char)
    end;
%% remaining control characters
maybe_replace(Char, #opts{escaped_strings=true}) when Char < 32 ->
    jsx_utils:json_escape_sequence(Char);
maybe_replace(Char, _Opts) ->
    [Char].
|
|
|
|
|
|
|
|
|
|
|
|
|
2011-08-31 18:52:01 -07:00
|
|
|
%% like strings, numbers are collected in an intermediate accumulator before
%% being emitted to the callback handler. the accumulator holds the characters
%% seen so far in reverse order
%%
%% first digit of a number whose accumulator is already on the stack
%% (presumably holding the leading minus sign -- the caller is outside this
%% section)
negative(<<"0", Tail/binary>>, Handler, [Digits|Stack], Opts) ->
    zero(Tail, Handler, [[$0|Digits]|Stack], Opts);
negative(<<Digit, Tail/binary>>, Handler, [Digits|Stack], Opts) when ?is_nonzero(Digit) ->
    integer(Tail, Handler, [[Digit|Digits]|Stack], Opts);
negative(<<>>, Handler, Stack, Opts) ->
    ?incomplete(negative, <<>>, Handler, Stack, Opts);
negative(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-04-06 08:35:40 -07:00
|
|
|
%% state entered after a leading zero has been accumulated. a zero may only be
%% followed by a fraction, an exponent or something that terminates the number
%%
%% the number is the last value of an object
zero(<<?end_object, Rest/binary>>, Handler, [Acc, object|Stack], Opts) ->
    maybe_done(Rest, handle_event([format_number(Acc), end_object], Handler, Opts), Stack, Opts);
%% the number is the last value of an array
zero(<<?end_array, Rest/binary>>, Handler, [Acc, array|Stack], Opts) ->
    maybe_done(Rest, handle_event(end_array, handle_event(format_number(Acc), Handler, Opts), Opts), Stack, Opts);
%% more members follow
zero(<<?comma, Rest/binary>>, Handler, [Acc, object|Stack], Opts) ->
    key(Rest, handle_event(format_number(Acc), Handler, Opts), [key|Stack], Opts);
zero(<<?comma, Rest/binary>>, Handler, [Acc, array|Stack], Opts) ->
    value(Rest, handle_event(format_number(Acc), Handler, Opts), [array|Stack], Opts);
%% fraction: the accumulator becomes {IntegerPart, FractionPart}
zero(<<?decimalpoint, Rest/binary>>, Handler, [Acc|Stack], Opts) ->
    initial_decimal(Rest, Handler, [{Acc, []}|Stack], Opts);
%% exponent without a fraction (`0e1`, `-0E3`). json allows an exponent
%% directly after the integer part, exactly as integer does for other digits
zero(<<S, Rest/binary>>, Handler, [Acc|Stack], Opts) when S =:= $e; S =:= $E ->
    e(Rest, Handler, [{Acc, [], []}|Stack], Opts);
zero(<<S, Rest/binary>>, Handler, [Acc|Stack], Opts) when ?is_whitespace(S) ->
    maybe_done(Rest, handle_event(format_number(Acc), Handler, Opts), Stack, Opts);
%% a comment terminates the number, parsing resumes in maybe_done afterwards
zero(<<?solidus, Rest/binary>>, Handler, [Acc|Stack], Opts=#opts{comments=true}) ->
    comment(Rest, handle_event(format_number(Acc), Handler, Opts), [maybe_done|Stack], Opts);
%% end of input terminates the number unless an explicit end is required
zero(<<>>, Handler, [Acc|Stack], Opts = #opts{explicit_end=false}) ->
    maybe_done(<<>>, handle_event(format_number(Acc), Handler, Opts), Stack, Opts);
zero(<<>>, Handler, Stack, Opts) ->
    ?incomplete(zero, <<>>, Handler, Stack, Opts);
zero(Bin, Handler, Stack, Opts) ->
    ?error([Bin, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
|
|
|
%% accumulates the digits of an integer (in reverse order) until a fraction, an
%% exponent or a terminator is seen. on termination the number is formatted and
%% emitted to the handler
integer(<<Digit, Tail/binary>>, Handler, [Digits|Stack], Opts) when ?is_nonzero(Digit) ->
    integer(Tail, Handler, [[Digit|Digits]|Stack], Opts);
%% the number is the last value of an object or array
integer(<<?end_object, Tail/binary>>, Handler, [Digits, object|Stack], Opts) ->
    Emitted = handle_event([format_number(Digits), end_object], Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
integer(<<?end_array, Tail/binary>>, Handler, [Digits, array|Stack], Opts) ->
    Emitted = handle_event([format_number(Digits), end_array], Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
%% more members follow
integer(<<?comma, Tail/binary>>, Handler, [Digits, object|Stack], Opts) ->
    Emitted = handle_event(format_number(Digits), Handler, Opts),
    key(Tail, Emitted, [key|Stack], Opts);
integer(<<?comma, Tail/binary>>, Handler, [Digits, array|Stack], Opts) ->
    Emitted = handle_event(format_number(Digits), Handler, Opts),
    value(Tail, Emitted, [array|Stack], Opts);
%% fraction: the accumulator becomes {IntegerPart, FractionPart}
integer(<<?decimalpoint, Tail/binary>>, Handler, [Digits|Stack], Opts) ->
    initial_decimal(Tail, Handler, [{Digits, []}|Stack], Opts);
integer(<<?zero, Tail/binary>>, Handler, [Digits|Stack], Opts) ->
    integer(Tail, Handler, [[?zero|Digits]|Stack], Opts);
%% exponent without fraction: {IntegerPart, FractionPart, ExponentPart}
integer(<<Char, Tail/binary>>, Handler, [Digits|Stack], Opts)
        when Char =:= $e; Char =:= $E ->
    e(Tail, Handler, [{Digits, [], []}|Stack], Opts);
integer(<<Char, Tail/binary>>, Handler, [Digits|Stack], Opts) when ?is_whitespace(Char) ->
    Emitted = handle_event(format_number(Digits), Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
%% a comment terminates the number, parsing resumes in maybe_done afterwards
integer(<<?solidus, Tail/binary>>, Handler, [Digits|Stack], Opts = #opts{comments=true}) ->
    Emitted = handle_event(format_number(Digits), Handler, Opts),
    comment(Tail, Emitted, [maybe_done|Stack], Opts);
%% end of input terminates the number unless an explicit end is required
integer(<<>>, Handler, [Digits|Stack], Opts = #opts{explicit_end=false}) ->
    Emitted = handle_event(format_number(Digits), Handler, Opts),
    maybe_done(<<>>, Emitted, Stack, Opts);
integer(<<>>, Handler, Stack, Opts) ->
    ?incomplete(integer, <<>>, Handler, Stack, Opts);
integer(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-03-31 17:51:20 -07:00
|
|
|
%% state directly after the decimal point: at least one digit is required
%% before the fraction can be terminated
initial_decimal(<<Digit, Tail/binary>>, Handler, [{Whole, Fraction}|Stack], Opts)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    decimal(Tail, Handler, [{Whole, [Digit|Fraction]}|Stack], Opts);
initial_decimal(<<>>, Handler, Stack, Opts) ->
    ?incomplete(initial_decimal, <<>>, Handler, Stack, Opts);
initial_decimal(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
%% accumulates the digits of the fraction part (in reverse order). the head of
%% the stack is {IntegerPart, FractionPart}. on termination the number is
%% formatted and emitted to the handler
decimal(<<Digit, Tail/binary>>, Handler, [{Whole, Fraction}|Stack], Opts)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    decimal(Tail, Handler, [{Whole, [Digit|Fraction]}|Stack], Opts);
%% the number is the last value of an object or array
decimal(<<?end_object, Tail/binary>>, Handler, [Number, object|Stack], Opts) ->
    Emitted = handle_event([format_number(Number), end_object], Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
decimal(<<?end_array, Tail/binary>>, Handler, [Number, array|Stack], Opts) ->
    Emitted = handle_event([format_number(Number), end_array], Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
%% more members follow
decimal(<<?comma, Tail/binary>>, Handler, [Number, object|Stack], Opts) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    key(Tail, Emitted, [key|Stack], Opts);
decimal(<<?comma, Tail/binary>>, Handler, [Number, array|Stack], Opts) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    value(Tail, Emitted, [array|Stack], Opts);
%% exponent: the accumulator becomes {IntegerPart, FractionPart, ExponentPart}
decimal(<<Char, Tail/binary>>, Handler, [{Whole, Fraction}|Stack], Opts)
        when Char =:= $e; Char =:= $E ->
    e(Tail, Handler, [{Whole, Fraction, []}|Stack], Opts);
decimal(<<Char, Tail/binary>>, Handler, [Number|Stack], Opts) when ?is_whitespace(Char) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
%% a comment terminates the number, parsing resumes in maybe_done afterwards
decimal(<<?solidus, Tail/binary>>, Handler, [Number|Stack], Opts = #opts{comments=true}) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    comment(Tail, Emitted, [maybe_done|Stack], Opts);
%% end of input terminates the number unless an explicit end is required
decimal(<<>>, Handler, [Number|Stack], Opts = #opts{explicit_end=false}) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    maybe_done(<<>>, Emitted, Stack, Opts);
decimal(<<>>, Handler, Stack, Opts) ->
    ?incomplete(decimal, <<>>, Handler, Stack, Opts);
decimal(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-03-31 17:51:20 -07:00
|
|
|
%% state directly after the exponent marker: either the first exponent digit
%% or a sign must follow. the head of the stack is
%% {IntegerPart, FractionPart, ExponentPart}
e(<<Digit, Tail/binary>>, Handler, [{Whole, Fraction, Exponent}|Stack], Opts)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    exp(Tail, Handler, [{Whole, Fraction, [Digit|Exponent]}|Stack], Opts);
e(<<Sign, Tail/binary>>, Handler, [{Whole, Fraction, Exponent}|Stack], Opts)
        when Sign =:= ?positive; Sign =:= ?negative ->
    ex(Tail, Handler, [{Whole, Fraction, [Sign|Exponent]}|Stack], Opts);
e(<<>>, Handler, Stack, Opts) ->
    ?incomplete(e, <<>>, Handler, Stack, Opts);
e(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2012-03-31 17:51:20 -07:00
|
|
|
%% state directly after the exponent sign: at least one digit is required
ex(<<Digit, Tail/binary>>, Handler, [{Whole, Fraction, Exponent}|Stack], Opts)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    exp(Tail, Handler, [{Whole, Fraction, [Digit|Exponent]}|Stack], Opts);
ex(<<>>, Handler, Stack, Opts) ->
    ?incomplete(ex, <<>>, Handler, Stack, Opts);
ex(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2012-03-31 17:51:20 -07:00
|
|
|
%% accumulates the digits of the exponent (in reverse order). the head of the
%% stack is {IntegerPart, FractionPart, ExponentPart}. on termination the
%% number is formatted and emitted to the handler
exp(<<Digit, Tail/binary>>, Handler, [{Whole, Fraction, Exponent}|Stack], Opts)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    exp(Tail, Handler, [{Whole, Fraction, [Digit|Exponent]}|Stack], Opts);
%% the number is the last value of an object or array
exp(<<?end_object, Tail/binary>>, Handler, [Number, object|Stack], Opts) ->
    Emitted = handle_event([format_number(Number), end_object], Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
exp(<<?end_array, Tail/binary>>, Handler, [Number, array|Stack], Opts) ->
    Emitted = handle_event([format_number(Number), end_array], Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
%% more members follow
exp(<<?comma, Tail/binary>>, Handler, [Number, object|Stack], Opts) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    key(Tail, Emitted, [key|Stack], Opts);
exp(<<?comma, Tail/binary>>, Handler, [Number, array|Stack], Opts) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    value(Tail, Emitted, [array|Stack], Opts);
exp(<<Char, Tail/binary>>, Handler, [Number|Stack], Opts) when ?is_whitespace(Char) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
%% a comment terminates the number, parsing resumes in maybe_done afterwards
exp(<<?solidus, Tail/binary>>, Handler, [Number|Stack], Opts = #opts{comments=true}) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    comment(Tail, Emitted, [maybe_done|Stack], Opts);
%% end of input terminates the number unless an explicit end is required
exp(<<>>, Handler, [Number|Stack], Opts = #opts{explicit_end=false}) ->
    Emitted = handle_event(format_number(Number), Handler, Opts),
    maybe_done(<<>>, Emitted, Stack, Opts);
exp(<<>>, Handler, Stack, Opts) ->
    ?incomplete(exp, <<>>, Handler, Stack, Opts);
exp(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
|
|
|
%% turns a number accumulator into the event handed to the handler. every part
%% of the accumulator is a character list in reverse order:
%%   Int                -> {integer, Integer}
%%   {Int, Frac}        -> {float, Float}
%%   {Int, Frac, Exp}   -> {float, Float}
%% list_to_float requires a fraction, so an exponent without one gets `.0`
%% inserted before the `e`
format_number(Int) when is_list(Int) ->
    Text = lists:reverse(Int),
    {integer, list_to_integer(Text)};
format_number({Int, Frac}) ->
    Text = lists:reverse(Frac ++ [$. | Int]),
    {float, list_to_float(Text)};
format_number({Int, [], Exp}) ->
    Text = lists:reverse(Exp ++ [$e, $0, $. | Int]),
    {float, list_to_float(Text)};
format_number({Int, Frac, Exp}) ->
    Text = lists:reverse(Exp ++ [$e | Frac ++ [$. | Int]]),
    {float, list_to_float(Text)}.
|
|
|
|
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
%% literal `true`: expects the `r` and moves on to tru
tr(<<"r", Tail/binary>>, Handler, Stack, Opts) ->
    tru(Tail, Handler, Stack, Opts);
tr(<<>>, Handler, Stack, Opts) ->
    ?incomplete(tr, <<>>, Handler, Stack, Opts);
tr(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
%% literal `true`: expects the `u` and moves on to true
tru(<<"u", Tail/binary>>, Handler, Stack, Opts) ->
    true(Tail, Handler, Stack, Opts);
tru(<<>>, Handler, Stack, Opts) ->
    ?incomplete(tru, <<>>, Handler, Stack, Opts);
tru(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2012-04-06 08:35:40 -07:00
|
|
|
%% literal `true`: expects the final `e`, emits {literal, true} to the handler
%% and continues in maybe_done
true(<<"e", Tail/binary>>, Handler, Stack, Opts) ->
    Emitted = handle_event({literal, true}, Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
true(<<>>, Handler, Stack, Opts) ->
    ?incomplete(true, <<>>, Handler, Stack, Opts);
true(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
%% literal `false`: expects the `a` and moves on to fal
fa(<<"a", Tail/binary>>, Handler, Stack, Opts) ->
    fal(Tail, Handler, Stack, Opts);
fa(<<>>, Handler, Stack, Opts) ->
    ?incomplete(fa, <<>>, Handler, Stack, Opts);
fa(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
%% literal `false`: expects the `l` and moves on to fals
fal(<<"l", Tail/binary>>, Handler, Stack, Opts) ->
    fals(Tail, Handler, Stack, Opts);
fal(<<>>, Handler, Stack, Opts) ->
    ?incomplete(fal, <<>>, Handler, Stack, Opts);
fal(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
%% literal `false`: expects the `s` and moves on to false
fals(<<"s", Tail/binary>>, Handler, Stack, Opts) ->
    false(Tail, Handler, Stack, Opts);
fals(<<>>, Handler, Stack, Opts) ->
    ?incomplete(fals, <<>>, Handler, Stack, Opts);
fals(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2012-04-06 08:35:40 -07:00
|
|
|
%% literal `false`: expects the final `e`, emits {literal, false} to the
%% handler and continues in maybe_done
false(<<"e", Tail/binary>>, Handler, Stack, Opts) ->
    Emitted = handle_event({literal, false}, Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
false(<<>>, Handler, Stack, Opts) ->
    ?incomplete(false, <<>>, Handler, Stack, Opts);
false(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
|
|
|
%% literal `null`: expects the `u` and moves on to nul
nu(<<"u", Tail/binary>>, Handler, Stack, Opts) ->
    nul(Tail, Handler, Stack, Opts);
nu(<<>>, Handler, Stack, Opts) ->
    ?incomplete(nu, <<>>, Handler, Stack, Opts);
nu(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
|
|
|
%% literal `null`: expects the first `l` and moves on to null
nul(<<"l", Tail/binary>>, Handler, Stack, Opts) ->
    null(Tail, Handler, Stack, Opts);
nul(<<>>, Handler, Stack, Opts) ->
    ?incomplete(nul, <<>>, Handler, Stack, Opts);
nul(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-04-06 08:35:40 -07:00
|
|
|
%% literal `null`: expects the final `l`, emits {literal, null} to the handler
%% and continues in maybe_done
null(<<"l", Tail/binary>>, Handler, Stack, Opts) ->
    Emitted = handle_event({literal, null}, Handler, Opts),
    maybe_done(Tail, Emitted, Stack, Opts);
null(<<>>, Handler, Stack, Opts) ->
    ?incomplete(null, <<>>, Handler, Stack, Opts);
null(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-03-19 14:34:07 -07:00
|
|
|
%% state after the solidus that opens a comment. the head of the stack names
%% the state to resume once the comment has ended (see end_comment)
%%
%% a second solidus starts a single line comment
comment(<<?solidus, Tail/binary>>, Handler, Stack, Opts) ->
    single_comment(Tail, Handler, Stack, Opts);
%% a star starts a multi line comment
comment(<<?star, Tail/binary>>, Handler, Stack, Opts) ->
    multi_comment(Tail, Handler, Stack, Opts);
comment(<<>>, Handler, Stack, Opts) ->
    ?incomplete(comment, <<>>, Handler, Stack, Opts);
comment(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-04-01 17:16:22 -07:00
|
|
|
%% skips the body of a single line comment, which runs up to the next newline
single_comment(<<?newline, Tail/binary>>, Handler, Stack, Opts) ->
    end_comment(Tail, Handler, Stack, Opts);
%% any other valid utf8 character is part of the comment
single_comment(<<_Char/utf8, Tail/binary>>, Handler, Stack, Opts) ->
    single_comment(Tail, Handler, Stack, Opts);
%% a trailing comment after the json value may also be ended by the end of the
%% input, unless an explicit end is required
single_comment(<<>>, Handler, [done], Opts = #opts{explicit_end=false}) ->
    end_comment(<<>>, Handler, [done], Opts);
single_comment(<<>>, Handler, Stack, Opts) ->
    ?incomplete(single_comment, <<>>, Handler, Stack, Opts);
single_comment(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
|
|
|
%% skips the body of a multi line comment
%%
%% a star may be the start of the closing `*/`
multi_comment(<<?star, Tail/binary>>, Handler, Stack, Opts) ->
    end_multi_comment(Tail, Handler, Stack, Opts);
%% any other valid utf8 character is part of the comment
multi_comment(<<_Char/utf8, Tail/binary>>, Handler, Stack, Opts) ->
    multi_comment(Tail, Handler, Stack, Opts);
multi_comment(<<>>, Handler, Stack, Opts) ->
    ?incomplete(multi_comment, <<>>, Handler, Stack, Opts);
multi_comment(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-04-01 17:16:22 -07:00
|
|
|
%% state after a star inside a multi line comment
%%
%% `*/` closes the comment
end_multi_comment(<<?solidus, Rest/binary>>, Handler, Stack, Opts) ->
    end_comment(Rest, Handler, Stack, Opts);
%% another star: the previous one was part of the comment body, but this one
%% may still begin the closing `*/`, so stay in this state. without this clause
%% a comment ending in `**/` would never be closed
end_multi_comment(<<?star, Rest/binary>>, Handler, Stack, Opts) ->
    end_multi_comment(Rest, Handler, Stack, Opts);
%% any other character: the star was part of the comment body
end_multi_comment(<<_S/utf8, Rest/binary>>, Handler, Stack, Opts) ->
    multi_comment(Rest, Handler, Stack, Opts);
end_multi_comment(<<>>, Handler, Stack, Opts) ->
    ?incomplete(end_multi_comment, <<>>, Handler, Stack, Opts);
end_multi_comment(Bin, Handler, Stack, Opts) ->
    ?error([Bin, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
2012-04-01 17:16:22 -07:00
|
|
|
%% resumes normal parsing after a comment. the state that was interrupted by
%% the comment is named by the atom on top of the stack; it is popped and the
%% matching state function is entered with the remaining stack
end_comment(Tail, Handler, [Resume|Stack], Opts) ->
    case Resume of
        value -> value(Tail, Handler, Stack, Opts);
        object -> object(Tail, Handler, Stack, Opts);
        array -> array(Tail, Handler, Stack, Opts);
        colon -> colon(Tail, Handler, Stack, Opts);
        key -> key(Tail, Handler, Stack, Opts);
        maybe_done -> maybe_done(Tail, Handler, Stack, Opts);
        done -> done(Tail, Handler, Stack, Opts)
    end.
|
|
|
|
|
|
|
|
|
2012-04-06 08:35:40 -07:00
|
|
|
%% state after a complete value. depending on the enclosing container (the
%% head of the stack) the value may be followed by a comma or by the end of the
%% container
%%
%% no enclosing container left: the json text is complete
maybe_done(Rest, Handler, [], Opts) ->
    done(Rest, handle_event(end_json, Handler, Opts), [], Opts);
maybe_done(<<?end_object, Rest/binary>>, Handler, [object|Stack], Opts) ->
    maybe_done(Rest, handle_event(end_object, Handler, Opts), Stack, Opts);
maybe_done(<<?end_array, Rest/binary>>, Handler, [array|Stack], Opts) ->
    maybe_done(Rest, handle_event(end_array, Handler, Opts), Stack, Opts);
%% another member follows
maybe_done(<<?comma, Rest/binary>>, Handler, [object|Stack], Opts) ->
    key(Rest, Handler, [key|Stack], Opts);
maybe_done(<<?comma, Rest/binary>>, Handler, [array|_] = Stack, Opts) ->
    value(Rest, Handler, Stack, Opts);
maybe_done(<<S, Rest/binary>>, Handler, Stack, Opts) when ?is_whitespace(S) ->
    maybe_done(Rest, Handler, Stack, Opts);
%% comments resume in this state once they have ended
maybe_done(<<?solidus, Rest/binary>>, Handler, Stack, Opts=#opts{comments=true}) ->
    comment(Rest, Handler, [maybe_done|Stack], Opts);
%% out of input inside a container. the non-empty list pattern replaces a
%% `length(Stack) > 0` guard, which walks the whole stack just to test for
%% emptiness
maybe_done(<<>>, Handler, [_|_] = Stack, Opts) ->
    ?incomplete(maybe_done, <<>>, Handler, Stack, Opts);
maybe_done(Bin, Handler, Stack, Opts) ->
    ?error([Bin, Handler, Stack, Opts]).
|
|
|
|
|
|
|
|
|
|
|
|
%% final state, entered with an empty stack once the json text is complete.
%% only whitespace and (if enabled) comments may follow
done(<<Char, Tail/binary>>, Handler, [], Opts) when ?is_whitespace(Char) ->
    done(Tail, Handler, [], Opts);
done(<<?solidus, Tail/binary>>, Handler, [], Opts = #opts{comments=true}) ->
    comment(Tail, Handler, [done], Opts);
%% with explicit_end the result is only returned once the caller signals
%% end_stream; further binaries are checked for trailing garbage
done(<<>>, {Handler, State}, [], Opts = #opts{explicit_end=true}) ->
    Continue = fun
        (More) when is_binary(More) -> done(More, {Handler, State}, [], Opts);
        (end_stream) -> State
    end,
    {incomplete, Continue};
%% otherwise the handler state is the result
done(<<>>, {_Handler, State}, [], _Opts) ->
    State;
done(Other, Handler, Stack, Opts) ->
    ?error([Other, Handler, Stack, Opts]).
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-ifdef(TEST).
|
|
|
|
-include_lib("eunit/include/eunit.hrl").
|
|
|
|
|
|
|
|
|
2012-03-28 23:31:07 -07:00
|
|
|
%% Test helper: wraps the raw bytes in Bin in double quotes (byte 34) so they
%% form a JSON string, then runs the result through jsx:to_term/2.
%%
%% xcode/1 uses an empty option list. Returns whatever jsx:to_term/2 returns,
%% or {error, badarg} when a badarg error is raised.
xcode(Bin) ->
    xcode(Bin, []).

xcode(Bin, Opts) ->
    %% The whole binary is spliced in directly; there is no need to compute
    %% its length first (and size/1 is ambiguous between tuples and binaries).
    try
        jsx:to_term(<<34, Bin/binary, 34>>, Opts)
    catch
        error:badarg -> {error, badarg}
    end.
|
|
|
|
|
|
|
|
|
|
|
|
%% True only when the given result is exactly {error, badarg}.
is_bad(Result) ->
    Result =:= {error, badarg}.
|
|
|
|
|
|
|
|
|
|
|
|
%% EUnit generator covering malformed UTF-8 inside JSON strings.
%%
%% Every malformed input is checked twice: once with default options, where
%% xcode/1 must yield {error, badarg}, and once with [replaced_bad_utf8],
%% where the expected output contains U+FFFD in place of the bad sequence.
%% ?_assertEqual takes the expected value first so failure reports label the
%% two sides correctly.
bad_utf8_test_() ->
    Replacement = <<16#fffd/utf8>>,
    ReplacementThenSpace = <<16#fffd/utf8, 32>>,
    LonelyStartsReplaced = <<16#fffd/utf8, 32, 16#fffd/utf8>>,
    [
        {"orphan continuation byte u+0080",
            ?_assert(is_bad(xcode(<<16#0080>>)))
        },
        {"orphan continuation byte u+0080 replaced",
            ?_assertEqual(Replacement, xcode(<<16#0080>>, [replaced_bad_utf8]))
        },
        {"orphan continuation byte u+00bf",
            ?_assert(is_bad(xcode(<<16#00bf>>)))
        },
        {"orphan continuation byte u+00bf replaced",
            ?_assertEqual(Replacement, xcode(<<16#00bf>>, [replaced_bad_utf8]))
        },
        {"2 continuation bytes",
            ?_assert(is_bad(xcode(binary:copy(<<16#0080>>, 2))))
        },
        {"2 continuation bytes replaced",
            ?_assertEqual(
                binary:copy(<<16#fffd/utf8>>, 2),
                xcode(binary:copy(<<16#0080>>, 2), [replaced_bad_utf8])
            )
        },
        {"3 continuation bytes",
            ?_assert(is_bad(xcode(binary:copy(<<16#0080>>, 3))))
        },
        {"3 continuation bytes replaced",
            ?_assertEqual(
                binary:copy(<<16#fffd/utf8>>, 3),
                xcode(binary:copy(<<16#0080>>, 3), [replaced_bad_utf8])
            )
        },
        {"4 continuation bytes",
            ?_assert(is_bad(xcode(binary:copy(<<16#0080>>, 4))))
        },
        {"4 continuation bytes replaced",
            ?_assertEqual(
                binary:copy(<<16#fffd/utf8>>, 4),
                xcode(binary:copy(<<16#0080>>, 4), [replaced_bad_utf8])
            )
        },
        {"5 continuation bytes",
            ?_assert(is_bad(xcode(binary:copy(<<16#0080>>, 5))))
        },
        {"5 continuation bytes replaced",
            ?_assertEqual(
                binary:copy(<<16#fffd/utf8>>, 5),
                xcode(binary:copy(<<16#0080>>, 5), [replaced_bad_utf8])
            )
        },
        {"6 continuation bytes",
            ?_assert(is_bad(xcode(binary:copy(<<16#0080>>, 6))))
        },
        {"6 continuation bytes replaced",
            ?_assertEqual(
                binary:copy(<<16#fffd/utf8>>, 6),
                xcode(binary:copy(<<16#0080>>, 6), [replaced_bad_utf8])
            )
        },
        {"all continuation bytes",
            ?_assert(is_bad(xcode(list_to_binary(lists:seq(16#0080, 16#00bf)))))
        },
        {"all continuation bytes replaced",
            ?_assertEqual(
                binary:copy(<<16#fffd/utf8>>, length(lists:seq(16#0080, 16#00bf))),
                xcode(list_to_binary(lists:seq(16#0080, 16#00bf)), [replaced_bad_utf8])
            )
        },
        {"lonely start byte",
            ?_assert(is_bad(xcode(<<16#00c0>>)))
        },
        {"lonely start byte replaced",
            ?_assertEqual(Replacement, xcode(<<16#00c0>>, [replaced_bad_utf8]))
        },
        {"lonely start bytes (2 byte)",
            ?_assert(is_bad(xcode(<<16#00c0, 32, 16#00df>>)))
        },
        {"lonely start bytes (2 byte) replaced",
            ?_assertEqual(
                LonelyStartsReplaced,
                xcode(<<16#00c0, 32, 16#00df>>, [replaced_bad_utf8])
            )
        },
        {"lonely start bytes (3 byte)",
            ?_assert(is_bad(xcode(<<16#00e0, 32, 16#00ef>>)))
        },
        {"lonely start bytes (3 byte) replaced",
            ?_assertEqual(
                LonelyStartsReplaced,
                xcode(<<16#00e0, 32, 16#00ef>>, [replaced_bad_utf8])
            )
        },
        {"lonely start bytes (4 byte)",
            ?_assert(is_bad(xcode(<<16#00f0, 32, 16#00f7>>)))
        },
        {"lonely start bytes (4 byte) replaced",
            ?_assertEqual(
                LonelyStartsReplaced,
                xcode(<<16#00f0, 32, 16#00f7>>, [replaced_bad_utf8])
            )
        },
        {"missing continuation byte (3 byte)",
            ?_assert(is_bad(xcode(<<224, 160, 32>>)))
        },
        {"missing continuation byte (3 byte) replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<224, 160, 32>>, [replaced_bad_utf8])
            )
        },
        {"missing continuation byte (4 byte missing one)",
            ?_assert(is_bad(xcode(<<240, 144, 128, 32>>)))
        },
        {"missing continuation byte2 (4 byte missing one) replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<240, 144, 128, 32>>, [replaced_bad_utf8])
            )
        },
        {"missing continuation byte (4 byte missing two)",
            ?_assert(is_bad(xcode(<<240, 144, 32>>)))
        },
        {"missing continuation byte2 (4 byte missing two) replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<240, 144, 32>>, [replaced_bad_utf8])
            )
        },
        {"overlong encoding of u+002f (2 byte)",
            ?_assert(is_bad(xcode(<<16#c0, 16#af, 32>>)))
        },
        {"overlong encoding of u+002f (2 byte) replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<16#c0, 16#af, 32>>, [replaced_bad_utf8])
            )
        },
        {"overlong encoding of u+002f (3 byte)",
            ?_assert(is_bad(xcode(<<16#e0, 16#80, 16#af, 32>>)))
        },
        {"overlong encoding of u+002f (3 byte) replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<16#e0, 16#80, 16#af, 32>>, [replaced_bad_utf8])
            )
        },
        {"overlong encoding of u+002f (4 byte)",
            ?_assert(is_bad(xcode(<<16#f0, 16#80, 16#80, 16#af, 32>>)))
        },
        {"overlong encoding of u+002f (4 byte) replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<16#f0, 16#80, 16#80, 16#af, 32>>, [replaced_bad_utf8])
            )
        },
        {"highest overlong 2 byte sequence",
            ?_assert(is_bad(xcode(<<16#c1, 16#bf, 32>>)))
        },
        {"highest overlong 2 byte sequence replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<16#c1, 16#bf, 32>>, [replaced_bad_utf8])
            )
        },
        {"highest overlong 3 byte sequence",
            ?_assert(is_bad(xcode(<<16#e0, 16#9f, 16#bf, 32>>)))
        },
        {"highest overlong 3 byte sequence replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<16#e0, 16#9f, 16#bf, 32>>, [replaced_bad_utf8])
            )
        },
        {"highest overlong 4 byte sequence",
            ?_assert(is_bad(xcode(<<16#f0, 16#8f, 16#bf, 16#bf, 32>>)))
        },
        {"highest overlong 4 byte sequence replaced",
            ?_assertEqual(
                ReplacementThenSpace,
                xcode(<<16#f0, 16#8f, 16#bf, 16#bf, 32>>, [replaced_bad_utf8])
            )
        }
    ].
|
|
|
|
|
|
|
|
|
2012-03-31 08:02:27 -07:00
|
|
|
%% Test helper: builds a decoder with decoder/3 (handler module `jsx', initial
%% state [], the given Opts) and applies it to JSON. A badarg error raised
%% while doing so is reported as {error, badjson}; any other outcome is
%% returned unchanged.
decode(JSON, Opts) ->
    try
        Decode = decoder(jsx, [], Opts),
        Decode(JSON)
    catch
        error:badarg -> {error, badjson}
    end.
|
|
|
|
|
|
|
|
|
2012-03-31 21:58:18 -07:00
|
|
|
%% EUnit generator: with [ignored_bad_escapes], the unrecognized escape
%% sequence \x25 is expected to come through in the string event verbatim.
%% The expected value is passed first, as ?_assertEqual requires.
ignored_bad_escapes_test_() ->
    [
        {"ignore unrecognized escape sequence", ?_assertEqual(
            [start_array, {string, <<"\\x25">>}, end_array, end_json],
            decode(<<"[\"\\x25\"]">>, [ignored_bad_escapes])
        )}
    ].
|
|
|
|
|
|
|
|
|
2012-03-19 14:34:07 -07:00
|
|
|
%% EUnit generator for the [comments] option.
%%
%% Each case decodes JSON containing a `//' or `/* */' comment at a particular
%% position and expects the same event list as the comment-free document.
%% Expected event lists that recur are bound once below; every ?_assertEqual
%% takes the expected value first so failure reports label the sides correctly.
comments_test_() ->
    EmptyArray = [start_array, end_array, end_json],
    TrueArray = [start_array, {literal, true}, end_array, end_json],
    TrueFalseArray = [start_array, {literal, true}, {literal, false}, end_array, end_json],
    EmptyObject = [start_object, end_object, end_json],
    KeyObject = [start_object, {key, <<"key">>}, {literal, true}, end_object, end_json],
    XYObject = [
        start_object,
        {key, <<"x">>},
        {literal, true},
        {key, <<"y">>},
        {literal, false},
        end_object,
        end_json
    ],
    [
        {"preceeding // comment", ?_assertEqual(
            EmptyArray,
            decode(<<"// comment ", ?newline, "[]">>, [comments])
        )},
        {"preceeding /**/ comment", ?_assertEqual(
            EmptyArray,
            decode(<<"/* comment */[]">>, [comments])
        )},
        {"trailing // comment", ?_assertEqual(
            EmptyArray,
            decode(<<"[]// comment", ?newline>>, [comments])
        )},
        {"trailing // comment (no newline)", ?_assertEqual(
            EmptyArray,
            decode(<<"[]// comment">>, [comments])
        )},
        {"trailing /**/ comment", ?_assertEqual(
            EmptyArray,
            decode(<<"[] /* comment */">>, [comments])
        )},
        {"// comment inside array", ?_assertEqual(
            EmptyArray,
            decode(<<"[ // comment", ?newline, "]">>, [comments])
        )},
        {"/**/ comment inside array", ?_assertEqual(
            EmptyArray,
            decode(<<"[ /* comment */ ]">>, [comments])
        )},
        {"// comment at beginning of array", ?_assertEqual(
            TrueArray,
            decode(<<"[ // comment", ?newline, "true", ?newline, "]">>, [comments])
        )},
        {"/**/ comment at beginning of array", ?_assertEqual(
            TrueArray,
            decode(<<"[ /* comment */ true ]">>, [comments])
        )},
        {"// comment at end of array", ?_assertEqual(
            TrueArray,
            decode(<<"[ true // comment", ?newline, "]">>, [comments])
        )},
        {"/**/ comment at end of array", ?_assertEqual(
            TrueArray,
            decode(<<"[ true /* comment */ ]">>, [comments])
        )},
        {"// comment midarray (post comma)", ?_assertEqual(
            TrueFalseArray,
            decode(<<"[ true, // comment", ?newline, "false ]">>, [comments])
        )},
        {"/**/ comment midarray (post comma)", ?_assertEqual(
            TrueFalseArray,
            decode(<<"[ true, /* comment */ false ]">>, [comments])
        )},
        {"// comment midarray (pre comma)", ?_assertEqual(
            TrueFalseArray,
            decode(<<"[ true// comment", ?newline, ", false ]">>, [comments])
        )},
        {"/**/ comment midarray (pre comma)", ?_assertEqual(
            TrueFalseArray,
            decode(<<"[ true/* comment */, false ]">>, [comments])
        )},
        {"// comment inside object", ?_assertEqual(
            EmptyObject,
            decode(<<"{ // comment", ?newline, "}">>, [comments])
        )},
        {"/**/ comment inside object", ?_assertEqual(
            EmptyObject,
            decode(<<"{ /* comment */ }">>, [comments])
        )},
        {"// comment at beginning of object", ?_assertEqual(
            KeyObject,
            decode(<<"{ // comment", ?newline, " \"key\": true", ?newline, "}">>, [comments])
        )},
        {"/**/ comment at beginning of object", ?_assertEqual(
            KeyObject,
            decode(<<"{ /* comment */ \"key\": true }">>, [comments])
        )},
        {"// comment at end of object", ?_assertEqual(
            KeyObject,
            decode(<<"{ \"key\": true // comment", ?newline, "}">>, [comments])
        )},
        {"/**/ comment at end of object", ?_assertEqual(
            KeyObject,
            decode(<<"{ \"key\": true /* comment */ }">>, [comments])
        )},
        {"// comment midobject (post comma)", ?_assertEqual(
            XYObject,
            decode(<<"{ \"x\": true, // comment", ?newline, "\"y\": false }">>, [comments])
        )},
        {"/**/ comment midobject (post comma)", ?_assertEqual(
            XYObject,
            decode(<<"{ \"x\": true, /* comment */", ?newline, "\"y\": false }">>, [comments])
        )},
        {"// comment midobject (pre comma)", ?_assertEqual(
            XYObject,
            decode(<<"{ \"x\": true// comment", ?newline, ", \"y\": false }">>, [comments])
        )},
        {"/**/ comment midobject (pre comma)", ?_assertEqual(
            XYObject,
            decode(<<"{ \"x\": true/* comment */", ?newline, ", \"y\": false }">>, [comments])
        )},
        {"// comment precolon", ?_assertEqual(
            KeyObject,
            decode(<<"{ \"key\" // comment", ?newline, ": true }">>, [comments])
        )},
        {"/**/ comment precolon", ?_assertEqual(
            KeyObject,
            decode(<<"{ \"key\"/* comment */: true }">>, [comments])
        )},
        {"// comment postcolon", ?_assertEqual(
            KeyObject,
            decode(<<"{ \"key\": // comment", ?newline, " true }">>, [comments])
        )},
        {"/**/ comment postcolon", ?_assertEqual(
            KeyObject,
            decode(<<"{ \"key\":/* comment */ true }">>, [comments])
        )},
        {"// comment terminating zero", ?_assertEqual(
            [start_array, {integer, 0}, end_array, end_json],
            decode(<<"[ 0// comment", ?newline, "]">>, [comments])
        )},
        {"// comment terminating integer", ?_assertEqual(
            [start_array, {integer, 1}, end_array, end_json],
            decode(<<"[ 1// comment", ?newline, "]">>, [comments])
        )},
        {"// comment terminating float", ?_assertEqual(
            [start_array, {float, 1.0}, end_array, end_json],
            decode(<<"[ 1.0// comment", ?newline, "]">>, [comments])
        )},
        {"// comment terminating exp", ?_assertEqual(
            [start_array, {float, 1.0e1}, end_array, end_json],
            decode(<<"[ 1e1// comment", ?newline, "]">>, [comments])
        )},
        {"/**/ comment terminating zero", ?_assertEqual(
            [start_array, {integer, 0}, end_array, end_json],
            decode(<<"[ 0/* comment */ ]">>, [comments])
        )},
        {"/**/ comment terminating integer", ?_assertEqual(
            [start_array, {integer, 1}, end_array, end_json],
            decode(<<"[ 1/* comment */ ]">>, [comments])
        )},
        {"/**/ comment terminating float", ?_assertEqual(
            [start_array, {float, 1.0}, end_array, end_json],
            decode(<<"[ 1.0/* comment */ ]">>, [comments])
        )},
        {"/**/ comment terminating exp", ?_assertEqual(
            [start_array, {float, 1.0e1}, end_array, end_json],
            decode(<<"[ 1e1/* comment */ ]">>, [comments])
        )}
    ].
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-31 21:58:18 -07:00
|
|
|
%% EUnit generator: decoding a string containing a forward slash with
%% [escaped_forward_slashes] (and without escaped_strings) is expected to
%% yield the slash unchanged. Expected value first, per ?_assertEqual.
escaped_forward_slashes_test_() ->
    [
        {"escape forward slash test", ?_assertEqual(
            [start_array, {string, <<" / ">>}, end_array, end_json],
            decode(<<"[ \" \/ \" ]">>, [escaped_forward_slashes])
        )}
    ].
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-31 12:30:47 -07:00
|
|
|
%% EUnit generator for the [escaped_strings] option and the options that
%% modify it (single_quoted_strings, escaped_forward_slashes, unescaped_jsonp,
%% dirty_strings, ignored_bad_escapes).
%%
%% Each case decodes a single JSON string and compares the emitted events
%% against the expected escaped (or deliberately unescaped) form. The expected
%% value is passed first, as ?_assertEqual requires.
escapes_test_() ->
    [
        {"backspace escape", ?_assertEqual(
            [{string, <<"\\b">>}, end_json],
            decode(<<"\"\\b\"">>, [escaped_strings])
        )},
        {"formfeed escape", ?_assertEqual(
            [{string, <<"\\f">>}, end_json],
            decode(<<"\"\\f\"">>, [escaped_strings])
        )},
        {"newline escape", ?_assertEqual(
            [{string, <<"\\n">>}, end_json],
            decode(<<"\"\\n\"">>, [escaped_strings])
        )},
        {"carriage return escape", ?_assertEqual(
            [{string, <<"\\r">>}, end_json],
            decode(<<"\"\\r\"">>, [escaped_strings])
        )},
        {"tab escape", ?_assertEqual(
            [{string, <<"\\t">>}, end_json],
            decode(<<"\"\\t\"">>, [escaped_strings])
        )},
        {"quote escape", ?_assertEqual(
            [{string, <<"\\\"">>}, end_json],
            decode(<<"\"\\\"\"">>, [escaped_strings])
        )},
        {"single quote escape", ?_assertEqual(
            [{string, <<"\\'">>}, end_json],
            decode(<<"\"'\"">>, [escaped_strings, single_quoted_strings])
        )},
        {"naked single quote escape", ?_assertEqual(
            [{string, <<"\\'">>}, end_json],
            decode(<<"'\\''">>, [escaped_strings, single_quoted_strings])
        )},
        {"no single quote escape", ?_assertEqual(
            [{string, <<"'">>}, end_json],
            decode(<<"\"'\"">>, [escaped_strings])
        )},
        {"forward slash escape", ?_assertEqual(
            [{string, <<"\\/">>}, end_json],
            decode(<<"\"/\"">>, [escaped_strings, escaped_forward_slashes])
        )},
        {"no forward slash escape", ?_assertEqual(
            [{string, <<"/">>}, end_json],
            decode(<<"\"/\"">>, [escaped_strings])
        )},
        {"back slash escape", ?_assertEqual(
            [{string, <<"\\\\">>}, end_json],
            decode(<<"\"\\\\\"">>, [escaped_strings])
        )},
        {"jsonp escape", ?_assertEqual(
            [{string, <<"\\u2028\\u2029">>}, end_json],
            decode(<<$\", 16#2028/utf8, 16#2029/utf8, $\">>, [escaped_strings])
        )},
        {"no jsonp escape", ?_assertEqual(
            [{string, <<16#2028/utf8, 16#2029/utf8>>}, end_json],
            decode(<<$\", 16#2028/utf8, 16#2029/utf8, $\">>, [escaped_strings, unescaped_jsonp])
        )},
        {"control escape", ?_assertEqual(
            [{string, <<"\\u0000">>}, end_json],
            decode(<<$\", "\\u0000"/utf8, $\">>, [escaped_strings])
        )},
        {"dirty strings", ?_assertEqual(
            [{string, <<"\n">>}, end_json],
            decode(<<"\"\\n\"">>, [escaped_strings, dirty_strings])
        )},
        {"ignore bad escapes", ?_assertEqual(
            [{string, <<"\\x25">>}, end_json],
            decode(<<"\"\\x25\"">>, [escaped_strings, ignored_bad_escapes])
        )}
    ].
|
|
|
|
|
|
|
|
|
2012-03-28 19:34:49 -07:00
|
|
|
%% EUnit generator over the codepoints listed by noncharacters/0: each must be
%% rejected as badjson with default options (check_bad/1) and decode to a
%% U+FFFD string under replaced_bad_utf8 (check_replaced/1).
noncharacters_test_() ->
    [
        {"noncharacters - badjson",
            ?_assert(check_bad(noncharacters()))},
        {"noncharacters - replaced",
            ?_assert(check_replaced(noncharacters()))}
    ].
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-28 19:34:49 -07:00
|
|
|
%% EUnit generator over the codepoints listed by extended_noncharacters/0:
%% rejected as badjson by default (check_bad/1), replaced by U+FFFD under
%% replaced_bad_utf8 (check_replaced/1).
extended_noncharacters_test_() ->
    [
        {"extended noncharacters - badjson",
            ?_assert(check_bad(extended_noncharacters()))},
        {"extended noncharacters - replaced",
            ?_assert(check_replaced(extended_noncharacters()))}
    ].
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2011-10-21 18:16:16 -07:00
|
|
|
%% EUnit generator over the codepoints listed by surrogates/0: rejected as
%% badjson by default (check_bad/1), replaced by U+FFFD under
%% replaced_bad_utf8 (check_replaced/1).
surrogates_test_() ->
    [
        {"surrogates - badjson",
            ?_assert(check_bad(surrogates()))},
        {"surrogates - replaced",
            ?_assert(check_replaced(surrogates()))}
    ].
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2011-10-21 18:16:16 -07:00
|
|
|
%% EUnit generator: every codepoint from control_characters/0, placed raw
%% inside a JSON string, must be rejected as badjson (check_bad/1).
control_test_() ->
    [
        {"control characters - badjson",
            ?_assert(check_bad(control_characters()))}
    ].
|
2012-03-28 19:34:49 -07:00
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-28 19:34:49 -07:00
|
|
|
%% EUnit generator over the codepoints listed by reserved_space/0: rejected as
%% badjson by default (check_bad/1), replaced by U+FFFD under
%% replaced_bad_utf8 (check_replaced/1).
reserved_test_() ->
    [
        {"reserved noncharacters - badjson",
            ?_assert(check_bad(reserved_space()))},
        {"reserved noncharacters - replaced",
            ?_assert(check_replaced(reserved_space()))}
    ].
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
%% EUnit generator: every codepoint from good/0 (and good_extended/0) must
%% decode to a string event (check_good/1,2), under default options and under
%% each combination of escaped_strings and replaced_bad_utf8.
good_characters_test_() ->
    [
        {"acceptable codepoints",
            ?_assert(check_good(good()))},
        {"acceptable codepoints - escaped_strings",
            ?_assert(check_good(good(), [escaped_strings]))},
        %% This case previously passed [escaped_strings], duplicating the case
        %% above and leaving replaced_bad_utf8 untested on its own.
        {"acceptable codepoints - replaced_bad_utf8",
            ?_assert(check_good(good(), [replaced_bad_utf8]))},
        {"acceptable codepoints - escaped_strings + replaced_bad_utf8",
            ?_assert(check_good(good(), [escaped_strings, replaced_bad_utf8]))},
        {"acceptable extended",
            ?_assert(check_good(good_extended()))}
    ].
|
|
|
|
|
|
|
|
|
|
|
|
%% True when every codepoint in List, decoded via check/3 with no options,
%% produced {error, badjson}. An empty List yields true.
check_bad(List) ->
    IsBadJson = fun
        ({_, {error, badjson}}) -> true;
        (_) -> false
    end,
    lists:all(IsBadJson, check(List, [], [])).
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2011-10-21 18:16:16 -07:00
|
|
|
%% True when every codepoint in List, decoded via check/3 with
%% [replaced_bad_utf8], produced an event list whose first event is a string
%% consisting solely of U+FFFD. An empty List yields true.
check_replaced(List) ->
    IsReplaced = fun
        ({_, [{string, <<16#fffd/utf8>>}|_]}) -> true;
        (_) -> false
    end,
    lists:all(IsReplaced, check(List, [replaced_bad_utf8], [])).
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-31 08:02:27 -07:00
|
|
|
%% True when every codepoint in List, decoded via check/3 with Opts, produced
%% an event list whose first event is a {string, _} tuple. check_good/1 uses
%% an empty option list. An empty List yields true.
check_good(List) ->
    check_good(List, []).

check_good(List, Opts) ->
    IsString = fun
        ({_, [{string, _}|_]}) -> true;
        (_) -> false
    end,
    lists:all(IsString, check(List, Opts, [])).
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2011-10-21 18:16:16 -07:00
|
|
|
%% Decodes each codepoint of the list (encoded as a quoted string by
%% to_fake_utf/2) with Opts and accumulates {Codepoint, Result} pairs.
%% Pairs are prepended, so the result is in reverse input order, followed by
%% whatever Acc initially held.
check([Codepoint|Rest], Opts, Acc) ->
    Result = decode(to_fake_utf(Codepoint, utf8), Opts),
    check(Rest, Opts, [{Codepoint, Result}|Acc]);
check([], _Opts, Acc) ->
    Acc.
|
|
|
|
|
|
|
|
|
2012-03-28 19:34:49 -07:00
|
|
|
%% The two codepoints U+FFFE and U+FFFF.
noncharacters() ->
    [16#fffe, 16#ffff].
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-28 19:34:49 -07:00
|
|
|
%% The codepoints U+nFFFE and U+nFFFF for n = 16#1 .. 16#10, in ascending
%% order (32 values in total).
extended_noncharacters() ->
    [(Plane bsl 16) bor Low || Plane <- lists:seq(16#1, 16#10), Low <- [16#fffe, 16#ffff]].
|
|
|
|
|
2011-10-21 18:16:16 -07:00
|
|
|
%% All codepoints from U+D800 through U+DFFF inclusive.
surrogates() ->
    First = 16#d800,
    Last = 16#dfff,
    lists:seq(First, Last).
|
|
|
|
|
|
|
|
%% Codepoints 1 through 31 inclusive (0 is not part of the list).
control_characters() ->
    First = 1,
    Last = 31,
    lists:seq(First, Last).
|
|
|
|
|
2012-03-28 19:34:49 -07:00
|
|
|
%% All codepoints from U+FDD0 through U+FDEF inclusive.
reserved_space() ->
    First = 16#fdd0,
    Last = 16#fdef,
    lists:seq(First, Last).
|
|
|
|
|
|
|
|
%% Codepoints up to U+FFFD used by the "acceptable codepoints" tests, in
%% ascending order. The ranges skip everything below 32, 16#22 (double quote),
%% 16#5c (backslash), 16#d800..16#dfff and 16#fdd0..16#fdef.
good() ->
    lists:append([
        [32, 33],
        lists:seq(16#23, 16#5b),
        lists:seq(16#5d, 16#d7ff),
        lists:seq(16#e000, 16#fdcf),
        lists:seq(16#fdf0, 16#fffd)
    ]).
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-29 06:25:49 -07:00
|
|
|
%% Codepoints above U+FFFF used by the "acceptable extended" test: the first
%% codepoint of each of 16#10000, 16#20000 .. 16#f0000, followed by every
%% codepoint from 16#100000 through 16#10fffd.
good_extended() ->
    PlaneStarts = [Plane bsl 16 || Plane <- lists:seq(16#1, 16#f)],
    PlaneStarts ++ lists:seq(16#100000, 16#10fffd).
|
2011-10-21 18:16:16 -07:00
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-31 12:30:47 -07:00
|
|
|
%% Hand-assembles the UTF-8 byte pattern for codepoint N and wraps it in
%% double quotes (byte 34), yielding a JSON string literal as a binary.
%%
%% The bytes are built by bit-packing rather than with the /utf8 segment type
%% because erlang refuses to handle certain codepoints, so all of them are
%% faked the same way. The encoding width is picked from the size of N:
%% one byte below 16#80, two below 16#800, three below 16#10000, else four.
to_fake_utf(N, utf8) ->
    Encoded =
        if
            N < 16#0080 ->
                <<N:8>>;
            N < 16#0800 ->
                <<0:5, Hi2:5, Lo2:6>> = <<N:16>>,
                <<2#110:3, Hi2:5, 2#10:2, Lo2:6>>;
            N < 16#10000 ->
                <<Hi3:4, Mid3:6, Lo3:6>> = <<N:16>>,
                <<2#1110:4, Hi3:4, 2#10:2, Mid3:6, 2#10:2, Lo3:6>>;
            true ->
                <<0:3, Top4:3, Hi4:6, Mid4:6, Lo4:6>> = <<N:24>>,
                <<2#11110:5, Top4:3, 2#10:2, Hi4:6, 2#10:2, Mid4:6, 2#10:2, Lo4:6>>
        end,
    <<34, Encoded/binary, 34>>.
|
|
|
|
|
|
|
|
|
|
|
|
-endif.
|