2011-10-21 18:16:16 -07:00
|
|
|
%% The MIT License
|
|
|
|
|
|
|
|
%% Copyright (c) 2010 Alisdair Sullivan <alisdairsullivan@yahoo.ca>
|
|
|
|
|
|
|
|
%% Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
%% of this software and associated documentation files (the "Software"), to deal
|
|
|
|
%% in the Software without restriction, including without limitation the rights
|
|
|
|
%% to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
%% copies of the Software, and to permit persons to whom the Software is
|
|
|
|
%% furnished to do so, subject to the following conditions:
|
|
|
|
|
|
|
|
%% The above copyright notice and this permission notice shall be included in
|
|
|
|
%% all copies or substantial portions of the Software.
|
|
|
|
|
|
|
|
%% THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
%% IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
%% FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
%% AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
%% LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
%% OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
%% THE SOFTWARE.
|
|
|
|
|
|
|
|
|
|
|
|
-module(jsx_decoder).
|
|
|
|
|
2013-03-02 15:12:29 -08:00
|
|
|
%% inline sequence accumulation, handle_event and format_number
|
|
|
|
-compile({inline, [new_seq/0, new_seq/1, acc_seq/2, end_seq/1]}).
|
|
|
|
-compile({inline, [handle_event/3]}).
|
|
|
|
-compile({inline, [format_number/1]}).
|
|
|
|
|
2011-11-23 20:54:10 -08:00
|
|
|
-export([decoder/3]).
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
|
2013-02-12 11:54:42 -08:00
|
|
|
%% build a decoder closure for the callback module `Handler'.
%%
%% the returned fun takes a json binary and enters the state machine at
%% start/4 with an empty stack. note that `Handler:init/1' and
%% `jsx_utils:parse_config/1' run each time the returned fun is applied, not
%% when the closure is created.
-spec decoder(Handler::module(), State::any(), Config::jsx:config()) -> jsx:decoder().

decoder(Handler, State, Config) ->
    fun(JSON) ->
        Callbacks = {Handler, Handler:init(State)},
        Parsed = jsx_utils:parse_config(Config),
        start(JSON, Callbacks, [], Parsed)
    end.
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
|
2013-02-12 11:54:42 -08:00
|
|
|
-include("jsx_config.hrl").
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
|
2011-08-31 18:52:01 -07:00
|
|
|
%% whitespace
-define(space, $\s).            % 16#20
-define(tab, $\t).              % 16#09
-define(cr, $\r).               % 16#0D
-define(newline, $\n).          % 16#0A

%% object delimiters
-define(start_object, ${).      % 16#7B
-define(end_object, $}).        % 16#7D

%% array delimiters
-define(start_array, $[).       % 16#5B
-define(end_array, $]).         % 16#5D

%% separators and quotes
-define(comma, $,).             % 16#2C
-define(doublequote, $").       % 16#22
-define(singlequote, $').       % 16#27
-define(colon, $:).             % 16#3A

%% string escape sequences
-define(escape, $\\).           % 16#5C
-define(rsolidus, $\\).         % 16#5C
-define(solidus, $/).           % 16#2F
-define(formfeed, $\f).         % 16#0C
-define(backspace, $\b).        % 16#08

%% math
-define(zero, $0).              % 16#30
-define(decimalpoint, $.).      % 16#2E
-define(negative, $-).          % 16#2D
-define(positive, $+).          % 16#2B

%% comments
-define(star, $*).              % 16#2A
|
|
|
|
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
%% some useful guards
%%
%% each body is one fully parenthesised boolean expression, so a macro can be
%% combined with other guard tests (`,', `;', `andalso', `not') without its
%% meaning changing. the comparisons used here cannot fail, so `orelse' gives
%% the same result as separate `;' alternatives would.

%% true for an ascii hexadecimal digit (0-9, a-f, A-F)
-define(is_hex(Symbol),
    ((Symbol >= $a andalso Symbol =< $f) orelse
     (Symbol >= $A andalso Symbol =< $F) orelse
     (Symbol >= $0 andalso Symbol =< $9))
).

%% true for the ascii digits 1-9
-define(is_nonzero(Symbol),
    (Symbol >= $1 andalso Symbol =< $9)
).

%% true for anything at or above the space character
-define(is_noncontrol(Symbol),
    (Symbol >= ?space)
).

%% true for space, tab, carriage return and newline
-define(is_whitespace(Symbol),
    (Symbol =:= ?space orelse Symbol =:= ?tab orelse
     Symbol =:= ?cr orelse Symbol =:= ?newline)
).
|
|
|
|
|
|
|
|
|
|
|
|
%% error, incomplete and event macros
|
|
|
|
-ifndef(error).
%% default error handling, used only when no `error' macro has been defined
%% before this point: every argument supplied by the call site (state name,
%% remaining input, handler, optional accumulator, stack, config) is ignored
%% and decoding aborts with `badarg'.
-define(error(_State, _Bin, _Handler, _Stack, _Config), erlang:error(badarg)).
-define(error(_State, _Bin, _Handler, _Acc, _Stack, _Config), erlang:error(badarg)).
-endif.
|
|
|
|
|
|
|
|
|
|
|
|
-ifndef(incomplete).
%% suspend decoding in state function `State' with `Rest' as the input that
%% has not been consumed yet. the expansion is `{incomplete, F}' where
%%   F(Binary)     re-enters `State' with `Binary' appended to `Rest'
%%   F(end_stream) re-enters `State' once more with a single space appended
%%                 and `explicit_end' set to false; if that still yields
%%                 `{incomplete, _}' the `?error' macro is invoked, otherwise
%%                 the result is returned as is
%% the six argument form is identical but threads the accumulator `Acc'
%% through to the state function.
-define(incomplete(State, Rest, Handler, Stack, Config),
    {incomplete,
        fun(Stream) when is_binary(Stream) ->
                State(<<Rest/binary, Stream/binary>>, Handler, Stack, Config);
           (end_stream) ->
                case State(<<Rest/binary, " ">>, Handler, Stack, Config#config{explicit_end=false}) of
                    {incomplete, _} -> ?error(State, Rest, Handler, Stack, Config);
                    Events -> Events
                end
        end
    }
).
-define(incomplete(State, Rest, Handler, Acc, Stack, Config),
    {incomplete,
        fun(Stream) when is_binary(Stream) ->
                State(<<Rest/binary, Stream/binary>>, Handler, Acc, Stack, Config);
           (end_stream) ->
                case State(<<Rest/binary, " ">>, Handler, Acc, Stack, Config#config{explicit_end=false}) of
                    {incomplete, _} -> ?error(State, Rest, Handler, Acc, Stack, Config);
                    Events -> Events
                end
        end
    }
).
-endif.
|
|
|
|
|
|
|
|
|
2013-03-02 14:56:32 -08:00
|
|
|
%% create a sequence accumulator (a plain list): either empty or holding the
%% single element `First'
new_seq() ->
    [].

new_seq(First) ->
    [First].
|
2011-09-19 23:06:37 -07:00
|
|
|
|
2013-03-02 15:12:29 -08:00
|
|
|
%% push onto the front of the accumulator `Seq'. a list `C' is pushed element
%% by element (so it ends up reversed in front of `Seq'); anything else is
%% pushed as a single element.
acc_seq(Seq, C) when is_list(C) ->
    lists:reverse(C, Seq);
acc_seq(Seq, C) ->
    [C | Seq].
|
2011-09-19 23:06:37 -07:00
|
|
|
|
2013-03-02 14:56:32 -08:00
|
|
|
%% finish an accumulator: restore the original order and convert the
%% characters to a binary with unicode:characters_to_binary/1
end_seq(Seq) ->
    InOrder = lists:reverse(Seq),
    unicode:characters_to_binary(InOrder).
|
2011-09-19 23:06:37 -07:00
|
|
|
|
|
|
|
|
2013-02-12 11:54:42 -08:00
|
|
|
%% feed one event, or a list of events in order, to the handler.
%%
%% the handler is a `{Module, State}' pair; a single event is passed to
%% `Module:handle_event/2' and the pair is returned with the new state. an
%% empty list leaves the handler untouched.
handle_event([Event | Rest], Handler, Config) ->
    Next = handle_event(Event, Handler, Config),
    handle_event(Rest, Next, Config);
handle_event([], Handler, _Config) ->
    Handler;
handle_event(Event, {Handler, State}, _Config) ->
    {Handler, Handler:handle_event(Event, State)}.
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% initial state: wait for input, divert a leading 16#ef byte to the byte
%% order mark check and treat everything else as the start of a value
start(<<>>, Handler, Stack, Config) ->
    ?incomplete(start, <<>>, Handler, Stack, Config);
start(<<16#ef, AfterLead/binary>>, Handler, Stack, Config) ->
    maybe_bom(AfterLead, Handler, Stack, Config);
start(Input, Handler, Stack, Config) ->
    value(Input, Handler, Stack, Config).
|
|
|
|
|
|
|
|
|
|
|
|
%% second byte of a possible utf8 byte order mark (16#ef 16#bb 16#bf); the
%% leading 16#ef has already been consumed by start/4
maybe_bom(<<16#bb, Rest/binary>>, Handler, Stack, Config) ->
    definitely_bom(Rest, Handler, Stack, Config);
maybe_bom(<<>>, Handler, Stack, Config) ->
    %% out of input: resume from start/4 with the consumed byte put back
    ?incomplete(start, <<16#ef>>, Handler, Stack, Config);
maybe_bom(Bin, Handler, Stack, Config) ->
    %% not a bom: hand the error macro the consumed byte followed by the
    %% offending input, as the other states do with their remaining input
    ?error(start, <<16#ef, Bin/binary>>, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% third byte of a utf8 byte order mark (16#ef 16#bb 16#bf); the first two
%% bytes have already been consumed by start/4 and maybe_bom/4
definitely_bom(<<16#bf, Rest/binary>>, Handler, Stack, Config) ->
    value(Rest, Handler, Stack, Config);
definitely_bom(<<>>, Handler, Stack, Config) ->
    %% out of input: resume from start/4 with the consumed bytes put back
    ?incomplete(start, <<16#ef, 16#bb>>, Handler, Stack, Config);
definitely_bom(Bin, Handler, Stack, Config) ->
    %% not a bom: hand the error macro the consumed bytes followed by the
    %% offending input, as the other states do with their remaining input
    ?error(start, <<16#ef, 16#bb, Bin/binary>>, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% value state: dispatch on the first byte of a json value
%%
%% end of input: return a continuation that re-enters this state
value(<<>>, Handler, Stack, Config) ->
    ?incomplete(value, <<>>, Handler, Stack, Config);
%% leading whitespace is skipped
value(<<Ws, Tail/binary>>, Handler, Stack, Config) when ?is_whitespace(Ws) ->
    value(Tail, Handler, Stack, Config);
%% strings start with an empty accumulator; a single quoted string is only
%% accepted when configured and is marked with `single_quote' on the stack
value(<<?doublequote, Tail/binary>>, Handler, Stack, Config) ->
    string(Tail, Handler, new_seq(), Stack, Config);
value(<<?singlequote, Tail/binary>>, Handler, Stack, Config = #config{single_quoted_strings=true}) ->
    string(Tail, Handler, new_seq(), [single_quote|Stack], Config);
%% literals: the first letter is consumed here, the remainder is handed to
%% true/4, false/4 and null/4
value(<<$t, Tail/binary>>, Handler, Stack, Config) ->
    true(Tail, Handler, Stack, Config);
value(<<$f, Tail/binary>>, Handler, Stack, Config) ->
    false(Tail, Handler, Stack, Config);
value(<<$n, Tail/binary>>, Handler, Stack, Config) ->
    null(Tail, Handler, Stack, Config);
%% numbers: the accumulator is seeded with the character just consumed
value(<<?negative, Tail/binary>>, Handler, Stack, Config) ->
    negative(Tail, Handler, new_seq($-), Stack, Config);
value(<<?zero, Tail/binary>>, Handler, Stack, Config) ->
    zero(Tail, Handler, new_seq($0), Stack, Config);
value(<<Digit, Tail/binary>>, Handler, Stack, Config) when ?is_nonzero(Digit) ->
    integer(Tail, Handler, new_seq(Digit), Stack, Config);
%% containers: emit the start event and push the matching stack marker
value(<<?start_object, Tail/binary>>, Handler, Stack, Config) ->
    object(Tail, handle_event(start_object, Handler, Config), [key|Stack], Config);
value(<<?start_array, Tail/binary>>, Handler, Stack, Config) ->
    array(Tail, handle_event(start_array, Handler, Config), [array|Stack], Config);
%% comments, when enabled: `value' is pushed before entering comment/4
%% (presumably so that state knows where to resume -- comment/4 is defined
%% elsewhere)
value(<<?solidus, Tail/binary>>, Handler, Stack, Config=#config{comments=true}) ->
    comment(Tail, Handler, [value|Stack], Config);
%% anything else cannot start a value
value(Input, Handler, Stack, Config) ->
    ?error(value, Input, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% object state: entered right after an opening brace, so either the first
%% key or the closing brace is expected
%%
%% end of input: return a continuation that re-enters this state
object(<<>>, Handler, Stack, Config) ->
    ?incomplete(object, <<>>, Handler, Stack, Config);
%% whitespace is skipped
object(<<Ws, Tail/binary>>, Handler, Stack, Config) when ?is_whitespace(Ws) ->
    object(Tail, Handler, Stack, Config);
%% closing brace of an empty object: only valid while `key' is on top of the
%% stack; emit end_object and pop the marker
object(<<?end_object, Tail/binary>>, Handler, [key|Outer], Config) ->
    maybe_done(Tail, handle_event(end_object, Handler, Config), Outer, Config);
%% key strings; single quoted ones only when configured, marked with
%% `single_quote' on the stack
object(<<?doublequote, Tail/binary>>, Handler, Stack, Config) ->
    string(Tail, Handler, new_seq(), Stack, Config);
object(<<?singlequote, Tail/binary>>, Handler, Stack, Config = #config{single_quoted_strings=true}) ->
    string(Tail, Handler, new_seq(), [single_quote|Stack], Config);
%% comments, when enabled: `object' is pushed before entering comment/4
object(<<?solidus, Tail/binary>>, Handler, Stack, Config=#config{comments=true}) ->
    comment(Tail, Handler, [object|Stack], Config);
%% anything else is an error
object(Input, Handler, Stack, Config) ->
    ?error(object, Input, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% array state: entered right after an opening bracket, so either the first
%% element or the closing bracket is expected
%%
%% end of input: return a continuation that re-enters this state
array(<<>>, Handler, Stack, Config) ->
    ?incomplete(array, <<>>, Handler, Stack, Config);
%% whitespace is skipped
array(<<Ws, Tail/binary>>, Handler, Stack, Config) when ?is_whitespace(Ws) ->
    array(Tail, Handler, Stack, Config);
%% closing bracket of an empty array: only valid while `array' is on top of
%% the stack; emit end_array and pop the marker
array(<<?end_array, Tail/binary>>, Handler, [array|Outer], Config) ->
    maybe_done(Tail, handle_event(end_array, Handler, Config), Outer, Config);
%% comments, when enabled: `array' is pushed before entering comment/4
array(<<?solidus, Tail/binary>>, Handler, Stack, Config=#config{comments=true}) ->
    comment(Tail, Handler, [array|Stack], Config);
%% everything else is treated as the first element and left to value/4
array(Input, Handler, Stack, Config) ->
    value(Input, Handler, Stack, Config).
|
|
|
|
|
|
|
|
|
|
|
|
%% colon state: a key has been read and the separating colon is expected
%%
%% end of input: return a continuation that re-enters this state
colon(<<>>, Handler, Stack, Config) ->
    ?incomplete(colon, <<>>, Handler, Stack, Config);
%% whitespace is skipped
colon(<<Ws, Tail/binary>>, Handler, Stack, Config) when ?is_whitespace(Ws) ->
    colon(Tail, Handler, Stack, Config);
%% the colon itself: only valid while `key' is on top of the stack; the
%% marker is swapped for `object' and the member's value is read next
colon(<<?colon, Tail/binary>>, Handler, [key|Outer], Config) ->
    value(Tail, Handler, [object|Outer], Config);
%% comments, when enabled: `colon' is pushed before entering comment/4
colon(<<?solidus, Tail/binary>>, Handler, Stack, Config=#config{comments=true}) ->
    comment(Tail, Handler, [colon|Stack], Config);
%% anything else is an error
colon(Input, Handler, Stack, Config) ->
    ?error(colon, Input, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% key state: an object key (a string) is expected
%%
%% end of input: return a continuation that re-enters this state
key(<<>>, Handler, Stack, Config) ->
    ?incomplete(key, <<>>, Handler, Stack, Config);
%% whitespace is skipped
key(<<Ws, Tail/binary>>, Handler, Stack, Config) when ?is_whitespace(Ws) ->
    key(Tail, Handler, Stack, Config);
%% key strings; single quoted ones only when configured, marked with
%% `single_quote' on the stack
key(<<?doublequote, Tail/binary>>, Handler, Stack, Config) ->
    string(Tail, Handler, new_seq(), Stack, Config);
key(<<?singlequote, Tail/binary>>, Handler, Stack, Config = #config{single_quoted_strings=true}) ->
    string(Tail, Handler, new_seq(), [single_quote|Stack], Config);
%% comments, when enabled: `key' is pushed before entering comment/4
key(<<?solidus, Tail/binary>>, Handler, Stack, Config=#config{comments=true}) ->
    comment(Tail, Handler, [key|Stack], Config);
%% anything else is an error
key(Input, Handler, Stack, Config) ->
    ?error(key, Input, Handler, Stack, Config).
|
2011-09-19 23:06:37 -07:00
|
|
|
|
|
|
|
|
2013-02-25 17:24:06 -08:00
|
|
|
%% explicitly whitelist ascii set for better efficiency (seriously, it's worth
|
|
|
|
%% almost a 20% increase)
|
|
|
|
string(<<32, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 32), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<33, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 33), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<?doublequote, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
|
|
|
case Stack of
|
|
|
|
[key|_] ->
|
2013-03-02 14:56:32 -08:00
|
|
|
colon(Rest, handle_event({key, end_seq(Acc)}, Handler, Config), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
[single_quote|_] ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler,acc_seq(Acc, maybe_replace(?doublequote, Config)), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
_ ->
|
2013-03-02 14:56:32 -08:00
|
|
|
maybe_done(Rest, handle_event({string, end_seq(Acc)}, Handler, Config), Stack, Config)
|
2013-02-25 17:24:06 -08:00
|
|
|
end;
|
|
|
|
string(<<35, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 35), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<36, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 36), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<37, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 37), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<38, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 38), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<?singlequote, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
|
|
|
case Stack of
|
|
|
|
[single_quote, key|S] ->
|
2013-03-02 14:56:32 -08:00
|
|
|
colon(Rest, handle_event({key, end_seq(Acc)}, Handler, Config), [key|S], Config)
|
2013-02-25 17:24:06 -08:00
|
|
|
; [single_quote|S] ->
|
2013-03-02 14:56:32 -08:00
|
|
|
maybe_done(Rest, handle_event({string, end_seq(Acc)}, Handler, Config), S, Config)
|
2013-02-25 17:24:06 -08:00
|
|
|
; _ ->
|
2013-03-03 15:27:39 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, ?singlequote), Stack, Config)
|
2013-02-25 17:24:06 -08:00
|
|
|
end;
|
|
|
|
string(<<40, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 40), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<41, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 41), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<42, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 42), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<43, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 43), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<44, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 44), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<45, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 45), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<46, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 46), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<?solidus, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, maybe_replace(?solidus, Config)), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<48, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 48), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<49, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 49), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<50, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 50), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<51, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 51), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<52, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 52), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<53, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 53), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<54, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 54), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<55, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 55), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<56, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 56), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<57, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 57), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<58, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 58), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<59, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 59), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<60, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 60), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<61, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 61), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<62, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 62), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<63, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 63), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<64, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 64), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<65, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 65), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<66, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 66), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<67, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 67), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<68, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 68), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<69, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 69), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<70, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 70), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<71, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 71), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<72, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 72), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<73, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 73), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<74, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 74), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<75, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 75), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<76, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 76), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<77, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 77), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<78, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 78), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<79, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 79), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<80, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 80), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<81, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 81), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<82, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 82), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<83, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 83), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<84, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 84), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<85, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 85), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<86, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 86), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<87, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 87), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<88, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 88), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<89, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 89), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<90, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 90), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<91, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 91), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<?rsolidus/utf8, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-02-27 19:41:22 -08:00
|
|
|
unescape(Rest, Handler, Acc, Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<93, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 93), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<94, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 94), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<95, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 95), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<96, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 96), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<97, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 97), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<98, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 98), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<99, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 99), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<100, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 100), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<101, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 101), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<102, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 102), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<103, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 103), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<104, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 104), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<105, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 105), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<106, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 106), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<107, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 107), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<108, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 108), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<109, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 109), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<110, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 110), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<111, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 111), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<112, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 112), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<113, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 113), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<114, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 114), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<115, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 115), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<116, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 116), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<117, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 117), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<118, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 118), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<119, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 119), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<120, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 120), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<121, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 121), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<122, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 122), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<123, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 123), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<124, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 124), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<125, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 125), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<126, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 126), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<127, Rest/binary>>, Handler, Acc, Stack, Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 127), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#20, X < 16#2028 ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X == 16#2028; X == 16#2029 ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, maybe_replace(X, Config)), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X > 16#2029, X < 16#d800 ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X > 16#dfff, X < 16#fdd0 ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X > 16#fdef, X < 16#fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#10000, X < 16#1fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#20000, X < 16#2fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#30000, X < 16#3fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#40000, X < 16#4fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#50000, X < 16#5fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#60000, X < 16#6fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#70000, X < 16#7fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#80000, X < 16#8fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#90000, X < 16#9fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#a0000, X < 16#afffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#b0000, X < 16#bfffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#c0000, X < 16#cfffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#d0000, X < 16#dfffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#e0000, X < 16#efffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#f0000, X < 16#ffffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<X/utf8, Rest/binary>>, Handler, Acc, Stack, Config) when X >= 16#100000, X < 16#10fffe ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, X), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
%% surrogates
|
|
|
|
string(<<237, X, _, Rest/binary>>, Handler, Acc, Stack, #config{replaced_bad_utf8=true} = Config)
|
|
|
|
when X >= 160 ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 16#fffd), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
%% u+fffe and u+ffff for R14BXX
|
|
|
|
string(<<239, 191, X, Rest/binary>>, Handler, Acc, Stack, #config{replaced_bad_utf8=true} = Config)
|
|
|
|
when X == 190; X == 191 ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 16#fffd), Stack, Config);
|
2013-02-25 17:37:49 -08:00
|
|
|
%% u+xfffe, u+xffff, control codes and other noncharacters
|
2013-02-25 17:24:06 -08:00
|
|
|
string(<<_/utf8, Rest/binary>>, Handler, Acc, Stack, #config{replaced_bad_utf8=true} = Config) ->
|
2013-03-02 14:56:32 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 16#fffd), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
%% overlong encodings and missing continuations of a 2 byte sequence
|
|
|
|
string(<<X, Rest/binary>>, Handler, Acc, Stack, #config{replaced_bad_utf8=true} = Config)
|
|
|
|
when X >= 192, X =< 223 ->
|
|
|
|
strip_continuations(Rest, Handler, Acc, Stack, Config, 1);
|
|
|
|
%% overlong encodings and missing continuations of a 3 byte sequence
|
|
|
|
string(<<X, Rest/binary>>, Handler, Acc, Stack, #config{replaced_bad_utf8=true} = Config)
|
|
|
|
when X >= 224, X =< 239 ->
|
|
|
|
strip_continuations(Rest, Handler, Acc, Stack, Config, 2);
|
|
|
|
%% overlong encodings and missing continuations of a 4 byte sequence
|
|
|
|
string(<<X, Rest/binary>>, Handler, Acc, Stack, #config{replaced_bad_utf8=true} = Config)
|
|
|
|
when X >= 240, X =< 247 ->
|
|
|
|
strip_continuations(Rest, Handler, Acc, Stack, Config, 3);
|
|
|
|
%% incompletes and unexpected bytes, including orphan continuations
|
2013-03-02 15:48:26 -08:00
|
|
|
string(<<C, Rest/binary>>, Handler, Acc, Stack, #config{replaced_bad_utf8=true} = Config) ->
|
2013-03-03 15:19:02 -08:00
|
|
|
string(Rest, Handler, acc_seq(Acc, 16#fffd), Stack, Config);
|
2013-02-25 17:24:06 -08:00
|
|
|
string(Bin, Handler, Acc, Stack, Config) ->
|
|
|
|
case partial_utf(Bin) of
|
|
|
|
true -> ?incomplete(string, Bin, Handler, Acc, Stack, Config);
|
2013-03-03 15:23:17 -08:00
|
|
|
false -> ?error(string, Bin, Handler, Acc, Stack, Config)
|
2013-02-25 17:24:06 -08:00
|
|
|
end.
|
|
|
|
|
|
|
|
|
2013-02-24 01:07:16 -08:00
|
|
|
%% string appends its output to the term at the top of the stack. for
|
|
|
|
%% efficiency the strings are built in reverse order and reversed before
|
|
|
|
%% being added to the output stream
|
|
|
|
%% partial_utf/1 answers whether a binary that did not decode as a complete
%% utf8 codepoint could still turn into one once more input arrives. naive
%% detection of partial codepoints is not enough when parsing strings, so the
%% byte ranges of each prefix are checked explicitly.
%%
%% returns `true' for the empty binary and for a lead byte followed by zero,
%% one or two continuation bytes (16#80..16#bf) where the lead byte still
%% expects more; returns `false' for everything else
partial_utf(<<>>) ->
    true;
%% lone lead byte of a 2, 3 or 4 byte sequence
partial_utf(<<Lead>>) ->
    Lead >= 16#c2 andalso Lead =< 16#f4;
%% lead byte of a 3 or 4 byte sequence plus one continuation
partial_utf(<<Lead, Cont>>) ->
    Lead >= 16#e0 andalso Lead =< 16#f4
        andalso Cont >= 16#80 andalso Cont =< 16#bf;
%% lead byte of a 4 byte sequence plus two continuations
partial_utf(<<Lead, Cont1, Cont2>>) ->
    Lead >= 16#f0 andalso Lead =< 16#f4
        andalso Cont1 >= 16#80 andalso Cont1 =< 16#bf
        andalso Cont2 >= 16#80 andalso Cont2 =< 16#bf;
partial_utf(_) ->
    false.
|
|
|
|
|
|
|
|
|
|
|
|
%% strip_continuations/6 discards the continuation bytes that trail a bad utf8
%% lead byte, guarding against both too short and overlong sequences. the last
%% argument is the maximum number of continuation bytes still to be stripped.
%%
%% once the budget is exhausted, or a byte that is not a continuation shows up,
%% a single u+fffd is accumulated and control returns to string/5.
%%
%% if the input ends before the budget is used up, a magic lead byte is
%% reinserted into the stream (192, 224 or 240 for 1, 2 or 3 outstanding
%% continuations) so that resuming in the string state gets back to the same
%% place without any extra machinery
strip_continuations(Rest, Handler, Acc, Stack, Config, 0) ->
    string(Rest, Handler, acc_seq(Acc, 16#fffd), Stack, Config);
%% a continuation byte has the bit layout 10xxxxxx, i.e. 128..191
strip_continuations(<<2#10:2, _:6, Rest/binary>>, Handler, Acc, Stack, Config, Remaining) ->
    strip_continuations(Rest, Handler, Acc, Stack, Config, Remaining - 1);
%% incomplete
strip_continuations(<<>>, Handler, Acc, Stack, Config, Remaining) ->
    case Remaining of
        1 -> ?incomplete(string, <<192>>, Handler, Acc, Stack, Config);
        2 -> ?incomplete(string, <<224>>, Handler, Acc, Stack, Config);
        3 -> ?incomplete(string, <<240>>, Handler, Acc, Stack, Config)
    end;
%% not a continuation byte, dispatch back to string
strip_continuations(Rest, Handler, Acc, Stack, Config, _Remaining) ->
    string(Rest, Handler, acc_seq(Acc, 16#fffd), Stack, Config).
|
2013-02-25 17:24:06 -08:00
|
|
|
|
|
|
|
|
2013-02-27 19:41:22 -08:00
|
|
|
%% unescape/5 handles the text that follows a reverse solidus inside a string
%% (every resume and error path below re-prepends `?rsolidus' before handing
%% the input back to the string state).
%%
%% arguments: the remaining input, the handler, the string accumulator, the
%% parser stack and the `#config{}' record.
%%
%% on a recognised escape the decoded character (passed through
%% maybe_replace/2 where applicable) is accumulated and parsing continues in
%% string/5. truncated escapes produce `?incomplete', anything else produces
%% `?error' unless `ignored_bad_escapes' is set, in which case the reverse
%% solidus is kept literally

%% single character escapes
unescape(<<$b, Rest/binary>>, Handler, Acc, Stack, Config) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace($\b, Config)), Stack, Config);
unescape(<<$f, Rest/binary>>, Handler, Acc, Stack, Config) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace($\f, Config)), Stack, Config);
unescape(<<$n, Rest/binary>>, Handler, Acc, Stack, Config) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace($\n, Config)), Stack, Config);
unescape(<<$r, Rest/binary>>, Handler, Acc, Stack, Config) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace($\r, Config)), Stack, Config);
unescape(<<$t, Rest/binary>>, Handler, Acc, Stack, Config) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace($\t, Config)), Stack, Config);
unescape(<<?rsolidus, Rest/binary>>, Handler, Acc, Stack, Config) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace($\\, Config)), Stack, Config);
unescape(<<?solidus, Rest/binary>>, Handler, Acc, Stack, Config) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace($/, Config)), Stack, Config);
unescape(<<?doublequote, Rest/binary>>, Handler, Acc, Stack, Config) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace($\", Config)), Stack, Config);
%% an escaped single quote is only recognised with single_quoted_strings
unescape(<<?singlequote, Rest/binary>>, Handler, Acc, Stack, Config=#config{single_quoted_strings=true}) ->
    string(Rest, Handler, acc_seq(Acc, maybe_replace(?singlequote, Config)), Stack, Config);
%% well formed surrogate pair: a high surrogate (d800..dbff) followed by an
%% escaped low surrogate (dc00..dfff), combined into one codepoint
unescape(<<$u, $d, A, B, C, ?rsolidus, $u, $d, X, Y, Z, Rest/binary>>, Handler, Acc, Stack, Config)
        when (A == $8 orelse A == $9 orelse A == $a orelse A == $b),
            (X == $c orelse X == $d orelse X == $e orelse X == $f),
            ?is_hex(B), ?is_hex(C), ?is_hex(Y), ?is_hex(Z)
        ->
    High = erlang:list_to_integer([$d, A, B, C], 16),
    Low = erlang:list_to_integer([$d, X, Y, Z], 16),
    Codepoint = (High - 16#d800) * 16#400 + (Low - 16#dc00) + 16#10000,
    string(Rest, Handler, acc_seq(Acc, Codepoint), Stack, Config);
%% high surrogate followed by an escape that is not a low surrogate: both
%% escapes are replaced, or the whole sequence is reported as an error
unescape(<<$u, $d, A, B, C, ?rsolidus, $u, W, X, Y, Z, Rest/binary>>, Handler, Acc, Stack, Config)
        when (A == $8 orelse A == $9 orelse A == $a orelse A == $b),
            ?is_hex(B), ?is_hex(C), ?is_hex(W), ?is_hex(X), ?is_hex(Y), ?is_hex(Z)
        ->
    case Config#config.replaced_bad_utf8 of
        true ->
            string(Rest, Handler, acc_seq(Acc, [16#fffd, 16#fffd]), Stack, Config);
        false ->
            %% same shape as every other error in this function: the `string'
            %% state plus the original text including its leading reverse
            %% solidus
            ?error(string, <<?rsolidus, $u, $d, A, B, C, ?rsolidus, $u, W, X, Y, Z, Rest/binary>>, Handler, Acc, Stack, Config)
    end;
%% high surrogate followed by a reverse solidus whose escape is not (yet) a
%% complete \uXXXX: wait for more input
%% NOTE(review): this clause does not bound the size of Rest, so a long tail
%% that can never become a \uXXXX escape is also reported as incomplete --
%% confirm whether that is intended
unescape(<<$u, $d, A, B, C, ?rsolidus, Rest/binary>>, Handler, Acc, Stack, Config)
        when (A == $8 orelse A == $9 orelse A == $a orelse A == $b) andalso
            ?is_hex(B), ?is_hex(C)
        ->
    ?incomplete(string, <<?rsolidus, $u, $d, A, B, C, ?rsolidus, Rest/binary>>, Handler, Acc, Stack, Config);
%% high surrogate at the very end of the input: wait for its partner
unescape(<<$u, $d, A, B, C>>, Handler, Acc, Stack, Config)
        when (A == $8 orelse A == $9 orelse A == $a orelse A == $b) andalso
            ?is_hex(B), ?is_hex(C)
        ->
    ?incomplete(string, <<?rsolidus, $u, $d, A, B, C>>, Handler, Acc, Stack, Config);
%% any other \uXXXX escape; codepoints in the surrogate range that get here are
%% unpaired and are either replaced or rejected
unescape(<<$u, A, B, C, D, Rest/binary>>, Handler, Acc, Stack, Config)
        when ?is_hex(A), ?is_hex(B), ?is_hex(C), ?is_hex(D) ->
    case erlang:list_to_integer([A, B, C, D], 16) of
        Codepoint when Codepoint < 16#d800; Codepoint > 16#dfff ->
            string(Rest, Handler, acc_seq(Acc, maybe_replace(Codepoint, Config)), Stack, Config);
        _ when Config#config.replaced_bad_utf8 ->
            string(Rest, Handler, acc_seq(Acc, 16#fffd), Stack, Config);
        _ ->
            ?error(string, <<?rsolidus, $u, A, B, C, D, Rest/binary>>, Handler, Acc, Stack, Config)
    end;
%% unrecognised escape with ignored_bad_escapes: keep the reverse solidus as a
%% literal character and let string/5 deal with whatever follows
unescape(Bin, Handler, Acc, Stack, Config=#config{ignored_bad_escapes=true}) ->
    string(Bin, Handler, acc_seq(Acc, ?rsolidus), Stack, Config);
%% unrecognised escape: incomplete if it is a prefix of a \uXXXX escape (or
%% empty), an error otherwise
unescape(Bin, Handler, Acc, Stack, Config) ->
    case is_partial_escape(Bin) of
        true -> ?incomplete(string, <<?rsolidus/utf8, Bin/binary>>, Handler, Acc, Stack, Config);
        false -> ?error(string, <<?rsolidus, Bin/binary>>, Handler, Acc, Stack, Config)
    end.
|
2012-11-21 23:04:14 -08:00
|
|
|
|
2012-03-27 14:44:02 -07:00
|
|
|
|
2013-02-27 19:41:22 -08:00
|
|
|
%% is_partial_escape/1 reports whether the text after a reverse solidus is a
%% proper prefix of a \uXXXX escape: nothing at all, a bare `u', or `u'
%% followed by one to three hex digits. anything else yields `false'
is_partial_escape(<<>>) ->
    true;
is_partial_escape(<<"u">>) ->
    true;
is_partial_escape(<<"u", H1>>) when ?is_hex(H1) ->
    true;
is_partial_escape(<<"u", H1, H2>>) when ?is_hex(H1), ?is_hex(H2) ->
    true;
is_partial_escape(<<"u", H1, H2, H3>>) when ?is_hex(H1), ?is_hex(H2), ?is_hex(H3) ->
    true;
is_partial_escape(_) ->
    false.
|
|
|
|
|
|
|
|
|
|
|
|
%% maybe_replace/2 maps a single codepoint to the list of codepoints that
%% should be accumulated for it, depending on the configuration:
%%
%%   * dirty_strings: integers are passed through untouched
%%   * escaped_strings: control characters, the double quote, the reverse
%%     solidus and (with escaped_forward_slashes) the solidus are turned back
%%     into their json escape sequences; u+2028 and u+2029 are escaped unless
%%     unescaped_jsonp is set
%%   * otherwise: the codepoint is returned as a one element list
%%
%% clause order matters: the dirty_strings clause must win over everything else
maybe_replace(Codepoint, #config{dirty_strings=true}) when is_integer(Codepoint) ->
    [Codepoint];
maybe_replace($\b, #config{escaped_strings=true}) ->
    "\\b";
maybe_replace($\t, #config{escaped_strings=true}) ->
    "\\t";
maybe_replace($\n, #config{escaped_strings=true}) ->
    "\\n";
maybe_replace($\f, #config{escaped_strings=true}) ->
    "\\f";
maybe_replace($\r, #config{escaped_strings=true}) ->
    "\\r";
maybe_replace($\", #config{escaped_strings=true}) ->
    "\\\"";
maybe_replace($/, Config=#config{escaped_strings=true}) ->
    case Config#config.escaped_forward_slashes of
        true -> "\\/";
        false -> "/"
    end;
maybe_replace($\\, #config{escaped_strings=true}) ->
    "\\\\";
%% line and paragraph separators
maybe_replace(Codepoint, Config=#config{escaped_strings=true})
        when Codepoint == 16#2028; Codepoint == 16#2029 ->
    case Config#config.unescaped_jsonp of
        true -> [Codepoint];
        false -> jsx_utils:json_escape_sequence(Codepoint)
    end;
%% remaining control characters
maybe_replace(Codepoint, #config{escaped_strings=true}) when Codepoint < 32 ->
    jsx_utils:json_escape_sequence(Codepoint);
maybe_replace(Codepoint, _Config) ->
    [Codepoint].
|
2012-03-31 20:38:51 -07:00
|
|
|
|
|
|
|
|
2011-08-31 18:52:01 -07:00
|
|
|
%% like strings, numbers are collected in an intermediate accumulator before
|
|
|
|
%% being emitted to the callback handler
|
2013-03-02 14:50:40 -08:00
|
|
|
%% negative/5 is the number state entered once a leading minus sign has been
%% accumulated. a `0' moves on to zero/5, any other digit to integer/5. if the
%% input ends while the accumulator holds nothing but the minus sign the
%% decoder reports incomplete; every other input is an error
negative(<<$0, Tail/binary>>, Handler, Acc, Stack, Config) ->
    zero(Tail, Handler, acc_seq(Acc, $0), Stack, Config);
negative(<<Digit, Tail/binary>>, Handler, Acc, Stack, Config) when ?is_nonzero(Digit) ->
    integer(Tail, Handler, acc_seq(Acc, Digit), Stack, Config);
%% resumes in the value state with the minus sign put back on the stream
negative(<<>>, Handler, [?negative], Stack, Config) ->
    ?incomplete(value, <<?negative>>, Handler, Stack, Config);
negative(Other, Handler, Acc, Stack, Config) ->
    ?error(value, <<?negative, Other/binary>>, Handler, Acc, Stack, Config).
|
2013-03-02 14:50:40 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% zero/5 is the number state after a leading `0' (optionally preceded by a
%% minus sign) has been accumulated. only a decimal point or an exponent marker
%% may extend the number; anything else is handed to finish_number/5 tagged as
%% `zero'
zero(<<?decimalpoint, Tail/binary>>, Handler, Acc, Stack, Config) ->
    decimal(Tail, Handler, acc_seq(Acc, ?decimalpoint), Stack, Config);
%% an exponent directly after the integer part: ".0e" is accumulated so the
%% text always carries a fractional part before the exponent
zero(<<$e, Tail/binary>>, Handler, Acc, Stack, Config) ->
    e(Tail, Handler, acc_seq(Acc, ".0e"), Stack, Config);
zero(<<$E, Tail/binary>>, Handler, Acc, Stack, Config) ->
    e(Tail, Handler, acc_seq(Acc, ".0e"), Stack, Config);
%% end of input at the top level without explicit_end: the number is complete
zero(<<>>, Handler, Acc, [], Config=#config{explicit_end=false}) ->
    finish_number(<<>>, Handler, {zero, Acc}, [], Config);
%% end of input anywhere else: resume in the value state with the accumulated
%% text put back on the stream
zero(<<>>, Handler, Acc, Stack, Config) ->
    ?incomplete(value, (end_seq(Acc)), Handler, Stack, Config);
zero(Other, Handler, Acc, Stack, Config) ->
    finish_number(Other, Handler, {zero, Acc}, Stack, Config).
|
|
|
|
|
|
|
|
|
|
|
|
%% integer/5 accumulates the digits of an integer part that starts with a
%% nonzero digit. a decimal point switches to decimal/5, an exponent marker to
%% e/5, and any other input (including end of input) is passed to
%% finish_number/5 tagged as `integer'
integer(<<Digit, Tail/binary>>, Handler, Acc, Stack, Config)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    integer(Tail, Handler, acc_seq(Acc, Digit), Stack, Config);
integer(<<?decimalpoint, Tail/binary>>, Handler, Acc, Stack, Config) ->
    decimal(Tail, Handler, acc_seq(Acc, ?decimalpoint), Stack, Config);
%% an exponent directly after the integer part: ".0e" is accumulated so the
%% text always carries a fractional part before the exponent
integer(<<$e, Tail/binary>>, Handler, Acc, Stack, Config) ->
    e(Tail, Handler, acc_seq(Acc, ".0e"), Stack, Config);
integer(<<$E, Tail/binary>>, Handler, Acc, Stack, Config) ->
    e(Tail, Handler, acc_seq(Acc, ".0e"), Stack, Config);
integer(Other, Handler, Acc, Stack, Config) ->
    finish_number(Other, Handler, {integer, Acc}, Stack, Config).
|
|
|
|
|
|
|
|
|
|
|
|
%% decimal/5 accumulates the digits of the fractional part of a number. an
%% exponent marker is only accepted once at least one fractional digit has been
%% seen; any other input is passed to finish_number/5 tagged as `decimal'
decimal(<<Digit, Tail/binary>>, Handler, Acc, Stack, Config)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    decimal(Tail, Handler, acc_seq(Acc, Digit), Stack, Config);
%% the most recently accumulated character is the decimal point, so there are
%% no fractional digits yet and an exponent is not allowed here
decimal(<<Marker, Tail/binary>>, Handler, [?decimalpoint|_] = Acc, Stack, Config)
        when Marker =:= $e; Marker =:= $E ->
    ?error(decimal, <<Marker, Tail/binary>>, Handler, Acc, Stack, Config);
%% the exponent marker is always accumulated as a lowercase `e'
decimal(<<Marker, Tail/binary>>, Handler, Acc, Stack, Config)
        when Marker =:= $e; Marker =:= $E ->
    e(Tail, Handler, acc_seq(Acc, $e), Stack, Config);
decimal(Other, Handler, Acc, Stack, Config) ->
    finish_number(Other, Handler, {decimal, Acc}, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
2013-03-02 14:50:40 -08:00
|
|
|
%% e/5 is the number state right after an exponent marker has been
%% accumulated. a digit starts the exponent (exp/5), a sign moves on to ex/5.
%% at end of input the `e' is taken back off the accumulator and put back on
%% the stream so parsing can resume in the decimal state; anything else is an
%% error
e(<<Digit, Tail/binary>>, Handler, Acc, Stack, Config)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    exp(Tail, Handler, acc_seq(Acc, Digit), Stack, Config);
e(<<Sign, Tail/binary>>, Handler, Acc, Stack, Config)
        when Sign =:= ?positive; Sign =:= ?negative ->
    ex(Tail, Handler, acc_seq(Acc, Sign), Stack, Config);
e(<<>>, Handler, [$e|Acc], Stack, Config) ->
    ?incomplete(decimal, <<$e>>, Handler, Acc, Stack, Config);
e(Other, Handler, Acc, Stack, Config) ->
    ?error(decimal, <<$e, Other/binary>>, Handler, Acc, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
2013-03-02 14:50:40 -08:00
|
|
|
%% ex/5 is the number state after an exponent marker and its sign have been
%% accumulated; at least one digit must follow. at end of input both the sign
%% and the `e' are taken back off the accumulator and put back on the stream so
%% parsing can resume in the decimal state; anything else is an error
ex(<<Digit, Tail/binary>>, Handler, Acc, Stack, Config)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    exp(Tail, Handler, acc_seq(Acc, Digit), Stack, Config);
ex(<<>>, Handler, [Sign, $e|Acc], Stack, Config) ->
    ?incomplete(decimal, <<$e, Sign/utf8>>, Handler, Acc, Stack, Config);
ex(Other, Handler, Acc, Stack, Config) ->
    ?error(decimal, <<$e, Other/binary>>, Handler, Acc, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
2013-03-02 14:50:40 -08:00
|
|
|
%% exp/5 accumulates the remaining digits of an exponent. the first input that
%% is not a digit (including end of input) is passed to finish_number/5 tagged
%% as `exp'
exp(<<Digit, Tail/binary>>, Handler, Acc, Stack, Config)
        when Digit =:= ?zero; ?is_nonzero(Digit) ->
    exp(Tail, Handler, acc_seq(Acc, Digit), Stack, Config);
exp(Other, Handler, Acc, Stack, Config) ->
    finish_number(Other, Handler, {exp, Acc}, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
2013-03-02 14:50:40 -08:00
|
|
|
%% finish_number/5 is called by the number states when they meet input that
%% cannot extend the number. the accumulator argument is `{NumType, Acc}' where
%% NumType is one of `zero', `integer', `decimal' or `exp' and Acc is the
%% accumulated text of the number.
%%
%% if the input is a legal terminator for the current context the number is
%% formatted with format_number/1, emitted through handle_event/3 (together
%% with a closing event where applicable) and parsing moves on to the next
%% state. end of input yields `?incomplete' in the originating number state,
%% anything else yields `?error'

%% top level value without explicit_end: the number ends wherever its text ends
finish_number(Rest, Handler, Acc, [], Config=#config{explicit_end=false}) ->
    maybe_done(Rest, handle_event(format_number(Acc), Handler, Config), [], Config);
finish_number(<<?end_object, Rest/binary>>, Handler, Acc, [object|Stack], Config) ->
    maybe_done(Rest, handle_event([format_number(Acc), end_object], Handler, Config), Stack, Config);
finish_number(<<?end_array, Rest/binary>>, Handler, Acc, [array|Stack], Config) ->
    maybe_done(Rest, handle_event([format_number(Acc), end_array], Handler, Config), Stack, Config);
finish_number(<<?comma, Rest/binary>>, Handler, Acc, [object|Stack], Config) ->
    key(Rest, handle_event(format_number(Acc), Handler, Config), [key|Stack], Config);
finish_number(<<?comma, Rest/binary>>, Handler, Acc, [array|Stack], Config) ->
    value(Rest, handle_event(format_number(Acc), Handler, Config), [array|Stack], Config);
finish_number(<<S, Rest/binary>>, Handler, Acc, Stack, Config) when ?is_whitespace(S) ->
    maybe_done(Rest, handle_event(format_number(Acc), Handler, Config), Stack, Config);
finish_number(<<?solidus, Rest/binary>>, Handler, Acc, Stack, Config=#config{comments=true}) ->
    comment(Rest, handle_event(format_number(Acc), Handler, Config), [maybe_done|Stack], Config);
%% end of input: resume in the state the number was in.
%% NOTE(review): the state is written as a literal atom in every branch instead
%% of passing NumType through -- presumably the macros need a literal; confirm
%% against the macro definitions before simplifying
finish_number(<<>>, Handler, {NumType, Acc}, Stack, Config) ->
    case NumType of
        zero -> ?incomplete(zero, <<>>, Handler, Acc, Stack, Config);
        integer -> ?incomplete(integer, <<>>, Handler, Acc, Stack, Config);
        decimal -> ?incomplete(decimal, <<>>, Handler, Acc, Stack, Config);
        exp -> ?incomplete(exp, <<>>, Handler, Acc, Stack, Config)
    end;
%% illegal terminator: the offending input is reported with the error rather
%% than an empty binary
finish_number(Bin, Handler, {NumType, Acc}, Stack, Config) ->
    case NumType of
        zero -> ?error(zero, Bin, Handler, Acc, Stack, Config);
        integer -> ?error(integer, Bin, Handler, Acc, Stack, Config);
        decimal -> ?error(decimal, Bin, Handler, Acc, Stack, Config);
        exp -> ?error(exp, Bin, Handler, Acc, Stack, Config)
    end.
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2013-03-02 14:50:40 -08:00
|
|
|
%% format_number/1 converts the reversed character accumulator of a finished
%% number into the event emitted to the handler: `{integer, Int}' for numbers
%% tagged `zero' or `integer', `{float, Float}' for numbers tagged `decimal' or
%% `exp'
format_number({NumType, Reversed}) when NumType =:= zero; NumType =:= integer ->
    Digits = lists:reverse(Reversed),
    {integer, list_to_integer(Digits)};
format_number({NumType, Reversed}) when NumType =:= decimal; NumType =:= exp ->
    Digits = lists:reverse(Reversed),
    {float, list_to_float(Digits)}.
|
2011-08-31 18:52:01 -07:00
|
|
|
|
|
|
|
|
2013-02-25 21:38:07 -08:00
|
|
|
%% true/4 matches the remainder of the literal `true' (the caller passes the
%% input following the leading `t', as the patterns below show). a full match
%% emits `{literal, true}' and continues with maybe_done/4; a proper prefix
%% at the end of the input is incomplete; anything else is an error
true(<<"rue", Rest/binary>>, Handler, Stack, Config) ->
    maybe_done(Rest, handle_event({literal, true}, Handler, Config), Stack, Config);
true(<<"ru">>, Handler, Stack, Config) ->
    ?incomplete(true, <<"ru">>, Handler, Stack, Config);
true(<<"r">>, Handler, Stack, Config) ->
    ?incomplete(true, <<"r">>, Handler, Stack, Config);
true(<<>>, Handler, Stack, Config) ->
    ?incomplete(true, <<>>, Handler, Stack, Config);
true(Other, Handler, Stack, Config) ->
    ?error(true, Other, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
2013-02-25 21:38:07 -08:00
|
|
|
%% false/4 matches the remainder of the literal `false' (the caller passes the
%% input following the leading `f', as the patterns below show). a full match
%% emits `{literal, false}' and continues with maybe_done/4; a proper prefix
%% at the end of the input is incomplete; anything else is an error
false(<<"alse", Rest/binary>>, Handler, Stack, Config) ->
    maybe_done(Rest, handle_event({literal, false}, Handler, Config), Stack, Config);
false(<<"als">>, Handler, Stack, Config) ->
    ?incomplete(false, <<"als">>, Handler, Stack, Config);
false(<<"al">>, Handler, Stack, Config) ->
    ?incomplete(false, <<"al">>, Handler, Stack, Config);
false(<<"a">>, Handler, Stack, Config) ->
    ?incomplete(false, <<"a">>, Handler, Stack, Config);
false(<<>>, Handler, Stack, Config) ->
    ?incomplete(false, <<>>, Handler, Stack, Config);
false(Other, Handler, Stack, Config) ->
    ?error(false, Other, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
2013-02-25 21:38:07 -08:00
|
|
|
%% null/4 matches the remainder of the literal `null' (the caller passes the
%% input following the leading `n', as the patterns below show). a full match
%% emits `{literal, null}' and continues with maybe_done/4; a proper prefix
%% at the end of the input is incomplete; anything else is an error
null(<<"ull", Rest/binary>>, Handler, Stack, Config) ->
    maybe_done(Rest, handle_event({literal, null}, Handler, Config), Stack, Config);
null(<<"ul">>, Handler, Stack, Config) ->
    ?incomplete(null, <<"ul">>, Handler, Stack, Config);
null(<<"u">>, Handler, Stack, Config) ->
    ?incomplete(null, <<"u">>, Handler, Stack, Config);
null(<<>>, Handler, Stack, Config) ->
    ?incomplete(null, <<>>, Handler, Stack, Config);
null(Other, Handler, Stack, Config) ->
    ?error(null, Other, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
2013-02-26 18:31:44 -08:00
|
|
|
%% comment/5 is a bridge that exists only until comments are cleaned up
%% properly: it pushes the state to resume in onto the stack and delegates to
%% comment/4
comment(Bin, Handler, Resume, Stack, Config) ->
    Resumable = [Resume|Stack],
    comment(Bin, Handler, Resumable, Config).
|
|
|
|
|
2013-02-12 11:54:42 -08:00
|
|
|
%% comment/4 looks at the character following a solidus and decides which
%% kind of comment has been opened. the top of the stack is the state to
%% resume in when the comment ends; `comment' on top means the solidus was met
%% inside a /**/ comment
comment(<<?solidus, Tail/binary>>, Handler, Stack, Config) ->
    single_comment(Tail, Handler, Stack, Config);
comment(<<?star, Tail/binary>>, Handler, Stack, Config) ->
    multi_comment(Tail, Handler, Stack, Config);
%% nested /**/ comments: the solidus did not open anything, so drop the
%% `comment' marker and carry on inside the enclosing comment
comment(<<_/utf8, Tail/binary>>, Handler, [comment|Stack], Config) ->
    multi_comment(Tail, Handler, Stack, Config);
%% same as above for a byte that is not valid utf8, only with replaced_bad_utf8
comment(<<_, Tail/binary>>, Handler, [comment|Stack], Config=#config{replaced_bad_utf8=true}) ->
    multi_comment(Tail, Handler, Stack, Config);
comment(<<>>, Handler, [Resume|Stack], Config) ->
    ?incomplete(comment, <<>>, Handler, Resume, Stack, Config);
comment(Other, Handler, Stack, Config) ->
    ?error(comment, Other, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% single_comment/4 skips the body of a // comment. a newline ends the comment
%% and hands over to end_comment/4. bytes that are not valid utf8 are only
%% skipped with replaced_bad_utf8; otherwise they end up in the error clause
single_comment(<<?newline, Tail/binary>>, Handler, Stack, Config) ->
    end_comment(Tail, Handler, Stack, Config);
single_comment(<<_/utf8, Tail/binary>>, Handler, Stack, Config) ->
    single_comment(Tail, Handler, Stack, Config);
single_comment(<<_, Tail/binary>>, Handler, Stack, Config=#config{replaced_bad_utf8=true}) ->
    single_comment(Tail, Handler, Stack, Config);
%% a trailing // comment after the document, without explicit_end: the end of
%% the input also ends the comment
single_comment(<<>>, Handler, [done] = Stack, Config=#config{explicit_end=false}) ->
    end_comment(<<>>, Handler, Stack, Config);
%% otherwise wait for more input; the solidus put back on the stream makes
%% comment/4 dispatch to this state again
single_comment(<<>>, Handler, [Resume|Stack], Config) ->
    ?incomplete(comment, <<?solidus>>, Handler, Resume, Stack, Config);
single_comment(Other, Handler, Stack, Config) ->
    ?error(comment, <<?solidus, Other/binary>>, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% multi_comment/4 skips the body of a /**/ comment. a star may start the
%% closing sequence (end_multi_comment/4); a solidus may open a nested comment,
%% in which case `comment' is pushed so that the nested comment returns here.
%% bytes that are not valid utf8 are only skipped with replaced_bad_utf8
multi_comment(<<?star, Tail/binary>>, Handler, Stack, Config) ->
    end_multi_comment(Tail, Handler, Stack, Config);
multi_comment(<<?solidus, Tail/binary>>, Handler, Stack, Config) ->
    comment(Tail, Handler, [comment|Stack], Config);
multi_comment(<<_/utf8, Tail/binary>>, Handler, Stack, Config) ->
    multi_comment(Tail, Handler, Stack, Config);
multi_comment(<<_, Tail/binary>>, Handler, Stack, Config=#config{replaced_bad_utf8=true}) ->
    multi_comment(Tail, Handler, Stack, Config);
%% wait for more input; the star put back on the stream makes comment/4
%% dispatch to this state again
multi_comment(<<>>, Handler, [Resume|Stack], Config) ->
    ?incomplete(comment, <<?star>>, Handler, Resume, Stack, Config);
multi_comment(Other, Handler, Stack, Config) ->
    ?error(comment, <<?star, Other/binary>>, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% end_multi_comment/4 is entered from multi_comment/4 after a star has been
%% consumed inside a /**/ comment. a solidus completes the closing sequence and
%% hands over to end_comment/4; any other character means the star was part of
%% the comment body and skipping continues in multi_comment/4
end_multi_comment(<<?solidus, Rest/binary>>, Handler, Stack, Config) ->
    end_comment(Rest, Handler, Stack, Config);
%% another star may itself be the start of the closing sequence (as in `**/'),
%% so stay in this state instead of treating it as ordinary comment text
end_multi_comment(<<?star, Rest/binary>>, Handler, Stack, Config) ->
    end_multi_comment(Rest, Handler, Stack, Config);
end_multi_comment(<<_S/utf8, Rest/binary>>, Handler, Stack, Config) ->
    multi_comment(Rest, Handler, Stack, Config);
%% bytes that are not valid utf8 are skipped with replaced_bad_utf8, matching
%% what the other comment states do
end_multi_comment(<<_, Rest/binary>>, Handler, Stack, Config=#config{replaced_bad_utf8=true}) ->
    multi_comment(Rest, Handler, Stack, Config);
%% wait for more input; the two stars put back on the stream lead comment/4 and
%% multi_comment/4 back into this state
end_multi_comment(<<>>, Handler, [Resume|Stack], Config) ->
    ?incomplete(comment, <<?star, ?star>>, Handler, Resume, Stack, Config);
end_multi_comment(Bin, Handler, Stack, Config) ->
    ?error(comment, <<?star, ?star, Bin/binary>>, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% end_comment/4 is called when a comment has been closed. it pops the state
%% that was pushed when the comment was opened and continues parsing there;
%% `comment' means the comment was nested inside a /**/ comment, so skipping
%% continues in multi_comment/4
end_comment(Rest, Handler, [Resume|Stack], Config) ->
    case Resume of
        value -> value(Rest, Handler, Stack, Config);
        object -> object(Rest, Handler, Stack, Config);
        array -> array(Rest, Handler, Stack, Config);
        colon -> colon(Rest, Handler, Stack, Config);
        key -> key(Rest, Handler, Stack, Config);
        maybe_done -> maybe_done(Rest, Handler, Stack, Config);
        done -> done(Rest, Handler, Stack, Config);
        comment -> multi_comment(Rest, Handler, Stack, Config)
    end.
|
|
|
|
|
|
|
|
|
2013-02-12 11:54:42 -08:00
|
|
|
%% maybe_done/4: a complete value has just been parsed. with an empty stack the
%% document is finished; inside a container the next token must be a separator,
%% the matching closing token, whitespace or (if enabled) a comment
maybe_done(Rest, Handler, [], Config) ->
    %% top level value complete: emit end_json and switch to the done state
    done(Rest, handle_event(end_json, Handler, Config), [], Config);
maybe_done(<<?end_object, Rest/binary>>, Handler, [object|Stack], Config) ->
    maybe_done(Rest, handle_event(end_object, Handler, Config), Stack, Config);
maybe_done(<<?end_array, Rest/binary>>, Handler, [array|Stack], Config) ->
    maybe_done(Rest, handle_event(end_array, Handler, Config), Stack, Config);
maybe_done(<<?comma, Rest/binary>>, Handler, [object|Stack], Config) ->
    %% another member follows: the `object` marker is swapped for `key`
    key(Rest, Handler, [key|Stack], Config);
maybe_done(<<?comma, Rest/binary>>, Handler, [array|_] = Stack, Config) ->
    value(Rest, Handler, Stack, Config);
maybe_done(<<S, Rest/binary>>, Handler, Stack, Config) when ?is_whitespace(S) ->
    maybe_done(Rest, Handler, Stack, Config);
maybe_done(<<?solidus, Rest/binary>>, Handler, Stack, Config=#config{comments=true}) ->
    %% remember this state so end_comment/4 can return here
    comment(Rest, Handler, [maybe_done|Stack], Config);
%% out of input while still inside a container. matching on the cons cell is
%% constant time, unlike a `length(Stack) > 0` guard which walks the whole list
maybe_done(<<>>, Handler, [_|_] = Stack, Config) ->
    ?incomplete(maybe_done, <<>>, Handler, Stack, Config);
maybe_done(Bin, Handler, Stack, Config) ->
    ?error(maybe_done, Bin, Handler, Stack, Config).
|
2013-02-12 11:54:42 -08:00
|
|
|
|
|
|
|
|
|
|
|
%% done/4: the top level value is complete. only whitespace and (if enabled)
%% comments may follow; anything else is an error
done(<<Space, Tail/binary>>, Handler, [], Config) when ?is_whitespace(Space) ->
    done(Tail, Handler, [], Config);
done(<<?solidus, Tail/binary>>, Handler, [], Config=#config{comments=true}) ->
    comment(Tail, Handler, [done], Config);
%% with explicit_end set, running out of input is not the end of the stream:
%% return a continuation that takes more input or the atom `end_stream`
done(<<>>, {_Callback, State} = Handler, [], Config = #config{explicit_end=true}) ->
    Continue = fun
        (More) when is_binary(More) -> done(More, Handler, [], Config);
        (end_stream) -> State
    end,
    {incomplete, Continue};
%% otherwise end of input finishes decoding and the handler state is the result
done(<<>>, {_Callback, State}, [], _Config) ->
    State;
done(Bin, Handler, Stack, Config) ->
    ?error(done, Bin, Handler, Stack, Config).
|
2011-10-21 18:16:16 -07:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-ifdef(TEST).
|
|
|
|
-include_lib("eunit/include/eunit.hrl").
|
|
|
|
|
|
|
|
|
2013-02-25 20:23:31 -08:00
|
|
|
%% split a binary into a list of one byte binaries, in order, preceded by a
%% single empty binary
json_to_bytes(JSON) -> json_to_bytes(JSON, []).

%% the accumulator holds the bytes seen so far in reverse order
json_to_bytes(<<Byte, Tail/binary>>, Chunks) ->
    json_to_bytes(Tail, [<<Byte>> | Chunks]);
json_to_bytes(<<>>, Chunks) ->
    [<<>> | lists:reverse(Chunks)].
|
|
|
|
|
|
|
|
|
2013-02-24 01:32:17 -08:00
|
|
|
%% test helper: decode `JSON` twice -- once as a single chunk and once one byte
%% at a time through the incremental interface (explicit_end) -- assert that
%% both runs agree and return the result. a badarg error raised by either run
%% is reported as {error, badarg}
decode(JSON, Config) ->
    Chunk = try
        start(JSON, {jsx, []}, [], jsx_utils:parse_config(Config))
    catch
        error:badarg -> {error, badarg}
    end,
    %% feed one byte to the current continuation, which must ask for more input
    Step = fun(Byte, Decoder) ->
        {incomplete, Next} = Decoder(Byte),
        Next
    end,
    Incremental = try
        Last = lists:foldl(
            Step,
            decoder(jsx, [], [explicit_end | Config]),
            json_to_bytes(JSON)
        ),
        Last(end_stream)
    catch
        error:badarg -> {error, badarg}
    end,
    ?assert(Chunk == Incremental),
    Chunk.
|
2013-02-24 00:54:16 -08:00
|
|
|
|
|
|
|
|
2013-02-20 23:57:06 -08:00
|
|
|
%% one test per entry returned by jsx:test_cases/0: decoding the JSON must
%% yield the listed events followed by end_json
decode_test_() ->
    [
        {Title, ?_assertEqual(Events ++ [end_json], decode(JSON, []))}
        || {Title, JSON, _Term, Events} <- jsx:test_cases()
    ].
|
|
|
|
|
|
|
|
|
2013-02-13 21:54:09 -08:00
|
|
|
%% numbers whose erlang representation differs from their javascript one, so
%% they do not roundtrip the way most integers/floats do, plus numbers that are
%% terminated by whitespace or a comma
special_number_test_() ->
    %% {title, expected events, json input}
    Cases = [
        {"-0", [{integer, 0}, end_json], <<"-0">>},
        {"-0.0", [{float, 0.0}, end_json], <<"-0.0">>},
        {"0e0", [{float, 0.0}, end_json], <<"0e0">>},
        {"0e4", [{float, 0.0}, end_json], <<"0e4">>},
        {"1e0", [{float, 1.0}, end_json], <<"1e0">>},
        {"-1e0", [{float, -1.0}, end_json], <<"-1e0">>},
        {"1e4", [{float, 1.0e4}, end_json], <<"1e4">>},
        {"number terminated by whitespace",
            [start_array, {integer, 1}, end_array, end_json],
            <<"[ 1 ]">>},
        {"number terminated by comma",
            [start_array, {integer, 1}, {integer, 1}, end_array, end_json],
            <<"[ 1, 1 ]">>},
        {"number terminated by comma in object",
            [start_object, {key, <<"x">>}, {integer, 1}, {key, <<"y">>}, {integer, 1}, end_object, end_json],
            <<"{\"x\": 1, \"y\": 1}">>}
    ],
    [{Title, ?_assertEqual(Events, decode(JSON, []))} || {Title, Events, JSON} <- Cases].
|
|
|
|
|
|
|
|
|
2012-03-19 14:34:07 -07:00
|
|
|
%% comments in every position the decoder accepts them. each case decodes the
%% input with the `comments` option (the last three also with
%% `replaced_bad_utf8`) and expects the comment to leave no trace in the events
comments_test_() ->
    %% expected event streams shared by several cases
    EmptyArray = [start_array, end_array, end_json],
    True = [start_array, {literal, true}, end_array, end_json],
    TrueFalse = [start_array, {literal, true}, {literal, false}, end_array, end_json],
    EmptyObject = [start_object, end_object, end_json],
    KeyTrue = [start_object, {key, <<"key">>}, {literal, true}, end_object, end_json],
    XY = [
        start_object,
        {key, <<"x">>},
        {literal, true},
        {key, <<"y">>},
        {literal, false},
        end_object,
        end_json
    ],
    Zero = [start_array, {integer, 0}, end_array, end_json],
    One = [start_array, {integer, 1}, end_array, end_json],
    Float = [start_array, {float, 1.0}, end_array, end_json],
    Exp = [start_array, {float, 1.0e1}, end_array, end_json],
    %% {title, expected events, json input}, decoded with [comments]
    Plain = [
        {"preceeding // comment", EmptyArray, <<"// comment ", ?newline, "[]">>},
        {"preceeding /**/ comment", EmptyArray, <<"/* comment */[]">>},
        {"trailing // comment", EmptyArray, <<"[]// comment", ?newline>>},
        {"trailing // comment (no newline)", EmptyArray, <<"[]// comment">>},
        {"trailing /**/ comment", EmptyArray, <<"[] /* comment */">>},
        {"// comment inside array", EmptyArray, <<"[ // comment", ?newline, "]">>},
        {"/**/ comment inside array", EmptyArray, <<"[ /* comment */ ]">>},
        {"// comment at beginning of array", True,
            <<"[ // comment", ?newline, "true", ?newline, "]">>},
        {"/**/ comment at beginning of array", True, <<"[ /* comment */ true ]">>},
        {"// comment at end of array", True, <<"[ true // comment", ?newline, "]">>},
        {"/**/ comment at end of array", True, <<"[ true /* comment */ ]">>},
        {"// comment midarray (post comma)", TrueFalse,
            <<"[ true, // comment", ?newline, "false ]">>},
        {"/**/ comment midarray (post comma)", TrueFalse, <<"[ true, /* comment */ false ]">>},
        {"// comment midarray (pre comma)", TrueFalse,
            <<"[ true// comment", ?newline, ", false ]">>},
        {"/**/ comment midarray (pre comma)", TrueFalse, <<"[ true/* comment */, false ]">>},
        {"// comment inside object", EmptyObject, <<"{ // comment", ?newline, "}">>},
        {"/**/ comment inside object", EmptyObject, <<"{ /* comment */ }">>},
        {"// comment at beginning of object", KeyTrue,
            <<"{ // comment", ?newline, " \"key\": true", ?newline, "}">>},
        {"/**/ comment at beginning of object", KeyTrue, <<"{ /* comment */ \"key\": true }">>},
        {"// comment at end of object", KeyTrue,
            <<"{ \"key\": true // comment", ?newline, "}">>},
        {"/**/ comment at end of object", KeyTrue, <<"{ \"key\": true /* comment */ }">>},
        {"// comment midobject (post comma)", XY,
            <<"{ \"x\": true, // comment", ?newline, "\"y\": false }">>},
        {"/**/ comment midobject (post comma)", XY,
            <<"{ \"x\": true, /* comment */", ?newline, "\"y\": false }">>},
        {"// comment midobject (pre comma)", XY,
            <<"{ \"x\": true// comment", ?newline, ", \"y\": false }">>},
        {"/**/ comment midobject (pre comma)", XY,
            <<"{ \"x\": true/* comment */", ?newline, ", \"y\": false }">>},
        {"// comment precolon", KeyTrue, <<"{ \"key\" // comment", ?newline, ": true }">>},
        {"/**/ comment precolon", KeyTrue, <<"{ \"key\"/* comment */: true }">>},
        {"// comment postcolon", KeyTrue, <<"{ \"key\": // comment", ?newline, " true }">>},
        {"/**/ comment postcolon", KeyTrue, <<"{ \"key\":/* comment */ true }">>},
        {"// comment terminating zero", Zero, <<"[ 0// comment", ?newline, "]">>},
        {"// comment terminating integer", One, <<"[ 1// comment", ?newline, "]">>},
        {"// comment terminating float", Float, <<"[ 1.0// comment", ?newline, "]">>},
        {"// comment terminating exp", Exp, <<"[ 1e1// comment", ?newline, "]">>},
        {"/**/ comment terminating zero", Zero, <<"[ 0/* comment */ ]">>},
        {"/**/ comment terminating integer", One, <<"[ 1/* comment */ ]">>},
        {"/**/ comment terminating float", Float, <<"[ 1.0/* comment */ ]">>},
        {"/**/ comment terminating exp", Exp, <<"[ 1e1/* comment */ ]">>},
        {"/**/ comment following /**/ comment", True, <<"[/* comment *//* comment */true]">>},
        {"/**/ comment following // comment", True,
            <<"[// comment", ?newline, "/* comment */true]">>},
        {"// comment following /**/ comment", True,
            <<"[/* comment */// comment", ?newline, "true]">>},
        {"// comment following // comment", True,
            <<"[// comment", ?newline, "// comment", ?newline, "true]">>},
        {"/**/ comment inside /**/ comment", True, <<"[ /* /* comment */ */ true ]">>},
        {"/**/ comment with /", True, <<"[ /* / */ true ]">>},
        {"/**/ comment with *", True, <<"[ /* * */ true ]">>}
    ],
    %% same shape, decoded with [comments, replaced_bad_utf8]
    BadUtf = [
        {"// comment with badutf", True,
            <<"[ // comment ", 16#00c0, " ", ?newline, "true]">>},
        {"/**/ comment with badutf", True, <<"[ /* comment ", 16#00c0, " */ true]">>},
        {"/**/ comment with badutf preceeded by /", True,
            <<"[ /* comment /", 16#00c0, " */ true]">>}
    ],
    [{Title, ?_assertEqual(Events, decode(JSON, [comments]))}
        || {Title, Events, JSON} <- Plain]
    ++ [{Title, ?_assertEqual(Events, decode(JSON, [comments, replaced_bad_utf8]))}
        || {Title, Events, JSON} <- BadUtf].
|
|
|
|
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2013-02-20 23:57:06 -08:00
|
|
|
%% utf8 binary of the codepoints 32 and 33 followed by every codepoint in the
%% inclusive ranges below. the gaps leave out 34, 39, 47, 92, 16#2028-16#2029,
%% 16#d800-16#dfff and 16#fdd0-16#fdef; the last range stops at 16#fffd
codepoints() ->
    Ranges = [
        {35, 38},
        {40, 46},
        {48, 91},
        {93, 16#2027},
        {16#202a, 16#d7ff},
        {16#e000, 16#fdcf},
        {16#fdf0, 16#fffd}
    ],
    Points = [32, 33] ++ lists:append([lists:seq(From, To) || {From, To} <- Ranges]),
    unicode:characters_to_binary(Points).
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2013-02-20 23:57:06 -08:00
|
|
|
%% utf8 binary of every codepoint from 16#10000 to 16#1fffd followed by the
%% first codepoint of each later plane (16#20000, 16#30000 ... 16#100000)
extended_codepoints() ->
    PlaneOne = lists:seq(16#10000, 16#1fffd),
    PlaneStarts = lists:seq(16#20000, 16#100000, 16#10000),
    unicode:characters_to_binary(PlaneOne ++ PlaneStarts).
|
2011-10-21 18:16:16 -07:00
|
|
|
|
2013-02-21 00:05:12 -08:00
|
|
|
%% hand encoded json strings, one for each codepoint from 16#fdd0 to 16#fdef
reserved_space() ->
    lists:map(fun to_fake_utf8/1, lists:seq(16#fdd0, 16#fdef)).
|
|
|
|
|
|
|
|
%% hand encoded json strings, one for each codepoint from 16#d800 to 16#dfff
surrogates() ->
    lists:map(fun to_fake_utf8/1, lists:seq(16#d800, 16#dfff)).
|
|
|
|
|
|
|
|
%% hand encoded json strings for the codepoints 16#fffe and 16#ffff
noncharacters() ->
    lists:map(fun to_fake_utf8/1, lists:seq(16#fffe, 16#ffff)).
|
|
|
|
|
|
|
|
%% hand encoded json strings for the last two codepoints (16#xfffe, 16#xffff)
%% of each plane from 1 through 16, ie 16#1fffe, 16#1ffff ... 16#10fffe, 16#10ffff
extended_noncharacters() ->
    Points = [
        Plane * 16#10000 + Low
        || Plane <- lists:seq(1, 16), Low <- [16#fffe, 16#ffff]
    ],
    lists:map(fun to_fake_utf8/1, Points).
|
2012-03-28 23:46:18 -07:00
|
|
|
|
2012-03-31 12:30:47 -07:00
|
|
|
%% erlang refuses to decode certain codepoints, so the byte sequences are
%% assembled by hand here: the bits of N are laid out in the 1, 2, 3 or 4 byte
%% utf8 pattern for its magnitude and the result is wrapped in double quotes
to_fake_utf8(N) when N < 16#0080 ->
    <<$", N:8, $">>;
to_fake_utf8(N) when N < 16#0800 ->
    %% 11 significant bits: 110xxxxx 10xxxxxx
    <<0:5, High:5, Low:6>> = <<N:16>>,
    <<$", 2#110:3, High:5, 2#10:2, Low:6, $">>;
to_fake_utf8(N) when N < 16#10000 ->
    %% 16 significant bits: 1110xxxx 10xxxxxx 10xxxxxx
    <<High:4, Mid:6, Low:6>> = <<N:16>>,
    <<$", 2#1110:4, High:4, 2#10:2, Mid:6, 2#10:2, Low:6, $">>;
to_fake_utf8(N) ->
    %% 21 significant bits: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
    <<0:3, Top:3, High:6, Mid:6, Low:6>> = <<N:24>>,
    <<$", 2#11110:5, Top:3, 2#10:2, High:6, 2#10:2, Mid:6, 2#10:2, Low:6, $">>.
|
|
|
|
|
|
|
|
|
2013-02-20 23:57:06 -08:00
|
|
|
%% strings made of acceptable codepoints decode unchanged. each hand encoded
%% bad codepoint yields {error, badarg} by default and a string holding only
%% u+fffd when replaced_bad_utf8 is set
clean_string_test_() ->
    [
        {"clean codepoints", ?_assertEqual(
            [{string, codepoints()}, end_json],
            decode(<<34, (codepoints())/binary, 34>>, [])
        )},
        {"clean extended codepoints", ?_assertEqual(
            [{string, extended_codepoints()}, end_json],
            decode(<<34, (extended_codepoints())/binary, 34>>, [])
        )},
        {"error reserved space", ?_assertEqual(
            [{error, badarg} || _ <- reserved_space()],
            [decode(Codepoint, []) || Codepoint <- reserved_space()]
        )},
        {"error surrogates", ?_assertEqual(
            [{error, badarg} || _ <- surrogates()],
            [decode(Codepoint, []) || Codepoint <- surrogates()]
        )},
        {"error noncharacters", ?_assertEqual(
            [{error, badarg} || _ <- noncharacters()],
            [decode(Codepoint, []) || Codepoint <- noncharacters()]
        )},
        {"error extended noncharacters", ?_assertEqual(
            [{error, badarg} || _ <- extended_noncharacters()],
            [decode(Codepoint, []) || Codepoint <- extended_noncharacters()]
        )},
        {"clean reserved space", ?_assertEqual(
            [[{string, <<16#fffd/utf8>>}, end_json] || _ <- reserved_space()],
            [decode(Codepoint, [replaced_bad_utf8]) || Codepoint <- reserved_space()]
        )},
        {"clean surrogates", ?_assertEqual(
            [[{string, <<16#fffd/utf8>>}, end_json] || _ <- surrogates()],
            [decode(Codepoint, [replaced_bad_utf8]) || Codepoint <- surrogates()]
        )},
        {"clean noncharacters", ?_assertEqual(
            [[{string, <<16#fffd/utf8>>}, end_json] || _ <- noncharacters()],
            [decode(Codepoint, [replaced_bad_utf8]) || Codepoint <- noncharacters()]
        )},
        {"clean extended noncharacters", ?_assertEqual(
            [[{string, <<16#fffd/utf8>>}, end_json] || _ <- extended_noncharacters()],
            [decode(Codepoint, [replaced_bad_utf8]) || Codepoint <- extended_noncharacters()]
        )}
    ].
|
|
|
|
|
2013-02-20 23:57:06 -08:00
|
|
|
|
2013-02-26 21:11:31 -08:00
|
|
|
%% test helper: wrap `String` in double quotes and decode it. returns the
%% decoded string, or raises badarg when the decoder reports {error, badarg}
decode_bad_utf(String, Config) ->
    Quoted = <<$", String/binary, $">>,
    case decode(Quoted, Config) of
        [{string, Decoded}, end_json] -> Decoded;
        {error, badarg} -> erlang:error(badarg)
    end.
|
2013-02-24 02:14:47 -08:00
|
|
|
|
|
|
|
%% malformed utf8 inside a json string. every case is checked twice: with the
%% default config decoding must fail with badarg, and with replaced_bad_utf8
%% the string must decode to the listed replacement
bad_utf8_test_() ->
    Replacement = <<16#fffd/utf8>>,
    ReplacementSpace = <<16#fffd/utf8, 32>>,
    ReplacementPair = <<16#fffd/utf8, 32, 16#fffd/utf8>>,
    AllContinuations = lists:seq(16#0080, 16#00bf),
    %% {title, malformed bytes, expected string with replaced_bad_utf8}
    Cases = [
        {"noncharacter u+fffe", <<239, 191, 190>>, Replacement},
        {"noncharacter u+ffff", <<239, 191, 191>>, Replacement},
        {"orphan continuation byte u+0080", <<16#0080>>, Replacement},
        {"orphan continuation byte u+00bf", <<16#00bf>>, Replacement}
    ] ++ [
        %% "2 continuation bytes" through "6 continuation bytes"
        {integer_to_list(Count) ++ " continuation bytes",
            <<(binary:copy(<<16#0080>>, Count))/binary>>,
            binary:copy(<<16#fffd/utf8>>, Count)}
        || Count <- lists:seq(2, 6)
    ] ++ [
        {"all continuation bytes",
            <<(list_to_binary(AllContinuations))/binary>>,
            binary:copy(<<16#fffd/utf8>>, length(AllContinuations))},
        {"lonely start byte", <<16#00c0>>, Replacement},
        {"lonely start bytes (2 byte)", <<16#00c0, 32, 16#00df>>, ReplacementPair},
        {"lonely start bytes (3 byte)", <<16#00e0, 32, 16#00ef>>, ReplacementPair},
        {"lonely start bytes (4 byte)", <<16#00f0, 32, 16#00f7>>, ReplacementPair},
        {"missing continuation byte (3 byte)", <<224, 160, 32>>, ReplacementSpace},
        {"missing continuation byte (4 byte missing one)", <<240, 144, 128, 32>>, ReplacementSpace},
        {"missing continuation byte (4 byte missing two)", <<240, 144, 32>>, ReplacementSpace},
        {"overlong encoding of u+002f (2 byte)", <<16#c0, 16#af, 32>>, ReplacementSpace},
        {"overlong encoding of u+002f (3 byte)", <<16#e0, 16#80, 16#af, 32>>, ReplacementSpace},
        {"overlong encoding of u+002f (4 byte)", <<16#f0, 16#80, 16#80, 16#af, 32>>, ReplacementSpace},
        {"highest overlong 2 byte sequence", <<16#c1, 16#bf, 32>>, ReplacementSpace},
        {"highest overlong 3 byte sequence", <<16#e0, 16#9f, 16#bf, 32>>, ReplacementSpace},
        {"highest overlong 4 byte sequence", <<16#f0, 16#8f, 16#bf, 16#bf, 32>>, ReplacementSpace}
    ],
    %% strict test first, then its " replaced" twin, for each case in order
    lists:append([
        [
            {Title, ?_assertError(badarg, decode_bad_utf(Bytes, []))},
            {Title ++ " replaced", ?_assertEqual(
                Replaced,
                decode_bad_utf(Bytes, [replaced_bad_utf8])
            )}
        ]
        || {Title, Bytes, Replaced} <- Cases
    ]).
|
|
|
|
|
|
|
|
|
2013-02-24 02:28:33 -08:00
|
|
|
%% test helper: wraps `Bin` in double quotes so it forms a json string, runs it
%% through decode/2 with `Config` and returns the payload of the resulting
%% `string` event. an `{error, badarg}` result from decode/2 is re-raised as a
%% `badarg` error so callers can check it with ?_assertError
unescape(Bin, Config) ->
    Quoted = <<$", Bin/binary, $">>,
    case decode(Quoted, Config) of
        {error, badarg} -> erlang:error(badarg);
        [{string, Unescaped}, end_json] -> Unescaped
    end.
|
2013-02-24 02:28:33 -08:00
|
|
|
|
|
|
|
%% escape sequences inside json strings: each case feeds the body of a string
%% to unescape/2 and checks either the decoded binary or the `badarg` error
unescape_test_() ->
    [
        %% single character escapes
        {"unescape backspace",
            ?_assertEqual(<<"\b">>, unescape(<<"\\b"/utf8>>, []))},
        {"unescape tab",
            ?_assertEqual(<<"\t">>, unescape(<<"\\t"/utf8>>, []))},
        {"unescape newline",
            ?_assertEqual(<<"\n">>, unescape(<<"\\n"/utf8>>, []))},
        {"unescape formfeed",
            ?_assertEqual(<<"\f">>, unescape(<<"\\f"/utf8>>, []))},
        {"unescape carriage return",
            ?_assertEqual(<<"\r">>, unescape(<<"\\r"/utf8>>, []))},
        {"unescape quote",
            ?_assertEqual(<<"\"">>, unescape(<<"\\\""/utf8>>, []))},
        {"unescape single quote",
            ?_assertEqual(<<"'">>, unescape(<<"\\'"/utf8>>, [single_quoted_strings]))},
        {"unescape solidus",
            ?_assertEqual(<<"/">>, unescape(<<"\\/"/utf8>>, []))},
        {"unescape reverse solidus",
            ?_assertEqual(<<"\\">>, unescape(<<"\\\\"/utf8>>, []))},

        %% \uXXXX escapes
        {"unescape control",
            ?_assertEqual(<<0>>, unescape(<<"\\u0000"/utf8>>, []))},
        {"unescape surrogate pair",
            ?_assertEqual(<<16#10000/utf8>>, unescape(<<"\\ud800\\udc00"/utf8>>, []))},

        %% bad surrogates: replaced by u+fffd under `replaced_bad_utf8`,
        %% a badarg error otherwise
        {"replace bad high surrogate",
            ?_assertEqual(
                <<16#fffd/utf8>>,
                unescape(<<"\\udc00"/utf8>>, [replaced_bad_utf8]))},
        {"do not unescape bad high surrogate",
            ?_assertError(badarg, unescape(<<"\\udc00"/utf8>>, []))},
        {"replace naked high surrogate",
            ?_assertEqual(
                <<16#fffd/utf8, "hello world">>,
                unescape(<<"\\ud800hello world"/utf8>>, [replaced_bad_utf8]))},
        {"do not unescape naked high surrogate",
            ?_assertError(badarg, unescape(<<"\\ud800hello world"/utf8>>, []))},
        {"replace naked low surrogate",
            ?_assertEqual(
                <<16#fffd/utf8, "hello world">>,
                unescape(<<"\\udc00hello world"/utf8>>, [replaced_bad_utf8]))},
        {"do not unescape naked low surrogate",
            ?_assertError(badarg, unescape(<<"\\udc00hello world"/utf8>>, []))},
        {"replace bad surrogate pair",
            ?_assertEqual(
                <<16#fffd/utf8, 16#fffd/utf8>>,
                unescape(<<"\\ud800\\u0000">>, [replaced_bad_utf8]))},
        {"do not unescape bad surrogate pair",
            ?_assertError(badarg, unescape(<<"\\ud800\\u0000">>, []))},

        %% `g` is not a hex digit
        {"bad pseudo escape sequence",
            ?_assertError(badarg, unescape(<<"\\uabcg">>, []))}
    ].
|
|
|
|
|
|
|
|
|
2013-02-24 01:50:17 -08:00
|
|
|
%% test helper: decodes `Bin` (a complete json string, quotes included) with
%% `Config` and returns the payload of the `string` event. the match is
%% assertive: any other result from decode/2 fails with a badmatch
maybe_escape(Bin, Config) ->
    [{string, Result}, end_json] = decode(Bin, Config),
    Result.
|
|
|
|
|
|
|
|
%% string escaping on output: each case decodes a quoted json string through
%% maybe_escape/2 and checks the binary carried by the `string` event under
%% the given config flags
escape_test_() ->
    [
        %% short escapes
        {"maybe_escape backspace",
            ?_assertEqual(
                <<"\\b">>,
                maybe_escape(<<34, "\\b"/utf8, 34>>, [escaped_strings]))},
        {"don't escape backspace",
            ?_assertEqual(
                <<"\b">>,
                maybe_escape(<<34, "\\b"/utf8, 34>>, []))},
        {"maybe_escape tab",
            ?_assertEqual(
                <<"\\t">>,
                maybe_escape(<<34, "\\t"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape newline",
            ?_assertEqual(
                <<"\\n">>,
                maybe_escape(<<34, "\\n"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape formfeed",
            ?_assertEqual(
                <<"\\f">>,
                maybe_escape(<<34, "\\f"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape carriage return",
            ?_assertEqual(
                <<"\\r">>,
                maybe_escape(<<34, "\\r"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape quote",
            ?_assertEqual(
                <<"\\\"">>,
                maybe_escape(<<34, "\\\""/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape forward slash",
            ?_assertEqual(
                <<"\\/">>,
                maybe_escape(<<34, "/"/utf8, 34>>, [escaped_strings, escaped_forward_slashes]))},
        {"do not maybe_escape forward slash",
            ?_assertEqual(
                <<"/">>,
                maybe_escape(<<34, "/"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape backslash",
            ?_assertEqual(
                <<"\\\\">>,
                maybe_escape(<<34, "\\\\"/utf8, 34>>, [escaped_strings]))},

        %% u+2028 and u+2029, with and without `unescaped_jsonp`
        {"maybe_escape jsonp (u2028)",
            ?_assertEqual(
                <<"\\u2028">>,
                maybe_escape(<<34, 16#2028/utf8, 34>>, [escaped_strings]))},
        {"do not maybe_escape jsonp (u2028)",
            ?_assertEqual(
                <<16#2028/utf8>>,
                maybe_escape(<<34, 16#2028/utf8, 34>>, [escaped_strings, unescaped_jsonp]))},
        {"maybe_escape jsonp (u2029)",
            ?_assertEqual(
                <<"\\u2029">>,
                maybe_escape(<<34, 16#2029/utf8, 34>>, [escaped_strings]))},
        {"do not maybe_escape jsonp (u2029)",
            ?_assertEqual(
                <<16#2029/utf8>>,
                maybe_escape(<<34, 16#2029/utf8, 34>>, [escaped_strings, unescaped_jsonp]))},

        %% control characters written as \u00XX
        {"maybe_escape u0000",
            ?_assertEqual(
                <<"\\u0000">>,
                maybe_escape(<<34, "\\u0000"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0001",
            ?_assertEqual(
                <<"\\u0001">>,
                maybe_escape(<<34, "\\u0001"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0002",
            ?_assertEqual(
                <<"\\u0002">>,
                maybe_escape(<<34, "\\u0002"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0003",
            ?_assertEqual(
                <<"\\u0003">>,
                maybe_escape(<<34, "\\u0003"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0004",
            ?_assertEqual(
                <<"\\u0004">>,
                maybe_escape(<<34, "\\u0004"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0005",
            ?_assertEqual(
                <<"\\u0005">>,
                maybe_escape(<<34, "\\u0005"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0006",
            ?_assertEqual(
                <<"\\u0006">>,
                maybe_escape(<<34, "\\u0006"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0007",
            ?_assertEqual(
                <<"\\u0007">>,
                maybe_escape(<<34, "\\u0007"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u000b",
            ?_assertEqual(
                <<"\\u000b">>,
                maybe_escape(<<34, "\\u000b"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u000e",
            ?_assertEqual(
                <<"\\u000e">>,
                maybe_escape(<<34, "\\u000e"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u000f",
            ?_assertEqual(
                <<"\\u000f">>,
                maybe_escape(<<34, "\\u000f"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0010",
            ?_assertEqual(
                <<"\\u0010">>,
                maybe_escape(<<34, "\\u0010"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0011",
            ?_assertEqual(
                <<"\\u0011">>,
                maybe_escape(<<34, "\\u0011"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0012",
            ?_assertEqual(
                <<"\\u0012">>,
                maybe_escape(<<34, "\\u0012"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0013",
            ?_assertEqual(
                <<"\\u0013">>,
                maybe_escape(<<34, "\\u0013"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0014",
            ?_assertEqual(
                <<"\\u0014">>,
                maybe_escape(<<34, "\\u0014"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0015",
            ?_assertEqual(
                <<"\\u0015">>,
                maybe_escape(<<34, "\\u0015"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0016",
            ?_assertEqual(
                <<"\\u0016">>,
                maybe_escape(<<34, "\\u0016"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0017",
            ?_assertEqual(
                <<"\\u0017">>,
                maybe_escape(<<34, "\\u0017"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0018",
            ?_assertEqual(
                <<"\\u0018">>,
                maybe_escape(<<34, "\\u0018"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u0019",
            ?_assertEqual(
                <<"\\u0019">>,
                maybe_escape(<<34, "\\u0019"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u001a",
            ?_assertEqual(
                <<"\\u001a">>,
                maybe_escape(<<34, "\\u001a"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u001b",
            ?_assertEqual(
                <<"\\u001b">>,
                maybe_escape(<<34, "\\u001b"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u001c",
            ?_assertEqual(
                <<"\\u001c">>,
                maybe_escape(<<34, "\\u001c"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u001d",
            ?_assertEqual(
                <<"\\u001d">>,
                maybe_escape(<<34, "\\u001d"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u001e",
            ?_assertEqual(
                <<"\\u001e">>,
                maybe_escape(<<34, "\\u001e"/utf8, 34>>, [escaped_strings]))},
        {"maybe_escape u001f",
            ?_assertEqual(
                <<"\\u001f">>,
                maybe_escape(<<34, "\\u001f"/utf8, 34>>, [escaped_strings]))}
    ].
|
|
|
|
|
|
|
|
|
2013-02-21 00:05:12 -08:00
|
|
|
%% strings and keys delimited by single quotes (byte 39), decoded with the
%% `single_quoted_strings` flag, plus a plain double quoted string that merely
%% contains single quotes
single_quoted_string_test_() ->
    RavenSingle = [{string, <<"quoth the raven, 'nevermore'">>}, end_json],
    ObjectEvents = [
        start_object,
        {key, <<"key">>}, {string, <<"value">>},
        {key, <<"another key">>}, {string, <<"another value">>},
        end_object,
        end_json
    ],
    [
        {"single quoted string",
            ?_assertEqual(
                [{string, <<"hello world">>}, end_json],
                decode(<<39, "hello world", 39>>, [single_quoted_strings]))},
        {"single quoted string with embedded double quotes",
            ?_assertEqual(
                [{string, <<"quoth the raven, \"nevermore\"">>}, end_json],
                decode(<<39, "quoth the raven, \"nevermore\"", 39>>, [single_quoted_strings]))},
        {"string with embedded single quotes",
            ?_assertEqual(
                RavenSingle,
                decode(<<34, "quoth the raven, 'nevermore'", 34>>, []))},
        {"escaped single quote",
            ?_assertEqual(
                RavenSingle,
                decode(<<39, "quoth the raven, \\'nevermore\\'", 39>>, [single_quoted_strings]))},
        {"single quoted key",
            ?_assertEqual(
                ObjectEvents,
                decode(
                    <<"{'key':'value','another key':'another value'}">>,
                    [single_quoted_strings]))}
    ].
|
|
|
|
|
|
|
|
|
2013-02-24 01:59:54 -08:00
|
|
|
%% with `ignored_bad_escapes` an escape sequence the decoder does not
%% recognize (here `\x25`) is expected to come through unchanged
ignored_bad_escapes_test_() ->
    Json = <<"\"\\x25\"">>,
    [
        {"ignore unrecognized escape sequence",
            ?_assertEqual(
                [{string, <<"\\x25">>}, end_json],
                decode(Json, [ignored_bad_escapes]))}
    ].
|
|
|
|
|
|
|
|
|
2013-02-24 20:10:48 -08:00
|
|
|
%% input that starts with the bytes ef bb bf (the utf8 byte order mark) is
%% expected to decode to just the events of the json that follows
bom_test_() ->
    WithBom = <<16#ef, 16#bb, 16#bf, "[]"/utf8>>,
    [
        {"bom",
            ?_assertEqual(
                [start_array, end_array, end_json],
                decode(WithBom, []))}
    ].
|
|
|
|
|
|
|
|
|
2013-02-24 01:59:54 -08:00
|
|
|
|
2011-10-21 18:16:16 -07:00
|
|
|
-endif.
|