integrate dmitry kolesnikov's changes to json_encode
This commit is contained in:
parent
29d5c28196
commit
821a8ac06e
4 changed files with 67 additions and 289 deletions
14
Makefile
14
Makefile
|
@ -1,14 +0,0 @@
|
||||||
|
|
||||||
all:
|
|
||||||
test -d ebin || mkdir ebin
|
|
||||||
erlc -b beam -o ebin src/*.erl
|
|
||||||
cp src/jsx.app.src ebin/jsx.app
|
|
||||||
|
|
||||||
clean:
|
|
||||||
rm -Rf ebin
|
|
||||||
|
|
||||||
test:
|
|
||||||
erlc -b beam -o ebin priv/b/*.erl
|
|
||||||
|
|
||||||
run:
|
|
||||||
erl -pa ./ebin -pa ./*/ebin
|
|
Binary file not shown.
175
priv/b/jsx_b.erl
175
priv/b/jsx_b.erl
|
@ -1,175 +0,0 @@
|
||||||
%% The MIT License
|
|
||||||
|
|
||||||
%% Copyright (c) 2012 Dmitry Kolesnikov <fogfish@ovi.com>
|
|
||||||
|
|
||||||
%% Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
||||||
%% of this software and associated documentation files (the "Software"), to deal
|
|
||||||
%% in the Software without restriction, including without limitation the rights
|
|
||||||
%% to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
||||||
%% copies of the Software, and to permit persons to whom the Software is
|
|
||||||
%% furnished to do so, subject to the following conditions:
|
|
||||||
|
|
||||||
%% The above copyright notice and this permission notice shall be included in
|
|
||||||
%% all copies or substantial portions of the Software.
|
|
||||||
|
|
||||||
%% THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
||||||
%% IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
||||||
%% FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
||||||
%% AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
||||||
%% LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
||||||
%% OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
||||||
%% THE SOFTWARE.
|
|
||||||
-module(jsx_b).
|
|
||||||
|
|
||||||
-export([run/2, hot/0]).
|
|
||||||
|
|
||||||
-define(LEN_KEY, 32). %% upper bound of object attribute
|
|
||||||
-define(LEN_STR, 256). %% upper bound of string value
|
|
||||||
-define(LEN_INT, 7). %% upper bound of digits
|
|
||||||
-define(JSON, 20). %% number of attributes
|
|
||||||
-define(ALPHA,"qwertyuiopasdfghjklzxcvbnm").
|
|
||||||
-define(TEXT,"qwertyuiopasdfghjklzxcvbnmQWERTYUIOPASDFGHJKLZXCVBNM1234567890\"\\\b\f\n\r\t").
|
|
||||||
-define(DIGIT,"123456789").
|
|
||||||
|
|
||||||
|
|
||||||
run(Set, Loop) ->
|
|
||||||
Json = lists:map(fun(_) -> gen_json(?JSON) end, lists:seq(1, Set)),
|
|
||||||
Term = lists:map(fun(_) -> gen_term(?JSON) end, lists:seq(1, Set)),
|
|
||||||
[
|
|
||||||
{
|
|
||||||
b_jsx_json(Json, Loop)%,
|
|
||||||
%b_mochi_json(Json, Loop)
|
|
||||||
},
|
|
||||||
{
|
|
||||||
b_jsx_term(Term, Loop)%,
|
|
||||||
%b_mochi_term(Term, Loop)
|
|
||||||
}
|
|
||||||
].
|
|
||||||
|
|
||||||
hot() ->
|
|
||||||
b_jsx_term([gen_term(?JSON)], 100).
|
|
||||||
|
|
||||||
|
|
||||||
b_jsx_json(Set, Loop) ->
|
|
||||||
{T, _} = timer:tc(
|
|
||||||
fun() ->
|
|
||||||
lists:foreach(
|
|
||||||
fun(_) ->
|
|
||||||
lists:map(fun(X) -> jsx:to_term(X) end, Set)
|
|
||||||
end,
|
|
||||||
lists:seq(1, Loop)
|
|
||||||
)
|
|
||||||
end,
|
|
||||||
[]
|
|
||||||
),
|
|
||||||
{jsx, to_term, T / 1000, T / (Loop * length(Set) * 1000)}.
|
|
||||||
|
|
||||||
b_jsx_term(Set, Loop) ->
|
|
||||||
erlang:garbage_collect(),
|
|
||||||
{T, _} = timer:tc(
|
|
||||||
fun() ->
|
|
||||||
lists:foreach(
|
|
||||||
fun(_) ->
|
|
||||||
%error_logger:info_report([{mem_jsx, erlang:memory(processes)}]),
|
|
||||||
lists:map(fun(X) -> jsx:to_json(X) end, Set)
|
|
||||||
end,
|
|
||||||
lists:seq(1, Loop)
|
|
||||||
)
|
|
||||||
end,
|
|
||||||
[]
|
|
||||||
),
|
|
||||||
{jsx, to_json, T / 1000, T / (Loop * length(Set) * 1000)}.
|
|
||||||
|
|
||||||
|
|
||||||
b_mochi_json(Set, Loop) ->
|
|
||||||
{T, _} = timer:tc(
|
|
||||||
fun() ->
|
|
||||||
lists:foreach(
|
|
||||||
fun(_) ->
|
|
||||||
lists:map(fun(X) -> mochijson2:decode(X) end, Set)
|
|
||||||
end,
|
|
||||||
lists:seq(1, Loop)
|
|
||||||
)
|
|
||||||
end,
|
|
||||||
[]
|
|
||||||
),
|
|
||||||
{mochi, to_term, T / 1000, T / (Loop * length(Set) * 1000)}.
|
|
||||||
|
|
||||||
b_mochi_term(Set, Loop) ->
|
|
||||||
erlang:garbage_collect(),
|
|
||||||
{T, _} = timer:tc(
|
|
||||||
fun() ->
|
|
||||||
lists:foreach(
|
|
||||||
fun(_) ->
|
|
||||||
%error_logger:info_report([{mem_mochi, erlang:memory(processes)}]),
|
|
||||||
lists:map(fun(X) -> mochijson2:encode({struct, X})end, Set)
|
|
||||||
end,
|
|
||||||
lists:seq(1, Loop)
|
|
||||||
)
|
|
||||||
end,
|
|
||||||
[]
|
|
||||||
),
|
|
||||||
{mochi, to_json, T / 1000, T / (Loop * length(Set) * 1000)}.
|
|
||||||
|
|
||||||
|
|
||||||
%%
|
|
||||||
%% generates a json object
|
|
||||||
gen_json(Len) ->
|
|
||||||
list_to_binary(
|
|
||||||
io_lib:format("{~s}", [
|
|
||||||
string:join(
|
|
||||||
lists:map(
|
|
||||||
fun(_) ->
|
|
||||||
case random:uniform(2) of
|
|
||||||
1 ->
|
|
||||||
io_lib:format("\"~s\":\"~s\"",
|
|
||||||
[rstring(?LEN_KEY, ?ALPHA), rstring(?LEN_STR, ?ALPHA)]
|
|
||||||
);
|
|
||||||
2 ->
|
|
||||||
io_lib:format("\"~s\":~s",
|
|
||||||
[rstring(?LEN_KEY, ?ALPHA), rstring(?LEN_INT, ?DIGIT)]
|
|
||||||
)
|
|
||||||
end
|
|
||||||
end,
|
|
||||||
lists:seq(1,Len)
|
|
||||||
),
|
|
||||||
","
|
|
||||||
)
|
|
||||||
])
|
|
||||||
).
|
|
||||||
|
|
||||||
gen_term(Len) ->
|
|
||||||
lists:map(
|
|
||||||
fun(_) ->
|
|
||||||
case random:uniform(2) of
|
|
||||||
1 -> {
|
|
||||||
list_to_binary(rstring(?LEN_KEY, ?ALPHA)),
|
|
||||||
list_to_binary(rstring(?LEN_STR, ?ALPHA))
|
|
||||||
};
|
|
||||||
2 -> {
|
|
||||||
list_to_binary(rstring(?LEN_KEY, ?ALPHA)),
|
|
||||||
list_to_integer(rstring(?LEN_INT, ?DIGIT))
|
|
||||||
}
|
|
||||||
end
|
|
||||||
end,
|
|
||||||
lists:seq(1,Len)
|
|
||||||
).
|
|
||||||
|
|
||||||
%%
|
|
||||||
%%
|
|
||||||
rstring(Length, Alphabet) ->
|
|
||||||
ustring(random:uniform(Length), Alphabet).
|
|
||||||
|
|
||||||
%%
|
|
||||||
%% from http://blog.teemu.im/2009/11/07/generating-random-strings-in-erlang/
|
|
||||||
ustring(Length, AllowedChars) ->
|
|
||||||
lists:foldl(
|
|
||||||
fun(_, Acc) ->
|
|
||||||
[lists:nth(
|
|
||||||
random:uniform(length(AllowedChars)),
|
|
||||||
AllowedChars
|
|
||||||
)] ++ Acc
|
|
||||||
end,
|
|
||||||
[],
|
|
||||||
lists:seq(1, Length)
|
|
||||||
).
|
|
|
@ -29,15 +29,6 @@
|
||||||
|
|
||||||
-include("jsx_opts.hrl").
|
-include("jsx_opts.hrl").
|
||||||
|
|
||||||
-define(ESC(C),
|
|
||||||
<<H:L/binary, C, T/binary>> ->
|
|
||||||
B = unicode:characters_to_binary(json_escape_sequence(C)),
|
|
||||||
json_escape2(
|
|
||||||
<<H/binary, B/binary, T/binary>>,
|
|
||||||
Opts, L + size(B), Len + size(B) - 1
|
|
||||||
);
|
|
||||||
).
|
|
||||||
|
|
||||||
|
|
||||||
%% parsing of jsx opts
|
%% parsing of jsx opts
|
||||||
|
|
||||||
|
@ -94,96 +85,63 @@ extract_parser_opts([K|Rest], Acc) ->
|
||||||
%% everything else should be a legal json string component
|
%% everything else should be a legal json string component
|
||||||
|
|
||||||
json_escape(String, Opts) when is_binary(String) ->
|
json_escape(String, Opts) when is_binary(String) ->
|
||||||
%<< <<(case X of $.->$,; _->X end)>> || <<X>> <= String >>.
|
json_escape(String, Opts, 0, size(String)).
|
||||||
%json_escape(String, Opts, <<>>).
|
|
||||||
json_escape2(String, Opts, 0, size(String)).
|
|
||||||
|
|
||||||
json_escape2(Str, Opts, L, Len) when L < Len ->
|
json_escape(Str, Opts, L, Len) when L < Len ->
|
||||||
case Str of
|
case Str of
|
||||||
<<H:L/binary, $\", T/binary>> -> %"
|
<<H:L/binary, $\", T/binary>> -> %"
|
||||||
json_escape2(<<H/binary, $\\, $\", T/binary>>, Opts, L + 2, Len + 1);%"
|
json_escape(<<H/binary, $\\, $", T/binary>>, Opts, L + 2, Len + 1);
|
||||||
<<H:L/binary, $\\, T/binary>> ->
|
<<H:L/binary, $\\, T/binary>> ->
|
||||||
json_escape2(<<H/binary, $\\, $\\, T/binary>>, Opts, L + 2, Len + 1);
|
json_escape(<<H/binary, $\\, $\\, T/binary>>, Opts, L + 2, Len + 1);
|
||||||
<<H:L/binary, $\b, T/binary>> ->
|
<<H:L/binary, $\b, T/binary>> ->
|
||||||
json_escape2(<<H/binary, $\\, $\b, T/binary>>, Opts, L + 2, Len + 1);
|
json_escape(<<H/binary, $\\, $b, T/binary>>, Opts, L + 2, Len + 1);
|
||||||
<<H:L/binary, $\f, T/binary>> ->
|
<<H:L/binary, $\f, T/binary>> ->
|
||||||
json_escape2(<<H/binary, $\\, $\f, T/binary>>, Opts, L + 2, Len + 1);
|
json_escape(<<H/binary, $\\, $f, T/binary>>, Opts, L + 2, Len + 1);
|
||||||
<<H:L/binary, $\n, T/binary>> ->
|
<<H:L/binary, $\n, T/binary>> ->
|
||||||
json_escape2(<<H/binary, $\\, $\n, T/binary>>, Opts, L + 2, Len + 1);
|
json_escape(<<H/binary, $\\, $n, T/binary>>, Opts, L + 2, Len + 1);
|
||||||
<<H:L/binary, $\r, T/binary>> ->
|
<<H:L/binary, $\r, T/binary>> ->
|
||||||
json_escape2(<<H/binary, $\\, $\r, T/binary>>, Opts, L + 2, Len + 1);
|
json_escape(<<H/binary, $\\, $r, T/binary>>, Opts, L + 2, Len + 1);
|
||||||
<<H:L/binary, $\t, T/binary>> ->
|
<<H:L/binary, $\t, T/binary>> ->
|
||||||
json_escape2(<<H/binary, $\\, $\t, T/binary>>, Opts, L + 2, Len + 1);
|
json_escape(<<H/binary, $\\, $t, T/binary>>, Opts, L + 2, Len + 1);
|
||||||
% jsonp
|
<<H:L/binary, $/, T/binary>> ->
|
||||||
<<H:L/binary, 226, 128, 168, T/binary>> ->
|
case Opts#opts.escape_forward_slash of
|
||||||
B = unicode:characters_to_binary(json_escape_sequence(16#2028)),
|
true ->
|
||||||
json_escape2(
|
json_escape(<<H/binary, $\\, $/, T/binary>>, Opts, L + 2, Len + 1);
|
||||||
<<H/binary, B/binary, T/binary>>,
|
false ->
|
||||||
Opts, L + size(B), Len + size(B) - 1
|
json_escape(<<H/binary, $/, T/binary>>, Opts, L + 1, Len)
|
||||||
);
|
end;
|
||||||
<<H:L/binary, 226, 128, 169, T/binary>> ->
|
<<H:L/binary, 16#2028/utf8, T/binary>> ->
|
||||||
B = unicode:characters_to_binary(json_escape_sequence(16#2029)),
|
case Opts#opts.no_jsonp_escapes of
|
||||||
json_escape2(
|
true ->
|
||||||
<<H/binary, B/binary, T/binary>>,
|
json_escape(<<H/binary, 16#2028/utf8, T/binary>>, Opts, L + 3, Len);
|
||||||
Opts, L + size(B), Len + size(B) - 1
|
false ->
|
||||||
);
|
B = unicode:characters_to_binary(json_escape_sequence(16#2028)),
|
||||||
% C >= 0 and C < $\s
|
json_escape(<<H/binary, B/binary, T/binary>>, Opts, L + size(B), Len + size(B) - size(<<16#2028/utf8>>))
|
||||||
?ESC(00) ?ESC(01) ?ESC(02) ?ESC(03) ?ESC(04)
|
end;
|
||||||
?ESC(05) ?ESC(06) ?ESC(07)
|
<<H:L/binary, 16#2029/utf8, T/binary>> ->
|
||||||
?ESC(11) ?ESC(14)
|
case Opts#opts.no_jsonp_escapes of
|
||||||
?ESC(15) ?ESC(16) ?ESC(17) ?ESC(18) ?ESC(19)
|
true ->
|
||||||
?ESC(20) ?ESC(21) ?ESC(22) ?ESC(23) ?ESC(24)
|
json_escape(<<H/binary, 16#2029/utf8, T/binary>>, Opts, L + 3, Len);
|
||||||
?ESC(25) ?ESC(26) ?ESC(27) ?ESC(28) ?ESC(29)
|
false ->
|
||||||
?ESC(30) ?ESC(31)
|
B = unicode:characters_to_binary(json_escape_sequence(16#2029)),
|
||||||
_ ->
|
json_escape(<<H/binary, B/binary, T/binary>>, Opts, L + size(B), Len + size(B) - size(<<16#2029/utf8>>))
|
||||||
json_escape2(Str, Opts, L + 1, Len)
|
end;
|
||||||
end;
|
<<H:L/binary, X/utf8, T/binary>> when X < 32 ->
|
||||||
json_escape2(Str, _, L, Len) when L =:= Len ->
|
B = unicode:characters_to_binary(json_escape_sequence(X)),
|
||||||
Str.
|
json_escape(<<H/binary, B/binary, T/binary>>, Opts, L + size(B), Len + size(B) - size(<<X/utf8>>));
|
||||||
|
<<_:L/binary, X/utf8, _/binary>> when X < 16#0080 ->
|
||||||
%% double quote
|
json_escape(Str, Opts, L + 1, Len);
|
||||||
json_escape(<<$\", Rest/binary>>, Opts, Acc) -> %"
|
<<_:L/binary, X/utf8, _/binary>> when X < 16#0800 ->
|
||||||
json_escape(Rest, Opts, <<Acc/binary, $\\, $\">>); %"
|
json_escape(Str, Opts, L + 2, Len);
|
||||||
%% backslash \ reverse solidus
|
<<_:L/binary, X/utf8, _/binary>> when X < 16#10000 ->
|
||||||
json_escape(<<$\\, Rest/binary>>, Opts, Acc) ->
|
json_escape(Str, Opts, L + 3, Len);
|
||||||
json_escape(Rest, Opts, <<Acc/binary, $\\, $\\>>);
|
<<_:L/binary, _/utf8, _/binary>> ->
|
||||||
%% backspace
|
json_escape(Str, Opts, L + 4, Len);
|
||||||
json_escape(<<$\b, Rest/binary>>, Opts, Acc) ->
|
<<H:L/binary, X, T/binary>> ->
|
||||||
json_escape(Rest, Opts, <<Acc/binary, $\\, $b>>);
|
erlang:error(badarg, [[<<H:L/binary, X, T/binary>>, Opts]])
|
||||||
%% form feed
|
end;
|
||||||
json_escape(<<$\f, Rest/binary>>, Opts, Acc) ->
|
json_escape(Str, _, L, Len) when L =:= Len ->
|
||||||
json_escape(Rest, Opts, <<Acc/binary, $\\, $f>>);
|
Str.
|
||||||
%% newline
|
|
||||||
json_escape(<<$\n, Rest/binary>>, Opts, Acc) ->
|
|
||||||
json_escape(Rest, Opts, <<Acc/binary, $\\, $n>>);
|
|
||||||
%% cr
|
|
||||||
json_escape(<<$\r, Rest/binary>>, Opts, Acc) ->
|
|
||||||
json_escape(Rest, Opts, <<Acc/binary, $\\, $r>>);
|
|
||||||
%% tab
|
|
||||||
json_escape(<<$\t, Rest/binary>>, Opts, Acc) ->
|
|
||||||
json_escape(Rest, Opts, <<Acc/binary, $\\, $t>>);
|
|
||||||
%% other control characters
|
|
||||||
json_escape(<<C/utf8, Rest/binary>>, Opts, Acc) when C >= 0, C < $\s ->
|
|
||||||
json_escape(Rest, Opts, <<Acc/binary, (json_escape_sequence(C))/binary>>);
|
|
||||||
%% escape forward slashes -- optionally -- to faciliate microsoft's retarded
|
|
||||||
%% date format
|
|
||||||
json_escape(<<$/, Rest/binary>>, Opts=#opts{escape_forward_slash=true}, Acc) ->
|
|
||||||
json_escape(Rest, Opts, <<Acc/binary, $\\, $/>>);
|
|
||||||
%% skip escaping u+2028 and u+2029
|
|
||||||
json_escape(<<C/utf8, Rest/binary>>, Opts=#opts{no_jsonp_escapes=true}, Acc)
|
|
||||||
when C == 16#2028; C == 16#2029 ->
|
|
||||||
json_escape(Rest, Opts, <<Acc/binary, C/utf8>>);
|
|
||||||
%% escape u+2028 and u+2029 to avoid problems with jsonp
|
|
||||||
json_escape(<<C/utf8, Rest/binary>>, Opts, Acc)
|
|
||||||
when C == 16#2028; C == 16#2029 ->
|
|
||||||
json_escape(Rest, Opts, <<Acc/binary, (json_escape_sequence(C))/binary>>);
|
|
||||||
%% any other legal codepoint
|
|
||||||
json_escape(<<C/utf8, Rest/binary>>, Opts, Acc) ->
|
|
||||||
json_escape(Rest, Opts, <<Acc/binary, C/utf8>>);
|
|
||||||
json_escape(<<>>, _Opts, Acc) ->
|
|
||||||
Acc;
|
|
||||||
json_escape(Bin, Opts, Acc) ->
|
|
||||||
erlang:error(badarg, [Bin, Opts, Acc]).
|
|
||||||
|
|
||||||
|
|
||||||
%% convert a codepoint to it's \uXXXX equiv.
|
%% convert a codepoint to it's \uXXXX equiv.
|
||||||
|
@ -217,8 +175,8 @@ binary_escape_test_() ->
|
||||||
},
|
},
|
||||||
{"json string hex escape",
|
{"json string hex escape",
|
||||||
?_assertEqual(
|
?_assertEqual(
|
||||||
json_escape(<<1, 2, 3, 11, 26, 30, 31>>, #opts{}),
|
json_escape(<<0, 1, 2, 3, 11, 26, 30, 31>>, #opts{}),
|
||||||
<<"\\u0001\\u0002\\u0003\\u000b\\u001a\\u001e\\u001f">>
|
<<"\\u0000\\u0001\\u0002\\u0003\\u000b\\u001a\\u001e\\u001f">>
|
||||||
)
|
)
|
||||||
},
|
},
|
||||||
{"jsonp protection",
|
{"jsonp protection",
|
||||||
|
@ -238,6 +196,15 @@ binary_escape_test_() ->
|
||||||
json_escape(<<"/Date(1303502009425)/">>, #opts{escape_forward_slash=true}),
|
json_escape(<<"/Date(1303502009425)/">>, #opts{escape_forward_slash=true}),
|
||||||
<<"\\/Date(1303502009425)\\/">>
|
<<"\\/Date(1303502009425)\\/">>
|
||||||
)
|
)
|
||||||
|
},
|
||||||
|
{"bad utf8",
|
||||||
|
?_assertError(badarg, json_escape(<<32, 64, 128, 256>>, #opts{}))
|
||||||
|
},
|
||||||
|
{"all sizes of codepoints",
|
||||||
|
?_assertEqual(
|
||||||
|
json_escape(unicode:characters_to_binary([0, 32, 16#80, 16#800, 16#10000]), #opts{}),
|
||||||
|
<<"\\u0000", 32/utf8, 16#80/utf8, 16#800/utf8, 16#10000/utf8>>
|
||||||
|
)
|
||||||
}
|
}
|
||||||
].
|
].
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue