2010-09-20 19:11:31 -07:00
|
|
|
%% The MIT License
|
|
|
|
|
|
|
|
%% Copyright (c) 2010 Alisdair Sullivan <alisdairsullivan@yahoo.ca>
|
|
|
|
|
|
|
|
%% Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
%% of this software and associated documentation files (the "Software"), to deal
|
|
|
|
%% in the Software without restriction, including without limitation the rights
|
|
|
|
%% to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
%% copies of the Software, and to permit persons to whom the Software is
|
|
|
|
%% furnished to do so, subject to the following conditions:
|
|
|
|
|
|
|
|
%% The above copyright notice and this permission notice shall be included in
|
|
|
|
%% all copies or substantial portions of the Software.
|
|
|
|
|
|
|
|
%% THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
%% IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
%% FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
|
|
%% AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
%% LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
%% OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
%% THE SOFTWARE.
|
|
|
|
|
|
|
|
|
2011-03-22 18:53:02 -07:00
|
|
|
-module(jsx_utils).
|
2010-09-20 19:11:31 -07:00
|
|
|
|
2012-03-02 22:53:23 -08:00
|
|
|
-export([parse_opts/1]).
|
2012-03-04 18:40:00 -08:00
|
|
|
-export([extract_opts/1]).
|
2011-12-04 23:41:00 -08:00
|
|
|
-export([json_escape/2]).
|
2011-09-14 06:44:52 -07:00
|
|
|
|
2012-03-06 19:59:49 -08:00
|
|
|
-include("jsx_opts.hrl").
|
2010-09-20 19:11:31 -07:00
|
|
|
|
2010-09-22 23:22:55 -07:00
|
|
|
|
2011-10-19 06:51:36 -07:00
|
|
|
%% parsing of jsx opts
|
|
|
|
|
|
|
|
parse_opts(Opts) ->
|
|
|
|
parse_opts(Opts, #opts{}).
|
|
|
|
|
|
|
|
parse_opts([], Opts) ->
|
|
|
|
Opts;
|
|
|
|
parse_opts([loose_unicode|Rest], Opts) ->
|
|
|
|
parse_opts(Rest, Opts#opts{loose_unicode=true});
|
|
|
|
parse_opts([escape_forward_slash|Rest], Opts) ->
|
|
|
|
parse_opts(Rest, Opts#opts{escape_forward_slash=true});
|
2011-10-21 18:16:16 -07:00
|
|
|
parse_opts([explicit_end|Rest], Opts) ->
|
|
|
|
parse_opts(Rest, Opts#opts{explicit_end=true});
|
2012-03-14 23:01:59 -07:00
|
|
|
parse_opts([single_quotes|Rest], Opts) ->
|
|
|
|
parse_opts(Rest, Opts#opts{single_quotes=true});
|
2011-10-19 06:51:36 -07:00
|
|
|
parse_opts(_, _) ->
|
|
|
|
{error, badarg}.
|
|
|
|
|
|
|
|
|
2012-03-04 18:40:00 -08:00
|
|
|
extract_opts(Opts) ->
|
|
|
|
extract_parser_opts(Opts, []).
|
|
|
|
|
|
|
|
extract_parser_opts([], Acc) -> Acc;
|
|
|
|
extract_parser_opts([{K,V}|Rest], Acc) ->
|
2012-03-14 23:01:59 -07:00
|
|
|
case lists:member(K, [loose_unicode, escape_forward_slash, explicit_end, single_quotes]) of
|
2012-03-04 18:40:00 -08:00
|
|
|
true -> extract_parser_opts(Rest, [{K,V}] ++ Acc)
|
|
|
|
; false -> extract_parser_opts(Rest, Acc)
|
|
|
|
end;
|
|
|
|
extract_parser_opts([K|Rest], Acc) ->
|
2012-03-14 23:01:59 -07:00
|
|
|
case lists:member(K, [loose_unicode, escape_forward_slash, explicit_end, single_quotes]) of
|
2012-03-04 18:40:00 -08:00
|
|
|
true -> extract_parser_opts(Rest, [K] ++ Acc)
|
|
|
|
; false -> extract_parser_opts(Rest, Acc)
|
|
|
|
end.
|
|
|
|
|
|
|
|
|
2011-09-14 06:44:52 -07:00
|
|
|
%% json string escaping, for utf8 binaries. escape the json control sequences to
|
|
|
|
%% their json equivalent, escape other control characters to \uXXXX sequences,
|
|
|
|
%% everything else should be a legal json string component
|
2011-10-19 06:51:36 -07:00
|
|
|
|
2011-09-14 06:44:52 -07:00
|
|
|
json_escape(String, Opts) when is_binary(String) ->
|
2011-11-29 20:32:47 -08:00
|
|
|
json_escape(String, Opts, <<>>).
|
2011-09-14 06:44:52 -07:00
|
|
|
|
|
|
|
%% double quote
|
|
|
|
json_escape(<<$\", Rest/binary>>, Opts, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, $\\, $\">>);
|
|
|
|
%% backslash \ reverse solidus
|
|
|
|
json_escape(<<$\\, Rest/binary>>, Opts, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, $\\, $\\>>);
|
|
|
|
%% backspace
|
|
|
|
json_escape(<<$\b, Rest/binary>>, Opts, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, $\\, $b>>);
|
|
|
|
%% form feed
|
|
|
|
json_escape(<<$\f, Rest/binary>>, Opts, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, $\\, $f>>);
|
|
|
|
%% newline
|
|
|
|
json_escape(<<$\n, Rest/binary>>, Opts, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, $\\, $n>>);
|
|
|
|
%% cr
|
|
|
|
json_escape(<<$\r, Rest/binary>>, Opts, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, $\\, $r>>);
|
|
|
|
%% tab
|
|
|
|
json_escape(<<$\t, Rest/binary>>, Opts, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, $\\, $t>>);
|
|
|
|
%% other control characters
|
|
|
|
json_escape(<<C/utf8, Rest/binary>>, Opts, Acc) when C >= 0, C < $\s ->
|
|
|
|
json_escape(Rest,
|
|
|
|
Opts,
|
2011-11-30 19:08:38 -08:00
|
|
|
<<Acc/binary, (unicode:characters_to_binary(json_escape_sequence(C)))/binary>>
|
2011-09-14 06:44:52 -07:00
|
|
|
);
|
|
|
|
%% escape forward slashes -- optionally -- to faciliate microsoft's retarded
|
|
|
|
%% date format
|
|
|
|
json_escape(<<$/, Rest/binary>>, Opts=#opts{escape_forward_slash=true}, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, $\\, $/>>);
|
|
|
|
%% escape u+2028 and u+2029 to avoid problems with jsonp
|
|
|
|
json_escape(<<C/utf8, Rest/binary>>, Opts, Acc)
|
|
|
|
when C == 16#2028; C == 16#2029 ->
|
|
|
|
json_escape(Rest,
|
|
|
|
Opts,
|
2011-11-30 19:08:38 -08:00
|
|
|
<<Acc/binary, (unicode:characters_to_binary(json_escape_sequence(C)))/binary>>
|
2011-09-14 06:44:52 -07:00
|
|
|
);
|
|
|
|
%% any other legal codepoint
|
|
|
|
json_escape(<<C/utf8, Rest/binary>>, Opts, Acc) ->
|
|
|
|
json_escape(Rest, Opts, <<Acc/binary, C/utf8>>);
|
|
|
|
json_escape(<<>>, _Opts, Acc) ->
|
|
|
|
Acc;
|
|
|
|
json_escape(Rest, Opts, Acc) ->
|
|
|
|
erlang:error(badarg, [Rest, Opts, Acc]).
|
|
|
|
|
|
|
|
|
|
|
|
%% convert a codepoint to it's \uXXXX equiv.
|
|
|
|
json_escape_sequence(X) ->
|
|
|
|
<<A:4, B:4, C:4, D:4>> = <<X:16>>,
|
|
|
|
[$\\, $u, (to_hex(A)), (to_hex(B)), (to_hex(C)), (to_hex(D))].
|
|
|
|
|
|
|
|
|
|
|
|
to_hex(10) -> $a;
|
|
|
|
to_hex(11) -> $b;
|
|
|
|
to_hex(12) -> $c;
|
|
|
|
to_hex(13) -> $d;
|
|
|
|
to_hex(14) -> $e;
|
|
|
|
to_hex(15) -> $f;
|
|
|
|
to_hex(X) -> X + 48. %% ascii "1" is [49], "2" is [50], etc...
|
2010-09-20 19:11:31 -07:00
|
|
|
|
|
|
|
|
2011-12-04 23:41:00 -08:00
|
|
|
|
2010-09-20 19:11:31 -07:00
|
|
|
%% eunit tests
|
|
|
|
-ifdef(TEST).
|
2011-08-10 01:44:38 -07:00
|
|
|
-include_lib("eunit/include/eunit.hrl").
|
2010-09-20 19:11:31 -07:00
|
|
|
|
2011-09-14 06:44:52 -07:00
|
|
|
|
|
|
|
binary_escape_test_() ->
|
|
|
|
[
|
|
|
|
{"json string escaping",
|
|
|
|
?_assert(json_escape(
|
|
|
|
<<"\"\\\b\f\n\r\t">>, #opts{}
|
|
|
|
) =:= <<"\\\"\\\\\\b\\f\\n\\r\\t">>
|
|
|
|
)
|
|
|
|
},
|
|
|
|
{"json string hex escape",
|
|
|
|
?_assert(json_escape(
|
|
|
|
<<1, 2, 3, 11, 26, 30, 31>>, #opts{}
|
|
|
|
) =:= <<"\\u0001\\u0002\\u0003\\u000b\\u001a\\u001e\\u001f">>
|
|
|
|
)
|
|
|
|
},
|
|
|
|
{"jsonp protection",
|
|
|
|
?_assert(json_escape(
|
|
|
|
<<226, 128, 168, 226, 128, 169>>, #opts{}
|
|
|
|
) =:= <<"\\u2028\\u2029">>
|
|
|
|
)
|
|
|
|
},
|
|
|
|
{"microsoft i hate your date format",
|
|
|
|
?_assert(json_escape(<<"/Date(1303502009425)/">>,
|
|
|
|
#opts{escape_forward_slash=true}
|
|
|
|
) =:= <<"\\/Date(1303502009425)\\/">>
|
|
|
|
)
|
|
|
|
}
|
|
|
|
].
|
|
|
|
|
2010-09-20 19:11:31 -07:00
|
|
|
-endif.
|