Make binary Riak bucket/keys a special case

When leveled is used with Riak, buckets and keys are always binaries, so we can treat them as such. We want to move tictac tree testing away from the leveled internal tests to a set of tests for the Riak scenario, so riak_SUITE has been created for this and other Riak-specific backend tests.
2017-10-30 17:39:21 +00:00 · 2017-10-30 17:39:21 +00:00 · f5878548f9
commit f5878548f9
parent 6bb7ceef0c
3 changed files with 172 additions and 0 deletions
--- a/src/leveled_codec.erl
+++ b/src/leveled_codec.erl
@ -91,6 +91,9 @@ segment_hash(Key) when is_binary(Key) ->
    <<SegmentID:16/integer, ExtraHash:32/integer, _Rest/binary>> = 
        crypto:hash(md5, Key),
    {SegmentID, ExtraHash};
 % Special case for keys tagged ?RIAK_TAG whose bucket and key are both
 % binaries (and whose fourth element is null): hash the concatenation of the
 % bucket and key binaries directly rather than the term_to_binary/1 encoding
 % of the whole key tuple.
 segment_hash({?RIAK_TAG, Bucket, Key, null}) 
                                    when is_binary(Bucket), is_binary(Key) ->
    segment_hash(<<Bucket/binary, Key/binary>>);
 % Fallback for any other key: serialise the term with term_to_binary/1 and
 % hash the resulting binary.
 segment_hash(Key) ->
    segment_hash(term_to_binary(Key)).
--- a/test/end_to_end/riak_SUITE.erl
+++ b/test/end_to_end/riak_SUITE.erl
@ -0,0 +1,157 @@
 -module(riak_SUITE).
 -include_lib("common_test/include/ct.hrl").
 -include("include/leveled.hrl").
 -export([all/0]).
 -export([
            perbucket_aae/1
            ]).
 %% Common Test callback listing the test cases to be run in this suite.
 all() ->
    [perbucket_aae].
 -define(MAGIC, 53). % riak_kv -> riak_object
 %% Test case comparing two stores holding Riak objects with binary buckets
 %% and keys.
 %%
 %% Store A is loaded with a single test object plus a generated set of
 %% objects; store B is loaded with the generated set only.  A tictac tree is
 %% built from a fold over the heads in each store, and the test asserts that:
 %% - the object counts differ by exactly one;
 %% - exactly one dirty leaf is found, and it matches the segment hash of the
 %%   test object's concatenated bucket and key;
 %% - a follow-up fold restricted to the dirty segment finds exactly one
 %%   {Bucket, Key, VClock} entry in store A that is not in store B.
 %%
 %% _Config is the Common Test configuration, which is not used.  Any failed
 %% assertion crashes the test case with a badmatch.
 perbucket_aae(_Config) ->
    TreeSize = small,
    % Test requires multiple different databases, so want to mount them all
    % on individual file paths
    RootPathA = testutil:reset_filestructure("testA"),
    RootPathB = testutil:reset_filestructure("testB"),

    % Start the first database, load a test object, close it, start it again
    StartOpts1 = [{root_path, RootPathA},
                    {max_pencillercachesize, 16000},
                    {sync_strategy, riak_sync}],
    {ok, Bookie1} = leveled_bookie:book_start(StartOpts1),
    {B1, K1, V1, S1, MD} = {<<"Bucket">>,
                                <<"Key1.1.4567.4321">>,
                                <<"Value1">>,
                                [],
                                [{<<"MDK1">>, <<"MDV1">>}]},
    {TestObject, TestSpec} = testutil:generate_testobject(B1, K1, V1, S1, MD),
    ok = testutil:book_riakput(Bookie1, TestObject, TestSpec),
    testutil:check_forobject(Bookie1, TestObject),
    ok = leveled_bookie:book_close(Bookie1),
    StartOpts2 = [{root_path, RootPathA},
                    {max_journalsize, 500000000},
                    {max_pencillercachesize, 32000},
                    {sync_strategy, testutil:sync_strategy()}],
    {ok, Bookie2} = leveled_bookie:book_start(StartOpts2),
    % The object must have survived the close and restart of the store
    testutil:check_forobject(Bookie2, TestObject),

    % Generate the objects to be used within the test, and load them into
    % the first store (outputting the generated objects as a list of lists)
    % to be used elsewhere
    % NOTE(review): this comment originally stated 200K objects; four
    % generator entries with a chunk size of 40000 suggests 160K - confirm
    GenList = 
        [{binary, 2}, {binary, 40002}, {binary, 80002}, {binary, 120002}],
    CLs = testutil:load_objects(40000,
                                GenList,
                                Bookie2,
                                TestObject,
                                fun testutil:generate_smallobjects/2,
                                40000),

    % Start a new store, and load the same objects (except for the original
    % test object) into this store
    StartOpts3 = [{root_path, RootPathB},
                    {max_journalsize, 200000000},
                    {max_pencillercachesize, 16000},
                    {sync_strategy, testutil:sync_strategy()}],
    {ok, Bookie3} = leveled_bookie:book_start(StartOpts3),
    lists:foreach(fun(ObjL) -> testutil:riakload(Bookie3, ObjL) end, CLs),

    % Now run a tictac query against both stores to see the extent to which
    % state between stores is consistent
    HeadTicTacFolder = 
        {foldheads_allkeys,
            ?RIAK_TAG,
            {fun head_tictac_foldfun/4, 
                {0, leveled_tictac:new_tree(test, TreeSize)}},
            false,
            true},

    SW_TT0 = os:timestamp(),
    {async, Book2TreeFolder} =
        leveled_bookie:book_returnfolder(Bookie2, HeadTicTacFolder),
    {async, Book3TreeFolder} =
        leveled_bookie:book_returnfolder(Bookie3, HeadTicTacFolder),
    {Count2, Book2Tree} = Book2TreeFolder(),
    {Count3, Book3Tree} = Book3TreeFolder(),
    Time_TT0 = timer:now_diff(os:timestamp(), SW_TT0)/1000,
    io:format("Two tree folds took ~w milliseconds ~n", [Time_TT0]),

    io:format("Fold over keys revealed counts of ~w and ~w~n", 
                [Count2, Count3]),

    % The first store holds exactly one more object (the original test
    % object) than the second store
    1 = Count2 - Count3,

    DLs = leveled_tictac:find_dirtyleaves(Book2Tree, Book3Tree),
    io:format("Found dirty leaves with Riak fold_heads of ~w~n",
                [length(DLs)]),
    true = length(DLs) == 1,
    % The single dirty leaf must correspond to the test object: its low 16
    % bits have to equal the segment ID which segment_hash returns for the
    % concatenated bucket and key
    {ExpSeg, _ExpExtra} = leveled_codec:segment_hash(<<B1/binary, K1/binary>>),
    [ActualSeg] = DLs,
    true = ExpSeg == ActualSeg band 65535,

    % Fold over the heads again, this time collecting the keys and clocks of
    % only those objects which fall into the dirty segment
    HeadSegmentFolder = 
        {foldheads_allkeys,
            ?RIAK_TAG,
            {get_segment_folder(DLs, TreeSize),  []},
            false,
            true},

    SW_SL0 = os:timestamp(),
    {async, Book2SegFolder} =
        leveled_bookie:book_returnfolder(Bookie2, HeadSegmentFolder),
    {async, Book3SegFolder} =
        leveled_bookie:book_returnfolder(Bookie3, HeadSegmentFolder),
    Book2SegList = Book2SegFolder(),
    Book3SegList = Book3SegFolder(),
    Time_SL0 = timer:now_diff(os:timestamp(), SW_SL0)/1000,
    io:format("Two segment list folds took ~w milliseconds ~n", [Time_SL0]),
    io:format("Segment lists found ~w ~w~n", [Book2SegList, Book3SegList]),

    % Only one entry should be present in the first store's segment list
    % without also being present in the second store's list
    Delta = lists:subtract(Book2SegList, Book3SegList),
    true = length(Delta) == 1,

    % Close both stores, so that the test case does not leave running store
    % processes and open files behind once it has completed
    ok = leveled_bookie:book_close(Bookie2),
    ok = leveled_bookie:book_close(Bookie3).
 %% Build a fold fun of arity 4 (bucket, key, proxy object, accumulator) which
 %% collects {Bucket, Key, VClock} for every object whose tictac segment - as
 %% calculated for a tree of TreeSize from the concatenated bucket and key -
 %% is a member of SegmentList.  Objects in other segments leave the
 %% accumulator unchanged.
 get_segment_folder(SegmentList, TreeSize) ->
    fun(Bucket, Key, ProxyObj, Acc) ->
        Hash32 = leveled_tictac:keyto_segment32(<<Bucket/binary, Key/binary>>),
        InScope =
            lists:member(leveled_tictac:get_segment(Hash32, TreeSize),
                            SegmentList),
        case InScope of
            false ->
                Acc;
            true ->
                % Only the vector clock is needed from the object summary
                {VClock, _Size, _SibCount} = summary_from_binary(ProxyObj),
                [{Bucket, Key, VClock}|Acc]
        end
    end.
 %% Fold fun for a heads fold which builds a tictac tree.  The accumulator is
 %% {Count, Tree}: the count is incremented for every object folded over, and
 %% the object is added to the tree using the concatenated bucket and key as
 %% the tree key and the sorted vector clock as the value.
 head_tictac_foldfun(B, K, PO, {Count, TreeAcc}) ->
    KeyAndClockFun = 
        fun({BucketBin, KeyBin}, HeadObj) ->
            {VClock, _Size, _SibCount} = summary_from_binary(HeadObj),
            TreeKey = <<BucketBin/binary, KeyBin/binary>>,
            {TreeKey, lists:sort(VClock)}
        end,
    UpdCount = Count + 1,
    UpdTree = leveled_tictac:add_kv(TreeAcc, {B, K}, PO, KeyAndClockFun),
    {UpdCount, UpdTree}.
 %% Summarise an object binary as {VClock, Size, SiblingCount}.
 %% A binary starting with byte 131 is decoded with binary_to_term/1 and must
 %% yield a {proxy_object, HeadBin, Size, Fetcher} tuple; the summary is then
 %% taken from the head binary using the size held in the proxy.  Any other
 %% binary is summarised directly, using its own byte size as the size.
 summary_from_binary(<<131, _/binary>> = ProxyBin) ->
    ProxyTerm = binary_to_term(ProxyBin),
    {proxy_object, Head, Size, _FetchFun} = ProxyTerm,
    summary_from_binary(Head, Size);
 summary_from_binary(RiakBin) when is_binary(RiakBin) ->
    Size = byte_size(RiakBin),
    summary_from_binary(RiakBin, Size).
 %% Parse the header of an object binary: a ?MAGIC byte, a version byte of 1,
 %% a 32-bit vector clock length followed by the vector clock binary, and a
 %% 32-bit sibling count.  Returns {VClock, ObjSize, SiblingCount} where the
 %% vector clock has been decoded with binary_to_term/1 and passed through
 %% lists:usort/1.  Crashes with a badmatch if the header does not fit.
 summary_from_binary(ObjBin, ObjSize) ->
    <<?MAGIC:8/integer, 1:8/integer,
        VLen:32/integer, VBin:VLen/binary,
        Siblings:32/integer,
        _Tail/binary>> = ObjBin,
    VClock = lists:usort(binary_to_term(VBin)),
    {VClock, ObjSize, Siblings}.
--- a/test/end_to_end/testutil.erl
+++ b/test/end_to_end/testutil.erl
@ -356,6 +356,18 @@ generate_objects(Count, uuid, ObjL, Value, IndexGen, Bucket) ->
                        Value,
                        IndexGen,
                        Bucket);
 % Clause for a {binary, KeyNumber} key generator: both the Bucket and the
 % generated "Key<KeyNumber>" name are passed through list_to_binary/1 before
 % the object is built, so the resulting object has a binary bucket and key.
 % The new {Random, Object, Spec} entry is appended to ObjL, and generation
 % continues with Count - 1 and the next key number.
 generate_objects(Count, {binary, KeyNumber}, ObjL, Value, IndexGen, Bucket) ->
    {Obj1, Spec1} = 
        set_object(list_to_binary(Bucket),
                    list_to_binary("Key" ++ integer_to_list(KeyNumber)),
                    Value,
                    IndexGen),
    generate_objects(Count - 1,
                        {binary, KeyNumber + 1},
                        ObjL ++ [{leveled_rand:uniform(), Obj1, Spec1}],
                        Value,
                        IndexGen,
                        Bucket);
 generate_objects(Count, KeyNumber, ObjL, Value, IndexGen, Bucket) ->
    {Obj1, Spec1} = set_object(Bucket,
                                "Key" ++ integer_to_list(KeyNumber),