Merge pull request #230 from martinsumner/mas-i229-loadrepeatedkey

Mas i229 loadrepeatedkey
Martin Sumner, 2018-12-10 14:08:24 +00:00, committed by GitHub
commit 4387837279
3 changed files with 109 additions and 3 deletions

View file

@@ -2028,7 +2028,7 @@ addto_ledgercache({H, SQN, KeyChanges}, Cache) ->
         -> ledger_cache().
 %% @doc
 %% Add a set of changes associated witha single sequence number (journal
-%% update) to the ledger cache. This is used explicitly when laoding the
+%% update) to the ledger cache. This is used explicitly when loading the
 %% ledger from the Journal (i.e. at startup) - and in this case the ETS insert
 %% can be bypassed, as all changes will be flushed to the Penciller before the
 %% load is complete.
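The comment's reasoning, restated as a minimal sketch (a hypothetical module with invented names, not leveled's internals): on the normal PUT path every cache update is mirrored into ETS so it is immediately visible to lookups, while on the Journal-load path the per-change insert is skipped, because a single flush to the Penciller happens before the load completes anyway.

    -module(ledgercache_sketch).
    -export([add_online/2, add_loading/2]).

    %% Normal path: mirror each key change (assumed here to be a
    %% {Key, Metadata} tuple) into the ETS index immediately.
    add_online(KeyChange, EtsTable) ->
        true = ets:insert(EtsTable, KeyChange),
        KeyChange.

    %% Load-from-Journal path: just queue the change; the per-change ETS
    %% insert is skipped because everything is flushed downstream once,
    %% at the end of the load.
    add_loading(KeyChange, LoadQueue) ->
        [KeyChange | LoadQueue].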

View file

@@ -200,7 +200,12 @@ merge_trees(StartKey, EndKey, TreeList, LevelMinus1) ->
 find_pos(<<>>, _Hash, PosList, _SlotID) ->
     PosList;
 find_pos(<<1:1/integer, Hash:23/integer, T/binary>>, Hash, PosList, SlotID) ->
-    find_pos(T, Hash, PosList ++ [SlotID], SlotID);
+    case lists:member(SlotID, PosList) of
+        true ->
+            find_pos(T, Hash, PosList, SlotID);
+        false ->
+            find_pos(T, Hash, PosList ++ [SlotID], SlotID)
+    end;
 find_pos(<<1:1/integer, _Miss:23/integer, T/binary>>, Hash, PosList, SlotID) ->
     find_pos(T, Hash, PosList, SlotID);
 find_pos(<<0:1/integer, NxtSlot:7/integer, T/binary>>, Hash, PosList, _SlotID) ->
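A worked illustration of the change (a sketch, not part of the diff: the hash value and starting slot are invented, and only the clauses shown above are relied on). If repeated updates to one key leave the same 23-bit hash recorded twice within a slot's section of the position binary, the old code appended the slot once per match, while the new code adds each slot at most once:

    Hash = 12345,   %% any value that fits in 23 bits
    PosBin = <<1:1/integer, Hash:23/integer,
                1:1/integer, Hash:23/integer>>,
    %% Before this change: find_pos(PosBin, Hash, [], 1) =:= [1, 1]
    %% After this change:  find_pos(PosBin, Hash, [], 1) =:= [1]

This is what matters for issue #229: without the check, each duplicate position would otherwise trigger redundant work every time the slot is checked.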

View file

@@ -2,7 +2,9 @@
 -include_lib("common_test/include/ct.hrl").
 -include("include/leveled.hrl").
 -export([all/0]).
--export([hot_backup_simple/1,
+-export([
+    recovery_with_samekeyupdates/1,
+    hot_backup_simple/1,
     hot_backup_changes/1,
     retain_strategy/1,
     recovr_strategy/1,
@@ -12,6 +14,7 @@
     ]).

 all() -> [
+    recovery_with_samekeyupdates,
     hot_backup_simple,
     hot_backup_changes,
     retain_strategy,
@@ -22,6 +25,104 @@ all() -> [
    ].

recovery_with_samekeyupdates(_Config) ->
    % Setup to prove https://github.com/martinsumner/leveled/issues/229
    % run a test that involves many updates to the same key, and check that
    % this doesn't cause performance to flatline in either the normal "PUT"
    % case, or in the case of the recovery from a lost keystore
    AcceptableDuration = 180, % 3 minutes
    E2E_SW = os:timestamp(), % Used to track time for overall job

    RootPath = testutil:reset_filestructure(),
    BackupPath = testutil:reset_filestructure("backupSKU"),
    BookOpts = [{root_path, RootPath},
                {cache_size, 2000},
                {max_journalsize, 20000000},
                {sync_strategy, testutil:sync_strategy()}],
    {ok, Book1} = leveled_bookie:book_start(BookOpts),

    % Load in 5K different keys
    % Load 5 keys in 5K times each
    % Load in 5K different keys
    io:format("Commence object generation and load~n"),
    ObjectGen = testutil:get_compressiblevalue_andinteger(),
    IndexGen = fun() -> [] end,
    ObjL1 = testutil:generate_objects(5000,
                                        {fixed_binary, 1},
                                        [],
                                        ObjectGen,
                                        IndexGen,
                                        <<"Bucket1">>),
    testutil:riakload(Book1, ObjL1),
    RepeatedLoadFun =
        fun(_I, _Acc) ->
            ObjRL =
                testutil:generate_objects(5,
                                            {fixed_binary, 5001},
                                            [],
                                            ObjectGen,
                                            IndexGen,
                                            <<"Bucket1">>),
            testutil:riakload(Book1, ObjRL),
            ObjRL
        end,
    FinalObjRL = lists:foldl(RepeatedLoadFun, [], lists:seq(1, 5000)),
    ObjL2 = testutil:generate_objects(5000,
                                        {fixed_binary, 6001},
                                        [],
                                        ObjectGen,
                                        IndexGen,
                                        <<"Bucket1">>),
    testutil:riakload(Book1, ObjL2),

    % Fetch all of ObjL1
    io:format("Check for presence of unique objects~n"),
    ok = testutil:checkhead_forlist(Book1, ObjL1),
    % Fetch all of ObjL2
    ok = testutil:checkhead_forlist(Book1, ObjL2),
    io:format("Check for presence of repeated objects~n"),
    % Fetch repeated objects 200 times each
    CheckFun1 =
        fun(_I) -> ok = testutil:checkhead_forlist(Book1, FinalObjRL) end,
    lists:foreach(CheckFun1, lists:seq(1, 200)),
    io:format("Checks complete~n"),

    io:format("Backup - get journal with no ledger~n"),
    {async, BackupFun} = leveled_bookie:book_hotbackup(Book1),
    ok = BackupFun(BackupPath),

    io:format("Restarting without key store~n"),
    ok = leveled_bookie:book_close(Book1),

    BookOptsBackup = [{root_path, BackupPath},
                        {cache_size, 2000},
                        {max_journalsize, 20000000},
                        {sync_strategy, testutil:sync_strategy()}],
    {ok, Book2} = leveled_bookie:book_start(BookOptsBackup),

    % Fetch all of ObjL1
    io:format("Check for presence of unique objects~n"),
    ok = testutil:checkhead_forlist(Book2, ObjL1),
    % Fetch all of ObjL2
    ok = testutil:checkhead_forlist(Book2, ObjL2),
    io:format("Check for presence of repeated objects~n"),
    % Fetch repeated objects 200 times each
    CheckFun2 =
        fun(_I) -> ok = testutil:checkhead_forlist(Book2, FinalObjRL) end,
    lists:foreach(CheckFun2, lists:seq(1, 200)),
    io:format("Checks complete from backup~n"),

    DurationOfTest = timer:now_diff(os:timestamp(), E2E_SW)/(1000 * 1000),
    io:format("Duration of test was ~w s~n", [DurationOfTest]),
    true = DurationOfTest < AcceptableDuration,

    ok = leveled_bookie:book_close(Book2),
    testutil:reset_filestructure(BackupPath),
    testutil:reset_filestructure().

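The hot-backup pattern the test exercises, pulled out for reference (the path here is illustrative, and default options are assumed for the restarted store):

    %% Prepare a backup fun from a running Bookie, then run it against a path:
    {async, BackupFun} = leveled_bookie:book_hotbackup(Bookie),
    ok = BackupFun("/tmp/leveled_backup"),
    %% A new store can later be started from the backed-up Journal alone;
    %% the ledger (key store) is rebuilt on startup:
    {ok, RestoredBookie} =
        leveled_bookie:book_start([{root_path, "/tmp/leveled_backup"}]).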
hot_backup_simple(_Config) ->
    % The journal may have a hot backup. This allows for an online Bookie
    % to be sent a message to prepare a backup function, which an asynchronous