From 49490c38ef1a51ad085e978ab8876f979b7f3f0c Mon Sep 17 00:00:00 2001 From: Martin Sumner Date: Tue, 19 Dec 2023 11:56:03 +0000 Subject: [PATCH] Add performance/profiling test (#424) * Add performance/profiling test Add test to perf_SUITE to do performance tests and also profile different activities in leveled. This can then be used to highlight functions with unexpectedly high execution times, and prove the impact of changes. Switch between riak_ctperf and riak_fullperf to change from standard test (with profile option) to full-scale performance test * Change shape of default perfTest * Change fullPerf Change the fullPerf test to run more tests, but with fewer keys. Given that RS of 512 is being pushed in Riak, 2M objects is still a 300M+ object cluster. 10M >> 1B. So these are still reasonable sizes to test. A profilePerf test also added to generate all the profiles based on 2M objects. * Extend test Queries were previously all returning a large number of index entries - changes made to make number of entries per query more realistic. Also an update process added to show difference between loading and rotating keys. * Relabel as AAE fold * Test v5 Test mini-queries - where generally a small number of entries are returned * Default to ctperf --- src/leveled_imanifest.erl | 7 +- src/leveled_inker.erl | 28 +- src/leveled_penciller.erl | 20 +- src/leveled_pmanifest.erl | 28 +- test/end_to_end/basic_SUITE.erl | 82 ++++- test/end_to_end/perf_SUITE.erl | 586 ++++++++++++++++++++++++++++---- test/end_to_end/testutil.erl | 11 + 7 files changed, 683 insertions(+), 79 deletions(-) diff --git a/src/leveled_imanifest.erl b/src/leveled_imanifest.erl index 8532af2..4248beb 100644 --- a/src/leveled_imanifest.erl +++ b/src/leveled_imanifest.erl @@ -19,7 +19,8 @@ reader/2, writer/3, printer/1, - complete_filex/0 + complete_filex/0, + get_cdbpids/1 ]). -define(MANIFEST_FILEX, "man"). 
@@ -218,6 +219,10 @@ from_list(Manifest) -> % reads are more common than stale reads lists:foldr(fun prepend_entry/2, [], Manifest). +-spec get_cdbpids(manifest()) -> list(pid()). +%% @doc return a list of PIDs within the manifest +get_cdbpids(Manifest) -> + lists:map(fun(ME) -> element(3, ME) end, to_list(Manifest)). %%%============================================================================ %%% Internal Functions diff --git a/src/leveled_inker.erl b/src/leveled_inker.erl index 3c52ab0..6e38151 100644 --- a/src/leveled_inker.erl +++ b/src/leveled_inker.erl @@ -118,14 +118,20 @@ ink_loglevel/2, ink_addlogs/2, ink_removelogs/2, - ink_getjournalsqn/1]). + ink_getjournalsqn/1, + ink_getcdbpids/1, + ink_getclerkpid/1 + ]). -export([filepath/2, filepath/3]). -ifdef(TEST). --export([build_dummy_journal/0, clean_testdir/1]). +-export( + [build_dummy_journal/0, clean_testdir/1] +). -endif. + -define(MANIFEST_FP, "journal_manifest"). -define(FILES_FP, "journal_files"). -define(COMPACT_FP, "post_compact"). @@ -480,6 +486,19 @@ ink_removelogs(Pid, ForcedLogs) -> ink_getjournalsqn(Pid) -> gen_server:call(Pid, get_journalsqn, infinity). +-spec ink_getcdbpids(pid()) -> list(pid()). +%% @doc +%% Used for profiling in tests - get a list of SST PIDs to profile +ink_getcdbpids(Pid) -> + gen_server:call(Pid, get_cdbpids). + +-spec ink_getclerkpid(pid()) -> pid(). +%% @doc +%% Used for profiling in tests - get the clerk PID to profile +ink_getclerkpid(Pid) -> + gen_server:call(Pid, get_clerkpid). 
+ + %%%============================================================================ %%% gen_server callbacks %%%============================================================================ @@ -673,6 +692,11 @@ handle_call({check_sqn, LedgerSQN}, _From, State) -> end; handle_call(get_journalsqn, _From, State) -> {reply, {ok, State#state.journal_sqn}, State}; +handle_call(get_cdbpids, _From, State) -> + CDBPids = leveled_imanifest:get_cdbpids(State#state.manifest), + {reply, [State#state.active_journaldb|CDBPids], State}; +handle_call(get_clerkpid, _From, State) -> + {reply, State#state.clerk, State}; handle_call(close, _From, State=#state{is_snapshot=Snap}) when Snap == true -> ok = ink_releasesnapshot(State#state.source_inker, self()), {stop, normal, ok, State}; diff --git a/src/leveled_penciller.erl b/src/leveled_penciller.erl index db2ef3b..97d7618 100644 --- a/src/leveled_penciller.erl +++ b/src/leveled_penciller.erl @@ -201,6 +201,8 @@ sst_rootpath/1, sst_filename/3]). +-export([pcl_getsstpids/1, pcl_getclerkpid/1]). + -ifdef(TEST). -export([ clean_testdir/1]). @@ -614,6 +616,18 @@ pcl_addlogs(Pid, ForcedLogs) -> pcl_removelogs(Pid, ForcedLogs) -> gen_server:cast(Pid, {remove_logs, ForcedLogs}). +-spec pcl_getsstpids(pid()) -> list(pid()). +%% @doc +%% Used for profiling in tests - get a list of SST PIDs to profile +pcl_getsstpids(Pid) -> + gen_server:call(Pid, get_sstpids). + +-spec pcl_getclerkpid(pid()) -> pid(). +%% @doc +%% Used for profiling in tests - get the clerk PID to profile +pcl_getclerkpid(Pid) -> + gen_server:call(Pid, get_clerkpid). 
+ %%%============================================================================ %%% gen_server callbacks %%%============================================================================ @@ -965,7 +979,11 @@ handle_call(check_for_work, _From, State) -> {_WL, WC} = leveled_pmanifest:check_for_work(State#state.manifest), {reply, WC > 0, State}; handle_call(persisted_sqn, _From, State) -> - {reply, State#state.persisted_sqn, State}. + {reply, State#state.persisted_sqn, State}; +handle_call(get_sstpids, _From, State) -> + {reply, leveled_pmanifest:get_sstpids(State#state.manifest), State}; +handle_call(get_clerkpid, _From, State) -> + {reply, State#state.clerk, State}. handle_cast({manifest_change, Manifest}, State) -> NewManSQN = leveled_pmanifest:get_manifest_sqn(Manifest), diff --git a/src/leveled_pmanifest.erl b/src/leveled_pmanifest.erl index b951930..eb59ad0 100644 --- a/src/leveled_pmanifest.erl +++ b/src/leveled_pmanifest.erl @@ -46,7 +46,8 @@ levelzero_present/1, check_bloom/3, report_manifest_level/2, - snapshot_pids/1 + snapshot_pids/1, + get_sstpids/1 ]). -export([ @@ -699,6 +700,31 @@ check_bloom(Manifest, FP, Hash) -> snapshot_pids(Manifest) -> lists:map(fun(S) -> element(1, S) end, Manifest#manifest.snapshots). +-spec get_sstpids(manifest()) -> list(pid()). +%% @doc +%% Return a list of all SST PIDs in the current manifest +get_sstpids(Manifest) -> + FoldFun = + fun(I, Acc) -> + Level = array:get(I, Manifest#manifest.levels), + LevelAsList = + case I of + I when I > 1 -> + leveled_tree:to_list(Level); + _ -> + Level + end, + Pids = + lists:map( + fun(MaybeME) -> + ME = get_manifest_entry(MaybeME), + ME#manifest_entry.owner + end, + LevelAsList), + Acc ++ Pids + end, + lists:foldl(FoldFun, [], lists:seq(0, Manifest#manifest.basement)). 
+ %%%============================================================================ %%% Internal Functions %%%============================================================================ diff --git a/test/end_to_end/basic_SUITE.erl b/test/end_to_end/basic_SUITE.erl index e5ed2e2..56d5657 100644 --- a/test/end_to_end/basic_SUITE.erl +++ b/test/end_to_end/basic_SUITE.erl @@ -14,7 +14,8 @@ bigjournal_littlejournal/1, bigsst_littlesst/1, safereaderror_startup/1, - remove_journal_test/1 + remove_journal_test/1, + bigpcl_bucketlist/1 ]). all() -> [ @@ -30,7 +31,8 @@ all() -> [ bigjournal_littlejournal, bigsst_littlesst, safereaderror_startup, - remove_journal_test + remove_journal_test, + bigpcl_bucketlist ]. @@ -1197,4 +1199,78 @@ safereaderror_startup(_Config) -> {ok, ReadBack} = leveled_bookie:book_get(Bookie2, B1, K1), io:format("Read back ~w", [ReadBack]), true = ReadBack == Obj2, - ok = leveled_bookie:book_close(Bookie2). \ No newline at end of file + ok = leveled_bookie:book_close(Bookie2). + +bigpcl_bucketlist(_Config) -> + %% https://github.com/martinsumner/leveled/issues/326 + %% In OTP 22+ there appear to be issues with anonymous functions which + %% have a reference to loop state, requiring a copy of all the loop state + %% to be made when returning the function. + %% This test creates alarge loop state on the leveled_penciller to prove + %% this. + %% The problem can be resolved simply by renaming the element of the loop + %% state using within the anonymous function. 
+ RootPath = testutil:reset_filestructure(), + BucketCount = 500, + ObjectCount = 100, + StartOpts1 = [{root_path, RootPath}, + {max_journalsize, 50000000}, + {cache_size, 4000}, + {max_pencillercachesize, 128000}, + {max_sstslots, 256}, + {sync_strategy, testutil:sync_strategy()}], + {ok, Bookie1} = leveled_bookie:book_start(StartOpts1), + BucketList = + lists:map(fun(I) -> list_to_binary(integer_to_list(I)) end, + lists:seq(1, BucketCount)), + + MapFun = + fun(B) -> + testutil:generate_objects(ObjectCount, 1, [], + leveled_rand:rand_bytes(100), + fun() -> [] end, + B) + end, + ObjLofL = lists:map(MapFun, BucketList), + lists:foreach(fun(ObjL) -> testutil:riakload(Bookie1, ObjL) end, ObjLofL), + BucketFold = + fun(B, _K, _V, Acc) -> + case sets:is_element(B, Acc) of + true -> + Acc; + false -> + sets:add_element(B, Acc) + end + end, + FBAccT = {BucketFold, sets:new()}, + + {async, BucketFolder1} = + leveled_bookie:book_headfold(Bookie1, + ?RIAK_TAG, + {bucket_list, BucketList}, + FBAccT, + false, false, false), + + {FoldTime1, BucketList1} = timer:tc(BucketFolder1, []), + true = BucketCount == sets:size(BucketList1), + ok = leveled_bookie:book_close(Bookie1), + + {ok, Bookie2} = leveled_bookie:book_start(StartOpts1), + + {async, BucketFolder2} = + leveled_bookie:book_headfold(Bookie2, + ?RIAK_TAG, + {bucket_list, BucketList}, + FBAccT, + false, false, false), + {FoldTime2, BucketList2} = timer:tc(BucketFolder2, []), + true = BucketCount == sets:size(BucketList2), + + io:format("Fold pre-close ~w ms post-close ~w ms~n", + [FoldTime1 div 1000, FoldTime2 div 1000]), + + true = FoldTime1 < 10 * FoldTime2, + %% The fold in-memory should be the same order of magnitude of response + %% time as the fold post-persistence + + ok = leveled_bookie:book_destroy(Bookie2). 
\ No newline at end of file diff --git a/test/end_to_end/perf_SUITE.erl b/test/end_to_end/perf_SUITE.erl index 9ac6f39..1394f0a 100644 --- a/test/end_to_end/perf_SUITE.erl +++ b/test/end_to_end/perf_SUITE.erl @@ -1,85 +1,529 @@ -module(perf_SUITE). --include_lib("common_test/include/ct.hrl"). --include("include/leveled.hrl"). --export([all/0]). --export([bigpcl_bucketlist/1 - ]). - -all() -> [bigpcl_bucketlist]. +-include("../include/leveled.hrl"). +-define(INFO, info). +-export([all/0, suite/0]). +-export([ + riak_ctperf/1, riak_fullperf/1, riak_profileperf/1 +]). +all() -> [riak_ctperf]. +suite() -> [{timetrap, {hours, 16}}]. -bigpcl_bucketlist(_Config) -> - %% https://github.com/martinsumner/leveled/issues/326 - %% In OTP 22+ there appear to be issues with anonymous functions which - %% have a reference to loop state, requiring a copy of all the loop state - %% to be made when returning the function. - %% This test creates alarge loop state on the leveled_penciller to prove - %% this. - %% The problem can be resolved simply by renaming the element of the loop - %% state using within the anonymous function. 
- RootPath = testutil:reset_filestructure(), - BucketCount = 500, - ObjectCount = 100, - StartOpts1 = [{root_path, RootPath}, - {max_journalsize, 50000000}, - {cache_size, 4000}, - {max_pencillercachesize, 128000}, - {max_sstslots, 256}, - {sync_strategy, testutil:sync_strategy()}, - {compression_point, on_compact}], - {ok, Bookie1} = leveled_bookie:book_start(StartOpts1), - BucketList = - lists:map(fun(I) -> list_to_binary(integer_to_list(I)) end, - lists:seq(1, BucketCount)), - MapFun = - fun(B) -> - testutil:generate_objects(ObjectCount, 1, [], - leveled_rand:rand_bytes(100), - fun() -> [] end, - B) - end, - ObjLofL = lists:map(MapFun, BucketList), - lists:foreach(fun(ObjL) -> testutil:riakload(Bookie1, ObjL) end, ObjLofL), - BucketFold = - fun(B, _K, _V, Acc) -> - case sets:is_element(B, Acc) of - true -> - Acc; - false -> - sets:add_element(B, Acc) +% For full performance test +riak_fullperf(_Config) -> + R2A = riak_load_tester(<<"B0">>, 2000000, 2048, [], native), + output_result(R2A), + R2B = riak_load_tester(<<"B0">>, 2000000, 2048, [], native), + output_result(R2B), + R2C = riak_load_tester(<<"B0">>, 2000000, 2048, [], native), + output_result(R2C), + R5A = riak_load_tester(<<"B0">>, 5000000, 2048, [], native), + output_result(R5A), + R5B = riak_load_tester(<<"B0">>, 5000000, 2048, [], native), + output_result(R5B), + R10 = riak_load_tester(<<"B0">>, 10000000, 2048, [], native), + output_result(R10) + . + +riak_profileperf(_Config) -> + riak_load_tester( + <<"B0">>, + 2000000, + 2048, + [load, head, get, query, mini_query, full, guess, estimate, update], + native). + +% For standard ct test runs +riak_ctperf(_Config) -> + riak_load_tester(<<"B0">>, 400000, 1024, [], native). 
+ +riak_load_tester(Bucket, KeyCount, ObjSize, ProfileList, PressMethod) -> + ct:log( + ?INFO, + "Basic riak test with KeyCount ~w ObjSize ~w", + [KeyCount, ObjSize] + ), + IndexCount = 100000, + + GetFetches = KeyCount div 4, + HeadFetches = KeyCount div 2, + IndexesReturned = KeyCount * 2, + + RootPath = testutil:reset_filestructure("riakLoad"), + StartOpts1 = + [{root_path, RootPath}, + {sync_strategy, testutil:sync_strategy()}, + {log_level, warn}, + {compression_method, PressMethod}, + {forced_logs, + [b0015, b0016, b0017, b0018, p0032, sst12]} + ], + + {ok, Bookie1} = leveled_bookie:book_start(StartOpts1), + + IndexGenFun = + fun(ListID) -> + fun() -> + RandInt = leveled_rand:uniform(IndexCount - 1), + IntIndex = "integer" ++ integer_to_list(ListID) ++ "_int", + BinIndex = "binary" ++ integer_to_list(ListID) ++ "_bin", + [{add, list_to_binary(IntIndex), RandInt}, + {add, list_to_binary(IntIndex), RandInt + 1}, + {add, list_to_binary(BinIndex), <>}, + {add, list_to_binary(BinIndex), <<(RandInt + 1):32/integer>>}] end end, - FBAccT = {BucketFold, sets:new()}, - {async, BucketFolder1} = - leveled_bookie:book_headfold(Bookie1, - ?RIAK_TAG, - {bucket_list, BucketList}, - FBAccT, - false, false, false), + CountPerList = KeyCount div 10, - {FoldTime1, BucketList1} = timer:tc(BucketFolder1, []), - true = BucketCount == sets:size(BucketList1), - ok = leveled_bookie:book_close(Bookie1), + TC4 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 4), + TC1 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 1), + TC9 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 9), + TC8 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 8), + TC5 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 5), + TC2 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 2), + TC6 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 6), + TC3 = load_chunk(Bookie1, CountPerList, ObjSize, 
IndexGenFun, Bucket, 3), + TC7 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 7), + TC10 = load_chunk(Bookie1, CountPerList, ObjSize, IndexGenFun, Bucket, 10), - {ok, Bookie2} = leveled_bookie:book_start(StartOpts1), + ct:log( + ?INFO, + "Load time per group ~w ~w ~w ~w ~w ~w ~w ~w ~w ~w ms", + lists:map( + fun(T) -> T div 1000 end, + [TC4, TC1, TC9, TC8, TC5, TC2, TC6, TC3, TC7, TC10]) + ), + TotalLoadTime = + (TC1 + TC2 + TC3 + TC4 + TC5 + TC6 + TC7 + TC8 + TC9 + TC10) div 1000, + ct:log(?INFO, "Total load time ~w ms", [TotalLoadTime]), + + {MT0, MP0, MB0} = memory_usage(), + + TotalHeadTime = + random_fetches(head, Bookie1, Bucket, KeyCount, HeadFetches), - {async, BucketFolder2} = - leveled_bookie:book_headfold(Bookie2, - ?RIAK_TAG, - {bucket_list, BucketList}, - FBAccT, - false, false, false), - {FoldTime2, BucketList2} = timer:tc(BucketFolder2, []), - true = BucketCount == sets:size(BucketList2), + {MT1, MP1, MB1} = memory_usage(), - io:format("Fold pre-close ~w ms post-close ~w ms~n", - [FoldTime1 div 1000, FoldTime2 div 1000]), + TotalGetTime = + random_fetches(get, Bookie1, Bucket, KeyCount, GetFetches), - true = FoldTime1 < 10 * FoldTime2, - %% The fold in-memory should be the same order of magnitude of response - %% time as the fold post-persistence + {MT2, MP2, MB2} = memory_usage(), - ok = leveled_bookie:book_destroy(Bookie2). 
+ QuerySize = max(10, IndexCount div 1000), + MiniQuerySize = max(1, IndexCount div 50000), + TotalQueryTime = + random_queries( + Bookie1, + Bucket, + 10, + IndexCount, + QuerySize, + IndexesReturned), + TotalMiniQueryTime = + random_queries( + Bookie1, + Bucket, + 10, + IndexCount, + MiniQuerySize, + IndexesReturned div 8), + {MT3, MP3, MB3} = memory_usage(), + + {FullFoldTime, SegFoldTime} = size_estimate_summary(Bookie1), + + {MT4, MP4, MB4} = memory_usage(), + + TotalUpdateTime = + rotate_chunk(Bookie1, <<"UpdBucket">>, KeyCount div 50, ObjSize), + + {MT5, MP5, MB5} = memory_usage(), + + DiskSpace = lists:nth(1, string:tokens(os:cmd("du -sh riakLoad"), "\t")), + ct:log(?INFO, "Disk space taken by test ~s", [DiskSpace]), + + MemoryUsage = erlang:memory(), + ct:log(?INFO, "Memory in use at end of test ~p", [MemoryUsage]), + + ProfileData = + {Bookie1, Bucket, KeyCount, ObjSize, IndexCount, IndexesReturned}, + lists:foreach( + fun(P) -> + ct:log(?INFO, "Profile of ~w", [P]), + P0 = + case P of + mini_query -> + {mini_query, MiniQuerySize}; + query -> + {query, QuerySize}; + head -> + {head, HeadFetches}; + get -> + {get, GetFetches}; + load -> + {load, IndexGenFun}; + P -> + P + end, + ProFun = profile_fun(P0, ProfileData), + profile_test(Bookie1, ProFun) + end, + ProfileList), + + {_Inker, _Pcl, SSTPids, _PClerk, CDBPids, _IClerk} = get_pids(Bookie1), + leveled_bookie:book_destroy(Bookie1), + + {KeyCount, ObjSize, PressMethod, + TotalLoadTime, + TotalHeadTime, TotalGetTime, + TotalQueryTime, TotalMiniQueryTime, FullFoldTime, SegFoldTime, + TotalUpdateTime, + DiskSpace, + {(MT0 + MT1 + MT2 + MT3 + MT4 + MT5) div 6000000, + (MP0 + MP1 + MP2 + MP3 + MP4 + MP5) div 6000000, + (MB0 + MB1 + MB2 + MB3 + MB4 + MB5) div 6000000}, + SSTPids, CDBPids}. 
+ + +profile_test(Bookie, ProfileFun) -> + {Inker, Pcl, SSTPids, PClerk, CDBPids, IClerk} = get_pids(Bookie), + TestPid = self(), + profile_app( + [TestPid, Bookie, Inker, IClerk, Pcl, PClerk] ++ SSTPids ++ CDBPids, + ProfileFun). + +get_pids(Bookie) -> + {ok, Inker, Pcl} = leveled_bookie:book_returnactors(Bookie), + SSTPids = leveled_penciller:pcl_getsstpids(Pcl), + PClerk = leveled_penciller:pcl_getclerkpid(Pcl), + CDBPids = leveled_inker:ink_getcdbpids(Inker), + IClerk = leveled_inker:ink_getclerkpid(Inker), + {Inker, Pcl, SSTPids, PClerk, CDBPids, IClerk}. + +output_result( + {KeyCount, ObjSize, PressMethod, + TotalLoadTime, + TotalHeadTime, TotalGetTime, + TotalQueryTime, TotalMiniQueryTime, TotalFullFoldTime, TotalSegFoldTime, + TotalUpdateTime, + DiskSpace, + {TotalMemoryMB, ProcessMemoryMB, BinaryMemoryMB}, + SSTPids, CDBPids} +) -> + %% TODO ct:pal not working? even with rebar3 ct --verbose? + io:format( + user, + "~n" + "Outputs from profiling with KeyCount ~w ObjSize ~w Compression ~w:~n" + "TotalLoadTime - ~w ms~n" + "TotalHeadTime - ~w ms~n" + "TotalGetTime - ~w ms~n" + "TotalQueryTime - ~w ms~n" + "TotalMiniQueryTime - ~w ms~n" + "TotalFullFoldTime - ~w ms~n" + "TotalAAEFoldTime - ~w ms~n" + "TotalUpdateTime - ~w ms~n" + "Disk space required for test - ~s~n" + "Average Memory usage for test - Total ~p Proc ~p Bin ~p MB~n" + "Closing count of SST Files - ~w~n" + "Closing count of CDB Files - ~w~n", + [KeyCount, ObjSize, PressMethod, + TotalLoadTime, TotalHeadTime, TotalGetTime, + TotalQueryTime, TotalMiniQueryTime, TotalFullFoldTime, TotalSegFoldTime, + TotalUpdateTime, + DiskSpace, + TotalMemoryMB, ProcessMemoryMB, BinaryMemoryMB, + length(SSTPids), length(CDBPids)] + ). + +memory_usage() -> + garbage_collect(), % GC the test process + MemoryUsage = erlang:memory(), + {element(2, lists:keyfind(total, 1, MemoryUsage)), + element(2, lists:keyfind(processes, 1, MemoryUsage)), + element(2, lists:keyfind(binary, 1, MemoryUsage))}. 
+ +profile_app(Pids, ProfiledFun) -> + + eprof:start(), + eprof:start_profiling(Pids), + + ProfiledFun(), + + eprof:stop_profiling(), + eprof:analyze(total), + eprof:stop(). + +size_estimate_summary(Bookie) -> + Loops = 10, + ct:log( + ?INFO, + "Size Estimate Tester (SET) started with Loops ~w", + [Loops] + ), + {{TotalGuessTime, TotalEstimateTime, TotalCountTime}, + {TotalEstimateVariance, TotalGuessVariance}} = + lists:foldl( + fun(_I, {{GT, ET, CT}, {AET, AGT}}) -> + {{GT0, ET0, CT0}, {AE0, AG0}} = size_estimate_tester(Bookie), + {{GT + GT0, ET + ET0, CT + CT0}, {AET + AE0, AGT + AG0}} + end, + {{0, 0, 0}, {0, 0}}, + lists:seq(1, Loops) + ), + ct:log( + ?INFO, + "SET: MeanGuess ~w ms MeanEstimate ~w ms MeanCount ~w ms", + [TotalGuessTime div 10000, + TotalEstimateTime div 10000, + TotalCountTime div 10000] + ), + ct:log( + ?INFO, + "Mean variance in Estimate ~w Guess ~w", + [TotalEstimateVariance div Loops, TotalGuessVariance div Loops] + ), + %% Assume that segment-list folds are 10 * as common as all folds + {TotalCountTime div 1000, (TotalGuessTime + TotalEstimateTime) div 1000}. + + +rotate_chunk(Bookie, Bucket, KeyCount, ObjSize) -> + ct:log( + ?INFO, + "Rotating an ObjList ~w - " + "time includes object generation", + [KeyCount]), + V1 = base64:encode(leveled_rand:rand_bytes(ObjSize)), + V2 = base64:encode(leveled_rand:rand_bytes(ObjSize)), + V3 = base64:encode(leveled_rand:rand_bytes(ObjSize)), + {TC, ok} = + timer:tc( + fun() -> + testutil:rotation_withnocheck( + Bookie, Bucket, KeyCount, V1, V2, V3) + end), + TC div 1000. + +load_chunk(Bookie, CountPerList, ObjSize, IndexGenFun, Bucket, Chunk) -> + ct:log(?INFO, "Generating and loading ObjList ~w", [Chunk]), + ObjList = + generate_chunk(CountPerList, ObjSize, IndexGenFun, Bucket, Chunk), + {TC, ok} = timer:tc(fun() -> testutil:riakload(Bookie, ObjList) end), + garbage_collect(), + timer:sleep(2000), + TC. 
+ +generate_chunk(CountPerList, ObjSize, IndexGenFun, Bucket, Chunk) -> + testutil:generate_objects( + CountPerList, + {fixed_binary, (Chunk - 1) * CountPerList + 1}, [], + base64:encode(leveled_rand:rand_bytes(ObjSize)), + IndexGenFun(Chunk), + Bucket + ). + +size_estimate_tester(Bookie) -> + %% Data size test - calculate data size, then estimate data size + {CountTS, Count} = counter(Bookie, full), + {CountTSEstimate, CountEstimate} = counter(Bookie, estimate), + {CountTSGuess, CountGuess} = counter(Bookie, guess), + {GuessTolerance, EstimateTolerance} = + case Count of + C when C < 500000 -> + {0.20, 0.15}; + C when C < 1000000 -> + {0.12, 0.1}; + C when C < 2000000 -> + {0.1, 0.08}; + _C -> + {0.08, 0.05} + end, + + true = + ((CountGuess / Count) > (1.0 - GuessTolerance)) + and ((CountGuess / Count) < (1.0 + GuessTolerance)), + true = + ((CountEstimate / Count) > (1.0 - EstimateTolerance)) + and ((CountEstimate / Count) < (1.0 + EstimateTolerance)), + {{CountTSGuess, CountTSEstimate, CountTS}, + {abs(CountEstimate - Count), abs(CountGuess - Count)}}. + +counter(Bookie, full) -> + {async, DataSizeCounter} = + leveled_bookie:book_headfold( + Bookie, + ?RIAK_TAG, + {fun(_B, _K, _V, AccC) -> AccC + 1 end, 0}, + false, + true, + false + ), + timer:tc(DataSizeCounter); +counter(Bookie, guess) -> + TictacTreeSize = 1024 * 1024, + RandomSegment = rand:uniform(TictacTreeSize - 32) - 1, + {async, DataSizeGuesser} = + leveled_bookie:book_headfold( + Bookie, + ?RIAK_TAG, + {fun(_B, _K, _V, AccC) -> AccC + 1024 end, 0}, + false, + true, + lists:seq(RandomSegment, RandomSegment + 31) + ), + timer:tc(DataSizeGuesser); +counter(Bookie, estimate) -> + TictacTreeSize = 1024 * 1024, + RandomSegment = rand:uniform(TictacTreeSize - 128) - 1, + {async, DataSizeEstimater} = + leveled_bookie:book_headfold( + Bookie, + ?RIAK_TAG, + {fun(_B, _K, _V, AccC) -> AccC + 256 end, 0}, + false, + true, + lists:seq(RandomSegment, RandomSegment + 127) + ), + timer:tc(DataSizeEstimater). 
+ + +random_fetches(FetchType, Bookie, Bucket, ObjCount, Fetches) -> + KeysToFetch = + lists:map( + fun(I) -> + Twenty = ObjCount div 5, + case I rem 5 of + 1 -> + testutil:fixed_bin_key( + Twenty + leveled_rand:uniform(ObjCount - Twenty)); + _ -> + testutil:fixed_bin_key(leveled_rand:uniform(Twenty)) + end + end, + lists:seq(1, Fetches) + ), + {TC, ok} = + timer:tc( + fun() -> + lists:foreach( + fun(K) -> + {ok, _} = + case FetchType of + get -> + testutil:book_riakget(Bookie, Bucket, K); + head -> + testutil:book_riakhead(Bookie, Bucket, K) + end + end, + KeysToFetch + ) + end + ), + ct:log( + ?INFO, + "Fetch of type ~w ~w keys in ~w ms", + [FetchType, Fetches, TC div 1000] + ), + TC div 1000. + +random_queries(Bookie, Bucket, IDs, IdxCnt, MaxRange, IndexesReturned) -> + QueryFun = + fun() -> + ID = leveled_rand:uniform(IDs), + BinIndex = + list_to_binary("binary" ++ integer_to_list(ID) ++ "_bin"), + Twenty = IdxCnt div 5, + RI = leveled_rand:uniform(MaxRange), + [Start, End] = + case RI of + RI when RI < (MaxRange div 5) -> + R0 = leveled_rand:uniform(IdxCnt - (Twenty + RI)), + [R0 + Twenty, R0 + Twenty + RI]; + _ -> + R0 = leveled_rand:uniform(Twenty - RI), + [R0, R0 + RI] + end, + FoldKeysFun = fun(_B, _K, Cnt) -> Cnt + 1 end, + {async, R} = + leveled_bookie:book_indexfold( + Bookie, + {Bucket, <<>>}, + {FoldKeysFun, 0}, + {BinIndex, <>, <>}, + {true, undefined}), + R() + end, + + {TC, {QC, EF}} = + timer:tc(fun() -> run_queries(QueryFun, 0, 0, IndexesReturned) end), + ct:log( + ?INFO, + "Fetch of ~w index entries in ~w queries took ~w ms", + [EF, QC, TC div 1000] + ), + TC div 1000. + + +run_queries(_QueryFun, QueryCount, EntriesFound, TargetEntries) + when EntriesFound >= TargetEntries -> + {QueryCount, EntriesFound}; +run_queries(QueryFun, QueryCount, EntriesFound, TargetEntries) -> + Matches = QueryFun(), + run_queries( + QueryFun, QueryCount + 1, EntriesFound + Matches, TargetEntries). 
+ +profile_fun(false, _ProfileData) -> + fun() -> ok end; +profile_fun( + {mini_query, QuerySize}, + {Bookie, Bucket, _KeyCount, _ObjSize, IndexCount, IndexesReturned}) -> + fun() -> + random_queries( + Bookie, Bucket, 10, IndexCount, QuerySize, IndexesReturned div 8) + end; +profile_fun( + {query, QuerySize}, + {Bookie, Bucket, _KeyCount, _ObjSize, IndexCount, IndexesReturned}) -> + fun() -> + random_queries( + Bookie, Bucket, 10, IndexCount, QuerySize, IndexesReturned) + end; +profile_fun( + {head, HeadFetches}, + {Bookie, Bucket, KeyCount, _ObjSize, _IndexCount, _IndexesReturned}) -> + fun() -> + random_fetches(head, Bookie, Bucket, KeyCount, HeadFetches) + end; +profile_fun( + {get, GetFetches}, + {Bookie, Bucket, KeyCount, _ObjSize, _IndexCount, _IndexesReturned}) -> + fun() -> + random_fetches(get, Bookie, Bucket, KeyCount, GetFetches) + end; +profile_fun( + {load, IndexGenFun}, + {Bookie, Bucket, KeyCount, ObjSize, _IndexCount, _IndexesReturned}) -> + ObjList11 = + generate_chunk(KeyCount div 10, ObjSize, IndexGenFun, Bucket, 11), + fun() -> + testutil:riakload(Bookie, ObjList11) + end; +profile_fun( + update, + {Bookie, _Bucket, KeyCount, ObjSize, _IndexCount, _IndexesReturned}) -> + fun() -> + rotate_chunk(Bookie, <<"ProfileB">>, KeyCount div 50, ObjSize) + end; +profile_fun( + CounterFold, + {Bookie, _Bucket, _KeyCount, _ObjSize, _IndexCount, _IndexesReturned}) -> + fun() -> + lists:foreach( + fun(_I) -> + _ = counter(Bookie, CounterFold) + end, + lists:seq(1, 10) + ) + end. 
diff --git a/test/end_to_end/testutil.erl b/test/end_to_end/testutil.erl index 84774fa..f8d786a 100644 --- a/test/end_to_end/testutil.erl +++ b/test/end_to_end/testutil.erl @@ -44,11 +44,13 @@ update_some_objects/3, delete_some_objects/3, put_indexed_objects/3, + put_indexed_objects/4, put_altered_indexed_objects/3, put_altered_indexed_objects/4, put_altered_indexed_objects/5, check_indexed_objects/4, rotating_object_check/3, + rotation_withnocheck/6, corrupt_journal/5, restore_file/2, restore_topending/2, @@ -754,6 +756,9 @@ check_indexed_objects(Book, B, KSpecL, V) -> put_indexed_objects(Book, Bucket, Count) -> V = get_compressiblevalue(), + put_indexed_objects(Book, Bucket, Count, V). + +put_indexed_objects(Book, Bucket, Count, V) -> IndexGen = get_randomindexes_generator(1), SW = os:timestamp(), ObjL1 = @@ -837,6 +842,12 @@ rotating_object_check(RootPath, B, NumberOfObjects) -> ok = leveled_bookie:book_close(Book2), ok. +rotation_withnocheck(Book1, B, NumberOfObjects, V1, V2, V3) -> + {KSpcL1, _V1} = put_indexed_objects(Book1, B, NumberOfObjects, V1), + {KSpcL2, _V2} = put_altered_indexed_objects(Book1, B, KSpcL1, true, V2), + {_KSpcL3, _V3} = put_altered_indexed_objects(Book1, B, KSpcL2, true, V3), + ok. + corrupt_journal(RootPath, FileName, Corruptions, BasePosition, GapSize) -> OriginalPath = RootPath ++ "/journal/journal_files/" ++ FileName, BackupPath = RootPath ++ "/journal/journal_files/" ++