riak_test/tests/ensemble_ring_changes.erl

159 lines
6.0 KiB
Erlang
Raw Normal View History

%% -------------------------------------------------------------------
%%
%% Copyright (c) 2013-2014 Basho Technologies, Inc.
%%
%% This file is provided to you under the Apache License,
%% Version 2.0 (the "License"); you may not use this file
%% except in compliance with the License. You may obtain
%% a copy of the License at
%%
%% http://www.apache.org/licenses/LICENSE-2.0
%%
%% Unless required by applicable law or agreed to in writing,
%% software distributed under the License is distributed on an
%% "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
%% KIND, either express or implied. See the License for the
%% specific language governing permissions and limitations
%% under the License.
%%
%% -------------------------------------------------------------------
-module(ensemble_ring_changes).
-export([confirm/0]).
-include_lib("eunit/include/eunit.hrl").
-define(NVAL, 3).
-define(RING_SIZE, 16).
config() ->
[{riak_core, [{default_bucket_props,
[
{n_val, 5},
{allow_mult, true},
{dvv_enabled, true}
]},
{vnode_management_timer, 1000},
{ring_creation_size, ?RING_SIZE},
{enable_consensus, true},
{target_n_val, 8}]}].
confirm() ->
Config = config(),
{ok, Joined, NotJoined} = build_initial_cluster(Config),
Node = hd(Joined),
Bucket = {<<"strong">>, <<"test">>},
Key = <<"test-key">>,
Val = <<"test-val">>,
create_strong_bucket_type(Node, ?NVAL),
{ok, PL} = get_preflist(Node, Bucket, Key, ?NVAL),
?assertEqual(?NVAL, length(PL)),
lager:info("PREFERENCE LIST: ~n ~p", [PL]),
{{Idx0, _Node0}, primary} = hd(PL),
Ensemble = {kv, Idx0, 3},
lager:info("Ensemble = ~p", [Ensemble]),
PBC = rt:pbc(Node),
{ok, Obj} = initial_write(PBC, Bucket, Key, Val),
{ok, _Obj2} = assert_update(PBC, Bucket, Key, Obj, <<"test-val2">>),
Replacements = expand_cluster(Joined, NotJoined),
{_Vsn, [View]} = rpc:call(Node, riak_ensemble_manager, get_views, [Ensemble]),
{_, F1} = hd(lists:reverse(View)),
{_, F2} = hd(tl(lists:reverse(View))),
lager:info("F1= ~p, F2=~p", [F1, F2]),
read_modify_write(PBC, Bucket, Key, <<"test-val2">>, <<"test-val3">>),
[R1, R2] = Replacements,
replace_node(Node, F1, R1),
read_modify_write(PBC, Bucket, Key, <<"test-val3">>, <<"test-val4">>),
force_replace_node(Node, F2, R2),
read_modify_write(PBC, Bucket, Key, <<"test-val4">>, <<"test-val5">>),
pass.
read_modify_write(PBC, Bucket, Key, Expected, NewVal) ->
Obj = rt:pbc_read(PBC, Bucket, Key),
?assertEqual(Expected, riakc_obj:get_value(Obj)),
assert_update(PBC, Bucket, Key, Obj, NewVal).
assert_update(PBC, Bucket, Key, Obj, NewVal) ->
ok = update(PBC, Obj, NewVal),
Obj2 = rt:pbc_read(PBC, Bucket, Key),
?assertEqual(NewVal, riakc_obj:get_value(Obj2)),
{ok, Obj2}.
update(PBC, Obj0, NewVal) ->
lager:info("Updating Key with ~p", [NewVal]),
Obj = riakc_obj:update_value(Obj0, NewVal),
riakc_pb_socket:put(PBC, Obj).
initial_write(PBC, Bucket, Key, Val) ->
%% maps to a riak_ensemble put_once since there is no vclock
lager:info("Writing a consistent key"),
ok = rt:pbc_write(PBC, Bucket, Key, Val),
lager:info("Read key to verify it exists"),
Obj = rt:pbc_read(PBC, Bucket, Key),
?assertEqual(Val, riakc_obj:get_value(Obj)),
{ok, Obj}.
get_preflist(Node, Bucket, Key, NVal) ->
DocIdx = rpc:call(Node, riak_core_util, chash_std_keyfun, [{Bucket, Key}]),
PL = rpc:call(Node, riak_core_apl, get_primary_apl, [DocIdx, NVal, riak_kv]),
{ok, PL}.
create_strong_bucket_type(Node, NVal) ->
lager:info("Creating/activating 'strong' bucket type"),
rt:create_and_activate_bucket_type(Node, <<"strong">>,
[{consistent, true}, {n_val, NVal}]),
ensemble_util:wait_until_stable(Node, NVal).
replace_node(Node, OldNode, NewNode) ->
lager:info("Replacing ~p with ~p", [OldNode, NewNode]),
Nodes = [OldNode, NewNode],
rt:staged_join(NewNode, Node),
?assertEqual(ok, rt:wait_until_ring_converged(Nodes)),
ok = rpc:call(Node, riak_core_claimant, replace, Nodes),
rt:plan_and_commit(Node),
rt:try_nodes_ready(Nodes, 3, 500),
?assertEqual(ok, rt:wait_until_nodes_ready(Nodes)).
force_replace_node(Node, OldNode, NewNode) ->
lager:info("Force Replacing ~p with ~p", [OldNode, NewNode]),
Nodes = [OldNode, NewNode],
rt:staged_join(NewNode, Node),
?assertEqual(ok, rt:wait_until_ring_converged(Nodes)),
ok = rpc:call(Node, riak_core_claimant, force_replace, Nodes),
rt:plan_and_commit(Node),
rt:try_nodes_ready(Nodes, 3, 500),
?assertEqual(ok, rt:wait_until_nodes_ready(Nodes)).
expand_cluster(OldNodes, NewNodes0) ->
%% Always have 2 replacement nodes
{NewNodes, Replacements} = lists:split(length(NewNodes0)-2, NewNodes0),
lager:info("Expanding Cluster from ~p to ~p nodes", [length(OldNodes),
length(OldNodes) + length(NewNodes)]),
PNode = hd(OldNodes),
Nodes = OldNodes ++ NewNodes,
[rt:staged_join(Node, PNode) || Node <- NewNodes],
rt:plan_and_commit(PNode),
rt:try_nodes_ready(Nodes, 3, 500),
?assertEqual(ok, rt:wait_until_nodes_ready(Nodes)),
%% Ensure each node owns a portion of the ring
rt:wait_until_nodes_agree_about_ownership(Nodes),
?assertEqual(ok, rt:wait_until_no_pending_changes(Nodes)),
ensemble_util:wait_until_cluster(Nodes),
ensemble_util:wait_for_membership(PNode),
ensemble_util:wait_until_stable(PNode, ?NVAL),
Replacements.
build_initial_cluster(Config) ->
TotalNodes = 8,
InitialNodes = 3,
Nodes = rt:deploy_nodes(TotalNodes, Config),
Node = hd(Nodes),
{ToJoin, NotToJoin} = lists:split(InitialNodes, Nodes),
rt:join_cluster(ToJoin),
ensemble_util:wait_until_cluster(ToJoin),
ensemble_util:wait_for_membership(Node),
ensemble_util:wait_until_stable(Node, InitialNodes),
vnode_util:load(Nodes),
ensemble_util:wait_until_stable(Node, InitialNodes),
{ok, ToJoin, NotToJoin}.