-
Notifications
You must be signed in to change notification settings - Fork 392
/
riak_core_status.erl
176 lines (157 loc) · 6.54 KB
/
riak_core_status.erl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
%% -------------------------------------------------------------------
%%
%% Riak: A lightweight, decentralized key-value store.
%%
%% Copyright (c) 2007-2011 Basho Technologies, Inc. All Rights Reserved.
%%
%% This file is provided to you under the Apache License,
%% Version 2.0 (the "License"); you may not use this file
%% except in compliance with the License. You may obtain
%% a copy of the License at
%%
%% http://www.apache.org/licenses/LICENSE-2.0
%%
%% Unless required by applicable law or agreed to in writing,
%% software distributed under the License is distributed on an
%% "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
%% KIND, either express or implied. See the License for the
%% specific language governing permissions and limitations
%% under the License.
%%
%% -------------------------------------------------------------------
-module(riak_core_status).
-export([ringready/0,
all_active_transfers/0,
transfers/0,
ring_status/0]).
-spec(ringready() -> {ok, [atom()]} | {error, any()}).
ringready() ->
case get_rings() of
{[], Rings} ->
{N1,R1}=hd(Rings),
case rings_match(hash_ring(R1), tl(Rings)) of
true ->
Nodes = [N || {N,_} <- Rings],
{ok, Nodes};
{false, N2} ->
{error, {different_owners, N1, N2}}
end;
{Down, _Rings} ->
{error, {nodes_down, Down}}
end.
-spec(transfers() -> {[atom()], [{waiting_to_handoff, atom(), integer()} |
{stopped, atom(), integer()}]}).
transfers() ->
{Down, Rings} = get_rings(),
%% Work out which vnodes are running and which partitions they claim
F = fun({N,R}, Acc) ->
{_Pri, Sec, Stopped} = partitions(N, R),
Acc1 = case Sec of
[] ->
[];
_ ->
[{waiting_to_handoff, N, length(Sec)}]
end,
case Stopped of
[] ->
Acc1 ++ Acc;
_ ->
Acc1 ++ [{stopped, N, length(Stopped)} | Acc]
end
end,
{Down, lists:foldl(F, [], Rings)}.
%% @doc Produce status for all active transfers in the cluster.
-spec all_active_transfers() -> {Xfers::list(), Down::list()}.
all_active_transfers() ->
{Xfers, Down} =
riak_core_util:rpc_every_member(riak_core_handoff_manager,
status,
[{direction, outbound}],
5000),
{Xfers, Down}.
ring_status() ->
%% Determine which nodes are reachable as well as what vnode modules
%% are running on each node.
{ok, Ring} = riak_core_ring_manager:get_raw_ring(),
{AllMods, Down} =
riak_core_util:rpc_every_member_ann(riak_core, vnode_modules, [], 1000),
%% Check if the claimant is running and if it believes the ring is ready
Claimant = riak_core_ring:claimant(Ring),
case rpc:call(Claimant, riak_core_ring, ring_ready, [], 5000) of
{badrpc, _} ->
Down2 = lists:usort([Claimant|Down]),
RingReady = undefined;
RingReady ->
Down2 = Down,
RingReady = RingReady
end,
%% Get the list of pending ownership changes
Changes = riak_core_ring:pending_changes(Ring),
%% Group pending changes by (Owner, NextOwner)
Merged = lists:foldl(
fun({Idx, Owner, NextOwner, Mods, Status}, Acc) ->
orddict:append({Owner, NextOwner},
{Idx, Mods, Status},
Acc)
end, [], Changes),
%% For each pending transfer, determine which vnode modules have completed
%% handoff and which we are still waiting on.
%% Final result is of the form:
%% [{Owner, NextOwner}, [{Index, WaitingMods, CompletedMods, Status}]]
TransferStatus =
orddict:map(
fun({Owner, _}, Transfers) ->
case orddict:find(Owner, AllMods) of
error ->
[{Idx, down, Mods, Status}
|| {Idx, Mods, Status} <- Transfers];
{ok, OwnerMods} ->
NodeMods = [Mod || {_App, Mod} <- OwnerMods],
[{Idx, NodeMods -- Mods, Mods, Status}
|| {Idx, Mods, Status} <- Transfers]
end
end, Merged),
MarkedDown = riak_core_ring:down_members(Ring),
{Claimant, RingReady, Down2, MarkedDown, TransferStatus}.
%% ===================================================================
%% Internal functions
%% ===================================================================
%% Retrieve the rings for all other nodes by RPC
get_rings() ->
{RawRings, Down} = riak_core_util:rpc_every_member(
riak_core_ring_manager, get_my_ring, [], 30000),
RawRings2 = [riak_core_ring:upgrade(R) || {ok, R} <- RawRings],
Rings = orddict:from_list([{riak_core_ring:owner_node(R), R} || R <- RawRings2]),
{lists:sort(Down), Rings}.
%% Produce a hash of the 'chash' portion of the ring
hash_ring(R) ->
erlang:phash2(riak_core_ring:all_owners(R)).
%% Check if all rings match given a hash and a list of [{N,P}] to check
rings_match(_, []) ->
true;
rings_match(R1hash, [{N2, R2} | Rest]) ->
case hash_ring(R2) of
R1hash ->
rings_match(R1hash, Rest);
_ ->
{false, N2}
end.
%% Get a list of active partition numbers - regardless of vnode type
active_partitions(Node) ->
VNodes = gen_server:call({riak_core_vnode_manager, Node}, all_vnodes, 30000),
lists:foldl(fun({_, P, _}, Ps) ->
ordsets:add_element(P, Ps)
end, [], VNodes).
%% Return a list of active primary partitions, active secondary partitions (to be handed off)
%% and stopped partitions that should be started
partitions(Node, Ring) ->
Owners = riak_core_ring:all_owners(Ring),
Owned = ordsets:from_list(owned_partitions(Owners, Node)),
Active = ordsets:from_list(active_partitions(Node)),
Stopped = ordsets:subtract(Owned, Active),
Secondary = ordsets:subtract(Active, Owned),
Primary = ordsets:subtract(Active, Secondary),
{Primary, Secondary, Stopped}.
%% Return the list of partitions owned by a node
owned_partitions(Owners, Node) ->
[P || {P, Owner} <- Owners, Owner =:= Node].