Permalink
Show file tree
Hide file tree
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Browse files
Merge remote-tracking branch 'custodian/master' into custodian-merge
- Loading branch information
Showing
9 changed files
with
775 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,8 @@ | ||
Custodian is responsible for the data stored in Cloudant databases. | ||
|
||
Custodian scans the "dbs" database, which details the location of | ||
every shard of every database and ensures that operators are aware of | ||
any shard that is under-replicated (has fewer than N copies). | ||
|
||
Custodian accounts for data in transit (as indicated by the | ||
mem3.redirects section) as well as nodes not recently known to be up. |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,19 @@ | ||
% Copyright 2013 Cloudant. All rights reserved. | ||
|
||
% Application resource specification for the custodian OTP application.
{application, custodian, | ||
[ | ||
{description, "in your cluster, looking after your stuff"}, | ||
% presumably replaced with a git-derived version by the build tool -- TODO confirm
{vsn, git}, | ||
% NOTE(review): custodian_db_checker registers itself locally under its
% module name, yet no registered names are declared here -- confirm
% whether this list should include it (and any other registered processes).
{registered, []}, | ||
% Applications that must be started before custodian.
{applications, [ | ||
kernel, | ||
stdlib, | ||
couch_log, | ||
config, | ||
couch_event, | ||
couch, | ||
mem3 | ||
]}, | ||
% Application callback module and the argument passed to its start/2.
{mod, { custodian_app, []}}, | ||
{env, []} | ||
]}. |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,11 @@ | ||
% Copyright 2013 Cloudant. All rights reserved. | ||
|
||
%% @doc Convenience API for the custodian application. Both functions are
%% thin delegations to `custodian_util'.
-module(custodian).

-export([
    report/0,
    summary/0
]).

%% @doc Returns whatever `custodian_util:report/0' produces.
report() ->
    custodian_util:report().

%% @doc Returns whatever `custodian_util:summary/0' produces.
summary() ->
    custodian_util:summary().
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
% Copyright 2013 Cloudant. All rights reserved. | ||
|
||
% Document id of the custodian design document.
-define(CUSTODIAN_ID, <<"_design/custodian">>). | ||
|
||
% JavaScript source of a document validation function, kept as a binary.
% As written, the function:
%   * accepts design documents and deleted documents without further checks;
%   * rejects documents lacking a by_node or by_range member;
%   * requires every range listed under by_node[node] to exist in by_range
%     and to list that node;
%   * requires every node listed under by_range[range] to exist in by_node
%     and to list that range.
% Violations are reported by throwing {forbidden: Message}.
-define(CUSTODIAN_VALIDATION, | ||
<<"function(newDoc, oldDoc) { | ||
var i, range, node; | ||
if(newDoc['_id'].substring(0, 8) === \"_design/\") return; | ||
if(newDoc['_deleted'] === true) return; | ||
if (!newDoc.by_node) { | ||
throw({forbidden: \"by_node is mandatory\"}); | ||
} | ||
if (!newDoc.by_range) { | ||
throw({forbidden: \"by_range is mandatory\"}); | ||
} | ||
for (node in newDoc.by_node) { | ||
for (i in newDoc.by_node[node]) { | ||
range = newDoc.by_node[node][i]; | ||
if(!newDoc.by_range[range]) { | ||
throw({forbidden: \"by_range for \" + range + \" is missing\"}); | ||
} | ||
if(newDoc.by_range[range].indexOf(node) === -1) { | ||
throw({forbidden : \"by_range for \" + range + \" is missing \" + node}); | ||
} | ||
} | ||
} | ||
for (range in newDoc.by_range) { | ||
for (i in newDoc.by_range[range]) { | ||
node = newDoc.by_range[range][i]; | ||
if(!newDoc.by_node[node]) { | ||
throw({forbidden: \"by_node for \" + node + \" is missing\"}); | ||
} | ||
if (newDoc.by_node[node].indexOf(range) === -1) { | ||
throw({forbidden: \"by_node for \" + node + \" is missing \" + range}); | ||
} | ||
} | ||
} | ||
} | ||
">>). |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,18 @@ | ||
% Copyright 2013 Cloudant. All rights reserved. | ||
|
||
%% @doc OTP application callback module for custodian.
-module(custodian_app).
-behaviour(application).

-export([
    start/2,
    stop/1
]).

%% @doc Application start callback: hands control to
%% `custodian_sup:start_link/0' and returns its result unchanged.
%% Both arguments are ignored.
start(_Type, _Args) ->
    custodian_sup:start_link().

%% @doc Application stop callback: nothing to clean up, always `ok'.
stop(_AppState) ->
    ok.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,155 @@ | ||
% Copyright 2013 Cloudant. All rights reserved. | ||
|
||
-module(custodian_db_checker). | ||
-behaviour(gen_server). | ||
-vsn(1). | ||
|
||
|
||
-export([start_link/0]). | ||
|
||
|
||
-export([ | ||
init/1, | ||
terminate/2, | ||
handle_call/3, | ||
handle_cast/2, | ||
handle_info/2, | ||
code_change/3 | ||
]). | ||
|
||
-export([ | ||
check_dbs/0 | ||
]). | ||
|
||
|
||
%% gen_server state.
%%   checker - pid of the linked process currently running check_dbs/0,
%%             or `undefined' when no check is in progress.
-record(st, {checker = undefined}).
|
||
|
||
%% @doc Starts the checker as a gen_server registered locally under this
%% module's name, linked to the caller.
start_link() ->
    ServerName = {local, ?MODULE},
    gen_server:start_link(ServerName, ?MODULE, [], []).
|
||
|
||
%% @doc gen_server init callback.
%%
%% Traps exits so the termination of the linked checker process arrives as
%% an 'EXIT' message, subscribes to nodeup/nodedown notifications, and
%% launches the first check.
init(_Args) ->
    process_flag(trap_exit, true),
    net_kernel:monitor_nodes(true),
    InitialState = restart_checker(#st{}),
    {ok, InitialState}.
|
||
|
||
%% @doc gen_server terminate callback: passes the current checker (a pid or
%% `undefined') to `couch_util:shutdown_sync/1' before returning `ok'.
terminate(_Reason, St) ->
    Checker = St#st.checker,
    couch_util:shutdown_sync(Checker),
    ok.
|
||
|
||
%% @doc No synchronous calls are supported: any call stops the server, and
%% the same `{invalid_call, Msg}' term is used both as the reply and as the
%% stop reason.
handle_call(Msg, _From, St) ->
    Rejection = {invalid_call, Msg},
    {stop, Rejection, Rejection, St}.
|
||
|
||
%% @doc Handles asynchronous requests.
%%
%% `refresh' asks for a check to be running (a no-op if one already is);
%% any other cast stops the server with `{invalid_cast, Msg}'.
handle_cast(refresh, St) ->
    NewSt = restart_checker(St),
    {noreply, NewSt};
handle_cast(Unexpected, St) ->
    {stop, {invalid_cast, Unexpected}, St}.
|
||
|
||
%% @doc Handles raw messages.
%%
%% - `{nodeup, _}' / `{nodedown, _}': make sure a check is running.
%% - 'EXIT' from the current checker with reason `normal': the check
%%   finished, so the checker slot is cleared.
%% - 'EXIT' from the current checker with any other reason: the failure is
%%   logged and a new checker is started straight away.
%%   NOTE(review): there is no delay before the respawn -- confirm that a
%%   persistently failing check cannot spin.
%% - Anything else stops the server with `{invalid_info, Msg}'.
handle_info({NodeEvent, _Node}, St) when NodeEvent =:= nodeup; NodeEvent =:= nodedown ->
    {noreply, restart_checker(St)};
handle_info({'EXIT', Checker, Reason}, #st{checker = Checker} = St) ->
    Cleared = St#st{checker = undefined},
    case Reason of
        normal ->
            {noreply, Cleared};
        _Abnormal ->
            couch_log:notice("custodian db checker died ~p", [Reason]),
            {noreply, restart_checker(Cleared)}
    end;
handle_info(Unexpected, St) ->
    {stop, {invalid_info, Unexpected}, St}.
|
||
|
||
%% @doc gen_server code_change callback: the state is carried over unchanged.
code_change(_FromVsn, State, _Extra) ->
    {ok, State}.
|
||
|
||
%% Ensures a checker process exists. Despite the name, a checker that is
%% already running is left alone; a new linked process running check_dbs/0
%% is spawned only when the slot is `undefined'.
restart_checker(#st{checker = Running} = St) when is_pid(Running) ->
    St;
restart_checker(#st{checker = undefined} = St) ->
    St#st{checker = spawn_link(fun ?MODULE:check_dbs/0)}.
|
||
|
||
%% @doc Body of the checker process.
%%
%% Obtains the dbs database handle via `custodian_util:ensure_dbs_exists/0',
%% then checks every database named by get_dbs/0, in order. Each missing
%% one raises its own alert inside check_db/2; when none are missing the
%% alert is cleared. The dbs database handle is always closed afterwards.
check_dbs() ->
    {ok, DbsDb} = custodian_util:ensure_dbs_exists(),
    try
        %% Every database is checked (no short-circuit) so that each missing
        %% one gets its alert.
        Outcomes = [
            case check_db(DbsDb, DbName) of
                ok -> ok;
                missing -> missing
            end
         || DbName <- get_dbs()
        ],
        case lists:member(missing, Outcomes) of
            false -> clear_missing_dbs_alert();
            true -> ok
        end
    after
        couch_db:close(DbsDb)
    end.
|
||
|
||
%% Looks up the document whose id is `DbName' in the dbs database.
%% Returns `ok' when `couch_db:open_doc/3' yields `{ok, _}'. Any other
%% result, or any exception raised inside the try body, sends the
%% missing-database alert and returns `missing'.
check_db(DbsDb, DbName) when is_binary(DbName) ->
    try
        case couch_db:open_doc(DbsDb, DbName, []) of
            {ok, _Doc} -> ok;
            _NotFound -> flag_missing(DbName)
        end
    catch
        _Class:_Error -> flag_missing(DbName)
    end.

%% Sends the alert for `DbName' and yields the `missing' marker.
flag_missing(DbName) ->
    send_missing_db_alert(DbName),
    missing.
|
||
|
||
%% Names (as binaries) of the system databases to check: the users database
%% followed by the stats database, if one is configured.
get_dbs() ->
    get_users_db() ++ get_stats_db().
|
||
|
||
%% Single-element list holding the authentication database name, read from
%% the "couch_httpd_auth" / "authentication_db" config key with "users" as
%% the fallback.
get_users_db() ->
    Configured = config:get("couch_httpd_auth", "authentication_db", "users"),
    NameBin = list_to_binary(Configured),
    [NameBin].
|
||
|
||
%% Zero- or one-element list holding the stats database name taken from the
%% `stats_db' environment key of the `ioq' application. A binary is used as
%% is, a list is converted to a binary, and anything else (including an
%% unset key) yields the empty list.
get_stats_db() ->
    stats_db_names(application:get_env(ioq, stats_db)).

stats_db_names({ok, Name}) when is_binary(Name) ->
    [Name];
stats_db_names({ok, Name}) when is_list(Name) ->
    [iolist_to_binary(Name)];
stats_db_names(_UnsetOrOther) ->
    [].
|
||
|
||
%% Logs that the system database `DbName' (a binary) is missing and raises
%% a critical event for the `custodian-missing-db-check' check through the
%% `send-sensu-event' command. Returns the output of `os:cmd/1'.
%%
%% The message is handed to the shell as a single-quoted word. Database
%% names may legitimately contain `$', `(' and `)', which the shell would
%% expand inside double quotes (e.g. a name containing "$(...)" would run a
%% command), so the text must not be interpolated unescaped.
send_missing_db_alert(DbName) ->
    couch_log:notice("Missing system database ~s", [DbName]),
    Output = "Missing system database " ++ binary_to_list(DbName),
    Command = [
        "send-sensu-event --standalone --critical",
        " --output=",
        shell_quote(Output),
        " --handler=default custodian-missing-db-check"
    ],
    os:cmd(lists:concat(Command)).

%% Wraps `Str' in single quotes for a POSIX shell. Each embedded single
%% quote is rewritten as '\'' (close quote, escaped quote, reopen quote).
shell_quote(Str) ->
    Escaped = lists:flatmap(
        fun
            ($') -> "'\\''";
            (Ch) -> [Ch]
        end,
        Str
    ),
    "'" ++ Escaped ++ "'".
|
||
%% Logs that every system database exists and resolves the
%% `custodian-missing-db-check' check by sending an OK event through the
%% `send-sensu-event' command. Returns the output of `os:cmd/1'.
clear_missing_dbs_alert() ->
    couch_log:notice("All system databases exist.", []),
    %% Adjacent string literals are joined at compile time.
    os:cmd(
        "send-sensu-event --standalone --ok"
        " --output=\"All system databases exist\""
        " --handler=default custodian-missing-db-check"
    ).
Oops, something went wrong.