emqx/apps/emqx_machine/src/emqx_machine_boot.erl

255 lines
8.4 KiB
Erlang

%%--------------------------------------------------------------------
%% Copyright (c) 2021-2023 EMQ Technologies Co., Ltd. All Rights Reserved.
%%
%% Licensed under the Apache License, Version 2.0 (the "License");
%% you may not use this file except in compliance with the License.
%% You may obtain a copy of the License at
%%
%% http://www.apache.org/licenses/LICENSE-2.0
%%
%% Unless required by applicable law or agreed to in writing, software
%% distributed under the License is distributed on an "AS IS" BASIS,
%% WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
%% See the License for the specific language governing permissions and
%% limitations under the License.
%%--------------------------------------------------------------------
-module(emqx_machine_boot).
-include_lib("emqx/include/logger.hrl").
-include_lib("snabbkaffe/include/snabbkaffe.hrl").
-export([post_boot/0]).
-export([stop_apps/0, ensure_apps_started/0]).
-export([sorted_reboot_apps/0]).
-export([start_autocluster/0]).
-export([stop_port_apps/0]).
-dialyzer({no_match, [basic_reboot_apps/0]}).
-ifdef(TEST).
-export([sorted_reboot_apps/1, reboot_apps/0]).
-endif.
%% These apps are always (re)started by emqx_machine:
-define(BASIC_REBOOT_APPS, [gproc, esockd, ranch, cowboy, emqx]).
%% If any of these applications crash, the entire EMQX node shuts down:
-define(BASIC_PERMANENT_APPS, [mria, ekka, esockd, emqx]).
%% These apps are optional, they may or may not be present in the
%% release, depending on the build flags:
-define(OPTIONAL_APPS, [bcrypt, observer]).
post_boot() ->
ok = ensure_apps_started(),
ok = print_vsn(),
ok = start_autocluster(),
ignore.
-ifdef(TEST).
print_vsn() -> ok.
% TEST
-else.
print_vsn() ->
?ULOG("~ts ~ts is running now!~n", [emqx_app:get_description(), emqx_app:get_release()]).
% TEST
-endif.
start_autocluster() ->
ekka:callback(stop, fun emqx_machine_boot:stop_apps/0),
ekka:callback(start, fun emqx_machine_boot:ensure_apps_started/0),
%% returns 'ok' or a pid or 'any()' as in spec
_ = ekka:autocluster(emqx),
ok.
stop_apps() ->
?SLOG(notice, #{msg => "stopping_emqx_apps"}),
_ = emqx_alarm_handler:unload(),
ok = emqx_conf_app:unset_config_loaded(),
lists:foreach(fun stop_one_app/1, lists:reverse(sorted_reboot_apps())).
%% Those port apps are terminated after the main apps
%% Don't need to stop when reboot.
stop_port_apps() ->
Loaded = application:loaded_applications(),
lists:foreach(
fun(App) ->
case lists:keymember(App, 1, Loaded) of
true -> stop_one_app(App);
false -> ok
end
end,
[os_mon, jq]
).
stop_one_app(App) ->
?SLOG(debug, #{msg => "stopping_app", app => App}),
try
_ = application:stop(App)
catch
C:E ->
?SLOG(error, #{
msg => "failed_to_stop_app",
app => App,
exception => C,
reason => E
})
end.
ensure_apps_started() ->
?SLOG(notice, #{msg => "(re)starting_emqx_apps"}),
lists:foreach(fun start_one_app/1, sorted_reboot_apps()),
?tp(emqx_machine_boot_apps_started, #{}).
start_one_app(App) ->
?SLOG(debug, #{msg => "starting_app", app => App}),
case application:ensure_all_started(App, restart_type(App)) of
{ok, Apps} ->
?SLOG(debug, #{msg => "started_apps", apps => Apps});
{error, Reason} ->
?SLOG(critical, #{msg => "failed_to_start_app", app => App, reason => Reason}),
error({failed_to_start_app, App, Reason})
end.
restart_type(App) ->
PermanentApps =
?BASIC_PERMANENT_APPS ++ application:get_env(emqx_machine, permanent_applications, []),
case lists:member(App, PermanentApps) of
true ->
permanent;
false ->
temporary
end.
%% list of app names which should be rebooted when:
%% 1. due to static config change
%% 2. after join a cluster
%% the list of (re)started apps depends on release type/edition
reboot_apps() ->
ConfigApps0 = application:get_env(emqx_machine, applications, []),
BaseRebootApps = basic_reboot_apps(),
ConfigApps = lists:filter(fun(App) -> not lists:member(App, BaseRebootApps) end, ConfigApps0),
BaseRebootApps ++ ConfigApps.
basic_reboot_apps() ->
PrivDir = code:priv_dir(emqx_machine),
RebootListPath = filename:join([PrivDir, "reboot_lists.eterm"]),
{ok, [
#{
common_business_apps := CommonBusinessApps,
ee_business_apps := EEBusinessApps,
ce_business_apps := CEBusinessApps
}
]} = file:consult(RebootListPath),
EditionSpecificApps =
case emqx_release:edition() of
ee -> EEBusinessApps;
ce -> CEBusinessApps;
_ -> []
end,
BusinessApps = CommonBusinessApps ++ EditionSpecificApps,
?BASIC_REBOOT_APPS ++ (BusinessApps -- excluded_apps()).
excluded_apps() ->
%% Optional apps _should_ be (re)started automatically, but only
%% when they are found in the release:
[App || App <- ?OPTIONAL_APPS, not is_app(App)].
is_app(Name) ->
case application:load(Name) of
ok -> true;
{error, {already_loaded, _}} -> true;
_ -> false
end.
sorted_reboot_apps() ->
RebootApps = reboot_apps(),
Apps0 = [{App, app_deps(App, RebootApps)} || App <- RebootApps],
Apps = emqx_machine_boot_runtime_deps:inject(Apps0, runtime_deps()),
sorted_reboot_apps(Apps).
app_deps(App, RebootApps) ->
case application:get_key(App, applications) of
undefined -> undefined;
{ok, List} -> lists:filter(fun(A) -> lists:member(A, RebootApps) end, List)
end.
runtime_deps() ->
[
%% `emqx_bridge' is special in that it needs all the bridges apps to
%% be started before it, so that, when it loads the bridges from
%% configuration, the bridge app and its dependencies need to be up.
{emqx_bridge, fun(App) -> lists:prefix("emqx_bridge_", atom_to_list(App)) end},
%% `emqx_connector' also needs to start all connector dependencies for the same reason.
%% Since standalone apps like `emqx_mongodb' are already dependencies of `emqx_bridge_*'
%% apps, we may apply the same tactic for `emqx_connector' and inject individual bridges
%% as its dependencies.
{emqx_connector, fun(App) -> lists:prefix("emqx_bridge_", atom_to_list(App)) end},
%% emqx_fdb is an EE app
{emqx_durable_storage, emqx_fdb},
{emqx_dashboard, emqx_license}
].
sorted_reboot_apps(Apps) ->
G = digraph:new(),
try
NoDepApps = add_apps_to_digraph(G, Apps),
case digraph_utils:topsort(G) of
Sorted when is_list(Sorted) ->
%% ensure emqx_conf boot up first
AllApps = Sorted ++ (NoDepApps -- Sorted),
[emqx_conf | lists:delete(emqx_conf, AllApps)];
false ->
Loops = find_loops(G),
error({circular_application_dependency, Loops})
end
after
digraph:delete(G)
end.
%% Build a dependency graph from the provided application list.
%% Return top-sort result of the apps.
%% Isolated apps without which are not dependency of any other apps are
%% put to the end of the list in the original order.
add_apps_to_digraph(G, Apps) ->
lists:foldl(
fun
({App, undefined}, Acc) ->
?SLOG(debug, #{msg => "app_is_not_loaded", app => App}),
Acc;
({App, []}, Acc) ->
%% use '++' to keep the original order
Acc ++ [App];
({App, Deps}, Acc) ->
add_app_deps_to_digraph(G, App, Deps),
Acc
end,
[],
Apps
).
add_app_deps_to_digraph(G, App, undefined) ->
?SLOG(debug, #{msg => "app_is_not_loaded", app => App}),
%% not loaded
add_app_deps_to_digraph(G, App, []);
add_app_deps_to_digraph(_G, _App, []) ->
ok;
add_app_deps_to_digraph(G, App, [Dep | Deps]) ->
digraph:add_vertex(G, App),
digraph:add_vertex(G, Dep),
%% dep -> app as dependency
digraph:add_edge(G, Dep, App),
add_app_deps_to_digraph(G, App, Deps).
find_loops(G) ->
lists:filtermap(
fun(App) ->
case digraph:get_short_cycle(G, App) of
false -> false;
Apps -> {true, Apps}
end
end,
digraph:vertices(G)
).