fix(emqx_rule_monitor): sleep before retry but not after
This commit is contained in:
parent
6ae2b06ba1
commit
9b194baf69
|
@ -79,8 +79,6 @@
|
||||||
, action_instance_params/0
|
, action_instance_params/0
|
||||||
]).
|
]).
|
||||||
|
|
||||||
-define(T_RETRY, 60000).
|
|
||||||
|
|
||||||
%% redefine this macro to confine the appup scope
|
%% redefine this macro to confine the appup scope
|
||||||
-undef(RAISE).
|
-undef(RAISE).
|
||||||
-define(RAISE(_EXP_, _ERROR_CONTEXT_),
|
-define(RAISE(_EXP_, _ERROR_CONTEXT_),
|
||||||
|
@ -684,8 +682,7 @@ init_resource_with_retrier(Module, OnCreate, ResId, Config) ->
|
||||||
status = #{is_alive => true}},
|
status = #{is_alive => true}},
|
||||||
emqx_rule_registry:add_resource_params(ResParams)
|
emqx_rule_registry:add_resource_params(ResParams)
|
||||||
catch Class:Reason:ST ->
|
catch Class:Reason:ST ->
|
||||||
Interval = persistent_term:get({emqx_rule_engine, resource_restart_interval}, ?T_RETRY),
|
emqx_rule_monitor:ensure_resource_retrier(ResId),
|
||||||
emqx_rule_monitor:ensure_resource_retrier(ResId, Interval),
|
|
||||||
erlang:raise(Class, {init_resource, Reason}, ST)
|
erlang:raise(Class, {init_resource, Reason}, ST)
|
||||||
end.
|
end.
|
||||||
|
|
||||||
|
|
|
@ -32,10 +32,18 @@
|
||||||
-export([ start_link/0
|
-export([ start_link/0
|
||||||
, stop/0
|
, stop/0
|
||||||
, async_refresh_resources_rules/0
|
, async_refresh_resources_rules/0
|
||||||
, ensure_resource_retrier/2
|
, ensure_resource_retrier/1
|
||||||
, retry_loop/3
|
, retry_loop/3
|
||||||
]).
|
]).
|
||||||
|
|
||||||
|
%% for test
|
||||||
|
-export([ put_retry_interval/1
|
||||||
|
, get_retry_interval/0
|
||||||
|
, erase_retry_interval/0
|
||||||
|
]).
|
||||||
|
|
||||||
|
-define(T_RETRY, 60000).
|
||||||
|
|
||||||
start_link() ->
|
start_link() ->
|
||||||
gen_server:start_link({local, ?MODULE}, ?MODULE, [], []).
|
gen_server:start_link({local, ?MODULE}, ?MODULE, [], []).
|
||||||
|
|
||||||
|
@ -46,10 +54,22 @@ init([]) ->
|
||||||
_ = erlang:process_flag(trap_exit, true),
|
_ = erlang:process_flag(trap_exit, true),
|
||||||
{ok, #{retryers => #{}}}.
|
{ok, #{retryers => #{}}}.
|
||||||
|
|
||||||
|
put_retry_interval(I) when is_integer(I) andalso I >= 10 ->
|
||||||
|
_ = persistent_term:put({?MODULE, resource_restart_interval}, I),
|
||||||
|
ok.
|
||||||
|
|
||||||
|
erase_retry_interval() ->
|
||||||
|
_ = persistent_term:erase({?MODULE, resource_restart_interval}),
|
||||||
|
ok.
|
||||||
|
|
||||||
|
get_retry_interval() ->
|
||||||
|
persistent_term:get({?MODULE, resource_restart_interval}, ?T_RETRY).
|
||||||
|
|
||||||
async_refresh_resources_rules() ->
|
async_refresh_resources_rules() ->
|
||||||
gen_server:cast(?MODULE, async_refresh).
|
gen_server:cast(?MODULE, async_refresh).
|
||||||
|
|
||||||
ensure_resource_retrier(ResId, Interval) ->
|
ensure_resource_retrier(ResId) ->
|
||||||
|
Interval = get_retry_interval(),
|
||||||
gen_server:cast(?MODULE, {create_restart_handler, resource, ResId, Interval}).
|
gen_server:cast(?MODULE, {create_restart_handler, resource, ResId, Interval}).
|
||||||
|
|
||||||
handle_call(_Msg, _From, State) ->
|
handle_call(_Msg, _From, State) ->
|
||||||
|
@ -111,11 +131,12 @@ update_object(Tag, Obj, Retryer, State) ->
|
||||||
}.
|
}.
|
||||||
|
|
||||||
create_restart_handler(Tag, Obj, Interval) ->
|
create_restart_handler(Tag, Obj, Interval) ->
|
||||||
?LOG(info, "keep restarting ~p ~p, interval: ~p", [Tag, Obj, Interval]),
|
?LOG(info, "starting_a_retry_loop for ~p ~p, with delay interval: ~p", [Tag, Obj, Interval]),
|
||||||
%% spawn a dedicated process to handle the restarting asynchronously
|
%% spawn a dedicated process to handle the restarting asynchronously
|
||||||
spawn_link(?MODULE, retry_loop, [Tag, Obj, Interval]).
|
spawn_link(?MODULE, retry_loop, [Tag, Obj, Interval]).
|
||||||
|
|
||||||
retry_loop(resource, ResId, Interval) ->
|
retry_loop(resource, ResId, Interval) ->
|
||||||
|
timer:sleep(Interval),
|
||||||
case emqx_rule_registry:find_resource(ResId) of
|
case emqx_rule_registry:find_resource(ResId) of
|
||||||
{ok, #resource{type = Type, config = Config}} ->
|
{ok, #resource{type = Type, config = Config}} ->
|
||||||
try
|
try
|
||||||
|
@ -124,10 +145,15 @@ retry_loop(resource, ResId, Interval) ->
|
||||||
ok = emqx_rule_engine:init_resource(M, F, ResId, Config),
|
ok = emqx_rule_engine:init_resource(M, F, ResId, Config),
|
||||||
refresh_and_enable_rules_of_resource(ResId)
|
refresh_and_enable_rules_of_resource(ResId)
|
||||||
catch
|
catch
|
||||||
Err:Reason:ST ->
|
Err:Reason:Stacktrace ->
|
||||||
?LOG(warning, "init_resource failed: ~p, ~0p",
|
%% do not log stacktrace if it's a throw
|
||||||
[{Err, Reason}, ST]),
|
LogContext =
|
||||||
timer:sleep(Interval),
|
case Err of
|
||||||
|
throw -> Reason;
|
||||||
|
_ -> {Reason, Stacktrace}
|
||||||
|
end,
|
||||||
|
?LOG_SENSITIVE(warning, "init_resource_retry_failed ~p, ~0p", [ResId, LogContext]),
|
||||||
|
%% keep looping
|
||||||
?MODULE:retry_loop(resource, ResId, Interval)
|
?MODULE:retry_loop(resource, ResId, Interval)
|
||||||
end;
|
end;
|
||||||
not_found ->
|
not_found ->
|
||||||
|
|
|
@ -48,7 +48,7 @@ end_per_suite(_Config) ->
|
||||||
ok.
|
ok.
|
||||||
|
|
||||||
init_per_testcase(t_restart_resource, Config) ->
|
init_per_testcase(t_restart_resource, Config) ->
|
||||||
persistent_term:put({emqx_rule_engine, resource_restart_interval}, 100),
|
emqx_rule_monitor:put_retry_interval(100),
|
||||||
Opts = [public, named_table, set, {read_concurrency, true}],
|
Opts = [public, named_table, set, {read_concurrency, true}],
|
||||||
_ = ets:new(?RES_PARAMS_TAB, [{keypos, #resource_params.id}|Opts]),
|
_ = ets:new(?RES_PARAMS_TAB, [{keypos, #resource_params.id}|Opts]),
|
||||||
ets:new(t_restart_resource, [named_table, public]),
|
ets:new(t_restart_resource, [named_table, public]),
|
||||||
|
@ -77,7 +77,6 @@ init_per_testcase(_, Config) ->
|
||||||
Config.
|
Config.
|
||||||
|
|
||||||
end_per_testcase(t_restart_resource, Config) ->
|
end_per_testcase(t_restart_resource, Config) ->
|
||||||
persistent_term:put({emqx_rule_engine, resource_restart_interval}, 60000),
|
|
||||||
ets:delete(t_restart_resource),
|
ets:delete(t_restart_resource),
|
||||||
common_end_per_testcases(),
|
common_end_per_testcases(),
|
||||||
Config;
|
Config;
|
||||||
|
@ -91,7 +90,9 @@ end_per_testcase(_, Config) ->
|
||||||
|
|
||||||
common_init_per_testcase() ->
|
common_init_per_testcase() ->
|
||||||
{ok, _} = emqx_rule_monitor:start_link().
|
{ok, _} = emqx_rule_monitor:start_link().
|
||||||
|
|
||||||
common_end_per_testcases() ->
|
common_end_per_testcases() ->
|
||||||
|
emqx_rule_monitor:erase_retry_interval(),
|
||||||
emqx_rule_monitor:stop().
|
emqx_rule_monitor:stop().
|
||||||
|
|
||||||
t_restart_resource(_) ->
|
t_restart_resource(_) ->
|
||||||
|
|
Loading…
Reference in New Issue