feat(schema_registry): add support for protobuf schemas

Fixes https://emqx.atlassian.net/browse/EMQX-9470
This commit is contained in:
Thales Macedo Garitezi 2023-04-14 17:33:25 -03:00
parent 14e807adeb
commit 9d15247dd5
15 changed files with 640 additions and 101 deletions

5
build
View File

@ -124,10 +124,7 @@ make_docs() {
} }
assert_no_compile_time_only_deps() { assert_no_compile_time_only_deps() {
if [ "$("$FIND" "_build/$PROFILE/rel/emqx/lib/" -maxdepth 1 -name 'gpb-*' -type d)" != "" ]; then :
echo "gpb should not be included in the release"
exit 1
fi
} }
make_rel() { make_rel() {

View File

@ -0,0 +1 @@
Add support for [Protocol Buffers](https://protobuf.dev/) schemas in Schema Registry.

View File

@ -10,14 +10,19 @@
-define(SCHEMA_REGISTRY_SHARD, emqx_ee_schema_registry_shard). -define(SCHEMA_REGISTRY_SHARD, emqx_ee_schema_registry_shard).
-define(SERDE_TAB, emqx_ee_schema_registry_serde_tab). -define(SERDE_TAB, emqx_ee_schema_registry_serde_tab).
-define(PROTOBUF_CACHE_TAB, emqx_ee_schema_registry_protobuf_cache_tab).
-type schema_name() :: binary(). -type schema_name() :: binary().
-type schema_source() :: binary(). -type schema_source() :: binary().
-type encoded_data() :: iodata(). -type encoded_data() :: iodata().
-type decoded_data() :: map(). -type decoded_data() :: map().
-type serializer() :: fun((decoded_data()) -> encoded_data()). -type serializer() ::
-type deserializer() :: fun((encoded_data()) -> decoded_data()). fun((decoded_data()) -> encoded_data())
| fun((decoded_data(), term()) -> encoded_data()).
-type deserializer() ::
fun((encoded_data()) -> decoded_data())
| fun((encoded_data(), term()) -> decoded_data()).
-type destructor() :: fun(() -> ok). -type destructor() :: fun(() -> ok).
-type serde_type() :: avro. -type serde_type() :: avro.
-type serde_opts() :: map(). -type serde_opts() :: map().
@ -29,6 +34,18 @@
destructor :: destructor() destructor :: destructor()
}). }).
-type serde() :: #serde{}. -type serde() :: #serde{}.
-record(protobuf_cache, {
fingerprint,
module,
module_binary
}).
-type protobuf_cache() :: #protobuf_cache{
fingerprint :: binary(),
module :: module(),
module_binary :: binary()
}.
-type serde_map() :: #{ -type serde_map() :: #{
name := schema_name(), name := schema_name(),
serializer := serializer(), serializer := serializer(),

View File

@ -4,7 +4,8 @@
{deps, [ {deps, [
{emqx, {path, "../../apps/emqx"}}, {emqx, {path, "../../apps/emqx"}},
{emqx_utils, {path, "../../apps/emqx_utils"}}, {emqx_utils, {path, "../../apps/emqx_utils"}},
{erlavro, {git, "https://github.com/klarna/erlavro.git", {tag, "2.9.8"}}} {erlavro, {git, "https://github.com/klarna/erlavro.git", {tag, "2.9.8"}}},
{gpb, "4.19.7"}
]}. ]}.
{shell, [ {shell, [

View File

@ -6,7 +6,8 @@
{applications, [ {applications, [
kernel, kernel,
stdlib, stdlib,
erlavro erlavro,
gpb
]}, ]},
{env, []}, {env, []},
{modules, []}, {modules, []},

View File

@ -176,7 +176,14 @@ create_tables() ->
{record_name, serde}, {record_name, serde},
{attributes, record_info(fields, serde)} {attributes, record_info(fields, serde)}
]), ]),
ok = mria:wait_for_tables([?SERDE_TAB]), ok = mria:create_table(?PROTOBUF_CACHE_TAB, [
{type, set},
{rlog_shard, ?SCHEMA_REGISTRY_SHARD},
{storage, disc_only_copies},
{record_name, protobuf_cache},
{attributes, record_info(fields, protobuf_cache)}
]),
ok = mria:wait_for_tables([?SERDE_TAB, ?PROTOBUF_CACHE_TAB]),
ok. ok.
do_build_serdes(Schemas) -> do_build_serdes(Schemas) ->

View File

@ -53,10 +53,20 @@ fields(avro) ->
mk(emqx_schema:json_binary(), #{required => true, desc => ?DESC("schema_source")})}, mk(emqx_schema:json_binary(), #{required => true, desc => ?DESC("schema_source")})},
{description, mk(binary(), #{default => <<>>, desc => ?DESC("schema_description")})} {description, mk(binary(), #{default => <<>>, desc => ?DESC("schema_description")})}
]; ];
fields(protobuf) ->
[
{type, mk(protobuf, #{required => true, desc => ?DESC("schema_type")})},
{source, mk(binary(), #{required => true, desc => ?DESC("schema_source")})},
{description, mk(binary(), #{default => <<>>, desc => ?DESC("schema_description")})}
];
fields("get_avro") -> fields("get_avro") ->
[{name, mk(binary(), #{required => true, desc => ?DESC("schema_name")})} | fields(avro)]; [{name, mk(binary(), #{required => true, desc => ?DESC("schema_name")})} | fields(avro)];
fields("get_protobuf") ->
[{name, mk(binary(), #{required => true, desc => ?DESC("schema_name")})} | fields(protobuf)];
fields("put_avro") -> fields("put_avro") ->
fields(avro); fields(avro);
fields("put_protobuf") ->
fields(protobuf);
fields("post_" ++ Type) -> fields("post_" ++ Type) ->
fields("get_" ++ Type). fields("get_" ++ Type).
@ -64,6 +74,8 @@ desc(?CONF_KEY_ROOT) ->
?DESC("schema_registry_root"); ?DESC("schema_registry_root");
desc(avro) -> desc(avro) ->
?DESC("avro_type"); ?DESC("avro_type");
desc(protobuf) ->
?DESC("protobuf_type");
desc(_) -> desc(_) ->
undefined. undefined.
@ -96,7 +108,7 @@ mk(Type, Meta) -> hoconsc:mk(Type, Meta).
ref(Name) -> hoconsc:ref(?MODULE, Name). ref(Name) -> hoconsc:ref(?MODULE, Name).
supported_serde_types() -> supported_serde_types() ->
[avro]. [avro, protobuf].
refs() -> refs() ->
[ref(Type) || Type <- supported_serde_types()]. [ref(Type) || Type <- supported_serde_types()].
@ -105,6 +117,8 @@ refs(#{<<"type">> := TypeAtom} = Value) when is_atom(TypeAtom) ->
refs(Value#{<<"type">> := atom_to_binary(TypeAtom)}); refs(Value#{<<"type">> := atom_to_binary(TypeAtom)});
refs(#{<<"type">> := <<"avro">>}) -> refs(#{<<"type">> := <<"avro">>}) ->
[ref(avro)]; [ref(avro)];
refs(#{<<"type">> := <<"protobuf">>}) ->
[ref(protobuf)];
refs(_) -> refs(_) ->
Expected = lists:join(" | ", [atom_to_list(T) || T <- supported_serde_types()]), Expected = lists:join(" | ", [atom_to_list(T) || T <- supported_serde_types()]),
throw(#{ throw(#{
@ -113,12 +127,14 @@ refs(_) ->
}). }).
refs_get_api() -> refs_get_api() ->
[ref("get_avro")]. [ref("get_avro"), ref("get_protobuf")].
refs_get_api(#{<<"type">> := TypeAtom} = Value) when is_atom(TypeAtom) -> refs_get_api(#{<<"type">> := TypeAtom} = Value) when is_atom(TypeAtom) ->
refs(Value#{<<"type">> := atom_to_binary(TypeAtom)}); refs(Value#{<<"type">> := atom_to_binary(TypeAtom)});
refs_get_api(#{<<"type">> := <<"avro">>}) -> refs_get_api(#{<<"type">> := <<"avro">>}) ->
[ref("get_avro")]; [ref("get_avro")];
refs_get_api(#{<<"type">> := <<"protobuf">>}) ->
[ref("get_protobuf")];
refs_get_api(_) -> refs_get_api(_) ->
Expected = lists:join(" | ", [atom_to_list(T) || T <- supported_serde_types()]), Expected = lists:join(" | ", [atom_to_list(T) || T <- supported_serde_types()]),
throw(#{ throw(#{

View File

@ -4,8 +4,11 @@
-module(emqx_ee_schema_registry_serde). -module(emqx_ee_schema_registry_serde).
-include("emqx_ee_schema_registry.hrl"). -include("emqx_ee_schema_registry.hrl").
-include_lib("emqx/include/logger.hrl").
-include_lib("snabbkaffe/include/snabbkaffe.hrl"). -include_lib("snabbkaffe/include/snabbkaffe.hrl").
-elvis([{elvis_style, invalid_dynamic_call, #{ignore => [emqx_ee_schema_registry_serde]}}]).
%% API %% API
-export([ -export([
decode/2, decode/2,
@ -55,6 +58,27 @@ make_serde(avro, Name, Source0) ->
?tp(serde_destroyed, #{type => avro, name => Name}), ?tp(serde_destroyed, #{type => avro, name => Name}),
ok ok
end, end,
{Serializer, Deserializer, Destructor};
make_serde(protobuf, Name, Source) ->
SerdeMod = make_protobuf_serde_mod(Name, Source),
Serializer =
fun(DecodedData0, MessageName0) ->
DecodedData = emqx_utils_maps:safe_atom_key_map(DecodedData0),
MessageName = binary_to_existing_atom(MessageName0, utf8),
SerdeMod:encode_msg(DecodedData, MessageName)
end,
Deserializer =
fun(EncodedData, MessageName0) ->
MessageName = binary_to_existing_atom(MessageName0, utf8),
Decoded = SerdeMod:decode_msg(EncodedData, MessageName),
emqx_utils_maps:binary_key_map(Decoded)
end,
Destructor =
fun() ->
unload_code(SerdeMod),
?tp(serde_destroyed, #{type => protobuf, name => Name}),
ok
end,
{Serializer, Deserializer, Destructor}. {Serializer, Deserializer, Destructor}.
%%------------------------------------------------------------------------------ %%------------------------------------------------------------------------------
@ -68,3 +92,111 @@ inject_avro_name(Name, Source0) ->
Schema0 = emqx_utils_json:decode(Source0, [return_maps]), Schema0 = emqx_utils_json:decode(Source0, [return_maps]),
Schema = Schema0#{<<"name">> => Name}, Schema = Schema0#{<<"name">> => Name},
emqx_utils_json:encode(Schema). emqx_utils_json:encode(Schema).
-spec make_protobuf_serde_mod(schema_name(), schema_source()) -> module().
make_protobuf_serde_mod(Name, Source) ->
{SerdeMod0, SerdeModFileName} = protobuf_serde_mod_name(Name),
case lazy_generate_protobuf_code(SerdeMod0, Source) of
{ok, SerdeMod, ModBinary} ->
load_code(SerdeMod, SerdeModFileName, ModBinary),
SerdeMod;
{error, #{error := Error, warnings := Warnings}} ->
?SLOG(
warning,
#{
msg => "error_generating_protobuf_code",
error => Error,
warnings => Warnings
}
),
error({invalid_protobuf_schema, Error})
end.
-spec protobuf_serde_mod_name(schema_name()) -> {module(), string()}.
protobuf_serde_mod_name(Name) ->
%% must be a string (list)
SerdeModName = "$schema_parser_" ++ binary_to_list(Name),
SerdeMod = list_to_atom(SerdeModName),
%% the "path" to the module, for `code:load_binary'.
SerdeModFileName = SerdeModName ++ ".memory",
{SerdeMod, SerdeModFileName}.
-spec lazy_generate_protobuf_code(module(), schema_source()) ->
{ok, module(), binary()} | {error, #{error := term(), warnings := [term()]}}.
lazy_generate_protobuf_code(SerdeMod0, Source) ->
%% We run this inside a transaction with locks to avoid running
%% the compile on all nodes; only one will get the lock, compile
%% the schema, and other nodes will simply read the final result.
{atomic, Res} = mria:transaction(
?SCHEMA_REGISTRY_SHARD,
fun lazy_generate_protobuf_code_trans/2,
[SerdeMod0, Source]
),
Res.
-spec lazy_generate_protobuf_code_trans(module(), schema_source()) ->
{ok, module(), binary()} | {error, #{error := term(), warnings := [term()]}}.
lazy_generate_protobuf_code_trans(SerdeMod0, Source) ->
Fingerprint = erlang:md5(Source),
_ = mnesia:lock({record, ?PROTOBUF_CACHE_TAB, Fingerprint}, write),
case mnesia:read(?PROTOBUF_CACHE_TAB, Fingerprint) of
[#protobuf_cache{module = SerdeMod, module_binary = ModBinary}] ->
?tp(schema_registry_protobuf_cache_hit, #{}),
{ok, SerdeMod, ModBinary};
[] ->
?tp(schema_registry_protobuf_cache_miss, #{}),
case generate_protobuf_code(SerdeMod0, Source) of
{ok, SerdeMod, ModBinary} ->
CacheEntry = #protobuf_cache{
fingerprint = Fingerprint,
module = SerdeMod,
module_binary = ModBinary
},
ok = mnesia:write(?PROTOBUF_CACHE_TAB, CacheEntry, write),
{ok, SerdeMod, ModBinary};
{ok, SerdeMod, ModBinary, _Warnings} ->
CacheEntry = #protobuf_cache{
fingerprint = Fingerprint,
module = SerdeMod,
module_binary = ModBinary
},
ok = mnesia:write(?PROTOBUF_CACHE_TAB, CacheEntry, write),
{ok, SerdeMod, ModBinary};
error ->
{error, #{error => undefined, warnings => []}};
{error, Error} ->
{error, #{error => Error, warnings => []}};
{error, Error, Warnings} ->
{error, #{error => Error, warnings => Warnings}}
end
end.
generate_protobuf_code(SerdeMod, Source) ->
gpb_compile:string(
SerdeMod,
Source,
[
binary,
strings_as_binaries,
{maps, true},
%% Fixme: currently, some bug in `gpb' prevents this
%% option from working with `oneof' types... We're then
%% forced to use atom key maps.
%% {maps_key_type, binary},
{maps_oneof, flat},
{verify, always},
{maps_unset_optional, omitted}
]
).
-spec load_code(module(), string(), binary()) -> ok.
load_code(SerdeMod, SerdeModFileName, ModBinary) ->
_ = code:purge(SerdeMod),
{module, SerdeMod} = code:load_binary(SerdeMod, SerdeModFileName, ModBinary),
ok.
-spec unload_code(module()) -> ok.
unload_code(SerdeMod) ->
_ = code:purge(SerdeMod),
_ = code:delete(SerdeMod),
ok.

View File

@ -21,11 +21,19 @@
%%------------------------------------------------------------------------------ %%------------------------------------------------------------------------------
all() -> all() ->
[{group, avro}]. [{group, avro}, {group, protobuf}].
groups() -> groups() ->
TCs = emqx_common_test_helpers:all(?MODULE), AllTCs = emqx_common_test_helpers:all(?MODULE),
[{avro, TCs}]. ProtobufOnlyTCs = protobuf_only_tcs(),
TCs = AllTCs -- ProtobufOnlyTCs,
[{avro, TCs}, {protobuf, AllTCs}].
protobuf_only_tcs() ->
[
t_protobuf_union_encode,
t_protobuf_union_decode
].
init_per_suite(Config) -> init_per_suite(Config) ->
emqx_config:save_schema_mod_and_names(emqx_ee_schema_registry_schema), emqx_config:save_schema_mod_and_names(emqx_ee_schema_registry_schema),
@ -38,6 +46,8 @@ end_per_suite(_Config) ->
init_per_group(avro, Config) -> init_per_group(avro, Config) ->
[{serde_type, avro} | Config]; [{serde_type, avro} | Config];
init_per_group(protobuf, Config) ->
[{serde_type, protobuf} | Config];
init_per_group(_Group, Config) -> init_per_group(_Group, Config) ->
Config. Config.
@ -95,8 +105,12 @@ create_rule_http(RuleParams) ->
Path = emqx_mgmt_api_test_util:api_path(["rules"]), Path = emqx_mgmt_api_test_util:api_path(["rules"]),
AuthHeader = emqx_mgmt_api_test_util:auth_header_(), AuthHeader = emqx_mgmt_api_test_util:auth_header_(),
case emqx_mgmt_api_test_util:request_api(post, Path, "", AuthHeader, Params) of case emqx_mgmt_api_test_util:request_api(post, Path, "", AuthHeader, Params) of
{ok, Res} -> {ok, emqx_utils_json:decode(Res, [return_maps])}; {ok, Res0} ->
Error -> Error Res = #{<<"id">> := RuleId} = emqx_utils_json:decode(Res0, [return_maps]),
on_exit(fun() -> ok = emqx_rule_engine:delete_rule(RuleId) end),
{ok, Res};
Error ->
Error
end. end.
schema_params(avro) -> schema_params(avro) ->
@ -108,35 +122,174 @@ schema_params(avro) ->
] ]
}, },
SourceBin = emqx_utils_json:encode(Source), SourceBin = emqx_utils_json:encode(Source),
#{type => avro, source => SourceBin}. #{type => avro, source => SourceBin};
schema_params(protobuf) ->
SourceBin =
<<
"message Person {\n"
" required string name = 1;\n"
" required int32 id = 2;\n"
" optional string email = 3;\n"
" }\n"
"message UnionValue {\n"
" oneof u {\n"
" int32 a = 1;\n"
" string b = 2;\n"
" }\n"
"}\n"
>>,
#{type => protobuf, source => SourceBin}.
create_serde(SerdeType, SerdeName) -> create_serde(SerdeType, SerdeName) ->
Schema = schema_params(SerdeType), Schema = schema_params(SerdeType),
ok = emqx_ee_schema_registry:add_schema(SerdeName, Schema), ok = emqx_ee_schema_registry:add_schema(SerdeName, Schema),
ok. ok.
sql_for(avro, encode_decode1) -> test_params_for(avro, encode_decode1) ->
<< SQL =
"select\n" <<
" schema_decode('my_serde',\n" "select\n"
" schema_encode('my_serde', json_decode(payload))) as decoded,\n" " schema_decode('my_serde',\n"
" decoded.i as decoded_int,\n" " schema_encode('my_serde', json_decode(payload))) as decoded,\n\n"
" decoded.s as decoded_string\n" " decoded.i as decoded_int,\n"
" from t" " decoded.s as decoded_string\n"
>>; "from t\n"
sql_for(avro, encode1) -> >>,
<< Payload = #{<<"i">> => 10, <<"s">> => <<"text">>},
"select\n" ExpectedRuleOutput =
" schema_encode('my_serde', json_decode(payload)) as encoded\n" #{
" from t" <<"decoded">> => #{<<"i">> => 10, <<"s">> => <<"text">>},
>>; <<"decoded_int">> => 10,
sql_for(avro, decode1) -> <<"decoded_string">> => <<"text">>
<< },
"select\n" ExtraArgs = [],
" schema_decode('my_serde', payload) as decoded\n" #{
" from t" sql => SQL,
>>; payload => Payload,
sql_for(Type, Name) -> expected_rule_output => ExpectedRuleOutput,
extra_args => ExtraArgs
};
test_params_for(avro, encode1) ->
SQL =
<<
"select\n"
" schema_encode('my_serde', json_decode(payload)) as encoded\n"
"from t\n"
>>,
Payload = #{<<"i">> => 10, <<"s">> => <<"text">>},
ExtraArgs = [],
#{
sql => SQL,
payload => Payload,
extra_args => ExtraArgs
};
test_params_for(avro, decode1) ->
SQL =
<<
"select\n"
" schema_decode('my_serde', payload) as decoded\n"
"from t\n"
>>,
Payload = #{<<"i">> => 10, <<"s">> => <<"text">>},
ExtraArgs = [],
#{
sql => SQL,
payload => Payload,
extra_args => ExtraArgs
};
test_params_for(protobuf, encode_decode1) ->
SQL =
<<
"select\n"
" schema_decode('my_serde',\n"
" schema_encode('my_serde', json_decode(payload), 'Person'),\n"
" 'Person') as decoded,\n"
" decoded.name as decoded_name,\n"
" decoded.email as decoded_email,\n"
" decoded.id as decoded_id\n"
"from t\n"
>>,
Payload = #{<<"name">> => <<"some name">>, <<"id">> => 10, <<"email">> => <<"emqx@emqx.io">>},
ExpectedRuleOutput =
#{
<<"decoded">> =>
#{
<<"email">> => <<"emqx@emqx.io">>,
<<"id">> => 10,
<<"name">> => <<"some name">>
},
<<"decoded_email">> => <<"emqx@emqx.io">>,
<<"decoded_id">> => 10,
<<"decoded_name">> => <<"some name">>
},
ExtraArgs = [<<"Person">>],
#{
sql => SQL,
payload => Payload,
extra_args => ExtraArgs,
expected_rule_output => ExpectedRuleOutput
};
test_params_for(protobuf, decode1) ->
SQL =
<<
"select\n"
" schema_decode('my_serde', payload, 'Person') as decoded\n"
"from t\n"
>>,
Payload = #{<<"name">> => <<"some name">>, <<"id">> => 10, <<"email">> => <<"emqx@emqx.io">>},
ExtraArgs = [<<"Person">>],
#{
sql => SQL,
payload => Payload,
extra_args => ExtraArgs
};
test_params_for(protobuf, encode1) ->
SQL =
<<
"select\n"
" schema_encode('my_serde', json_decode(payload), 'Person') as encoded\n"
"from t\n"
>>,
Payload = #{<<"name">> => <<"some name">>, <<"id">> => 10, <<"email">> => <<"emqx@emqx.io">>},
ExtraArgs = [<<"Person">>],
#{
sql => SQL,
payload => Payload,
extra_args => ExtraArgs
};
test_params_for(protobuf, union1) ->
SQL =
<<
"select\n"
" schema_decode('my_serde', payload, 'UnionValue') as decoded,\n"
" decoded.a as decoded_a,\n"
" decoded.b as decoded_b\n"
"from t\n"
>>,
PayloadA = #{<<"a">> => 10},
PayloadB = #{<<"b">> => <<"string">>},
ExtraArgs = [<<"UnionValue">>],
#{
sql => SQL,
payload => #{a => PayloadA, b => PayloadB},
extra_args => ExtraArgs
};
test_params_for(protobuf, union2) ->
SQL =
<<
"select\n"
" schema_encode('my_serde', json_decode(payload), 'UnionValue') as encoded\n"
"from t\n"
>>,
PayloadA = #{<<"a">> => 10},
PayloadB = #{<<"b">> => <<"string">>},
ExtraArgs = [<<"UnionValue">>],
#{
sql => SQL,
payload => #{a => PayloadA, b => PayloadB},
extra_args => ExtraArgs
};
test_params_for(Type, Name) ->
ct:fail("unimplemented: ~p", [{Type, Name}]). ct:fail("unimplemented: ~p", [{Type, Name}]).
clear_schemas() -> clear_schemas() ->
@ -238,6 +391,40 @@ wait_for_cluster_rpc(Node) ->
true = is_pid(erpc:call(Node, erlang, whereis, [emqx_config_handler])) true = is_pid(erpc:call(Node, erlang, whereis, [emqx_config_handler]))
). ).
serde_deletion_calls_destructor_spec(#{serde_type := SerdeType}, Trace) ->
?assert(
?strict_causality(
#{?snk_kind := will_delete_schema},
#{?snk_kind := serde_destroyed, type := SerdeType},
Trace
)
),
ok.
protobuf_unique_cache_hit_spec(#{serde_type := protobuf} = Res, Trace) ->
#{nodes := Nodes} = Res,
CacheEvents = ?of_kind(
[
schema_registry_protobuf_cache_hit,
schema_registry_protobuf_cache_miss
],
Trace
),
?assertMatch(
[
schema_registry_protobuf_cache_hit,
schema_registry_protobuf_cache_miss
],
lists:sort(?projection(?snk_kind, CacheEvents))
),
?assertEqual(
lists:usort(Nodes),
lists:usort([N || #{?snk_meta := #{node := N}} <- CacheEvents])
),
ok;
protobuf_unique_cache_hit_spec(_Res, _Trace) ->
ok.
%%------------------------------------------------------------------------------ %%------------------------------------------------------------------------------
%% Testcases %% Testcases
%%------------------------------------------------------------------------------ %%------------------------------------------------------------------------------
@ -259,27 +446,16 @@ t_encode_decode(Config) ->
SerdeType = ?config(serde_type, Config), SerdeType = ?config(serde_type, Config),
SerdeName = my_serde, SerdeName = my_serde,
ok = create_serde(SerdeType, SerdeName), ok = create_serde(SerdeType, SerdeName),
{ok, #{<<"id">> := RuleId}} = create_rule_http(#{sql => sql_for(SerdeType, encode_decode1)}), #{
on_exit(fun() -> ok = emqx_rule_engine:delete_rule(RuleId) end), sql := SQL,
Payload = #{<<"i">> => 10, <<"s">> => <<"text">>}, payload := Payload,
expected_rule_output := ExpectedRuleOutput
} = test_params_for(SerdeType, encode_decode1),
{ok, _} = create_rule_http(#{sql => SQL}),
PayloadBin = emqx_utils_json:encode(Payload), PayloadBin = emqx_utils_json:encode(Payload),
emqx:publish(emqx_message:make(<<"t">>, PayloadBin)), emqx:publish(emqx_message:make(<<"t">>, PayloadBin)),
Res = receive_action_results(), Res = receive_action_results(),
?assertMatch( ?assertMatch(#{data := ExpectedRuleOutput}, Res),
#{
data :=
#{
<<"decoded">> :=
#{
<<"i">> := 10,
<<"s">> := <<"text">>
},
<<"decoded_int">> := 10,
<<"decoded_string">> := <<"text">>
}
},
Res
),
ok. ok.
t_delete_serde(Config) -> t_delete_serde(Config) ->
@ -308,9 +484,12 @@ t_encode(Config) ->
SerdeType = ?config(serde_type, Config), SerdeType = ?config(serde_type, Config),
SerdeName = my_serde, SerdeName = my_serde,
ok = create_serde(SerdeType, SerdeName), ok = create_serde(SerdeType, SerdeName),
{ok, #{<<"id">> := RuleId}} = create_rule_http(#{sql => sql_for(SerdeType, encode1)}), #{
on_exit(fun() -> ok = emqx_rule_engine:delete_rule(RuleId) end), sql := SQL,
Payload = #{<<"i">> => 10, <<"s">> => <<"text">>}, payload := Payload,
extra_args := ExtraArgs
} = test_params_for(SerdeType, encode1),
{ok, _} = create_rule_http(#{sql => SQL}),
PayloadBin = emqx_utils_json:encode(Payload), PayloadBin = emqx_utils_json:encode(Payload),
emqx:publish(emqx_message:make(<<"t">>, PayloadBin)), emqx:publish(emqx_message:make(<<"t">>, PayloadBin)),
Published = receive_published(?LINE), Published = receive_published(?LINE),
@ -320,18 +499,21 @@ t_encode(Config) ->
), ),
#{payload := #{<<"encoded">> := Encoded}} = Published, #{payload := #{<<"encoded">> := Encoded}} = Published,
{ok, #{deserializer := Deserializer}} = emqx_ee_schema_registry:get_serde(SerdeName), {ok, #{deserializer := Deserializer}} = emqx_ee_schema_registry:get_serde(SerdeName),
?assertEqual(Payload, Deserializer(Encoded)), ?assertEqual(Payload, apply(Deserializer, [Encoded | ExtraArgs])),
ok. ok.
t_decode(Config) -> t_decode(Config) ->
SerdeType = ?config(serde_type, Config), SerdeType = ?config(serde_type, Config),
SerdeName = my_serde, SerdeName = my_serde,
ok = create_serde(SerdeType, SerdeName), ok = create_serde(SerdeType, SerdeName),
{ok, #{<<"id">> := RuleId}} = create_rule_http(#{sql => sql_for(SerdeType, decode1)}), #{
on_exit(fun() -> ok = emqx_rule_engine:delete_rule(RuleId) end), sql := SQL,
Payload = #{<<"i">> => 10, <<"s">> => <<"text">>}, payload := Payload,
extra_args := ExtraArgs
} = test_params_for(SerdeType, decode1),
{ok, _} = create_rule_http(#{sql => SQL}),
{ok, #{serializer := Serializer}} = emqx_ee_schema_registry:get_serde(SerdeName), {ok, #{serializer := Serializer}} = emqx_ee_schema_registry:get_serde(SerdeName),
EncodedBin = Serializer(Payload), EncodedBin = apply(Serializer, [Payload | ExtraArgs]),
emqx:publish(emqx_message:make(<<"t">>, EncodedBin)), emqx:publish(emqx_message:make(<<"t">>, EncodedBin)),
Published = receive_published(?LINE), Published = receive_published(?LINE),
?assertMatch( ?assertMatch(
@ -342,6 +524,76 @@ t_decode(Config) ->
?assertEqual(Payload, Decoded), ?assertEqual(Payload, Decoded),
ok. ok.
t_protobuf_union_encode(Config) ->
SerdeType = ?config(serde_type, Config),
?assertEqual(protobuf, SerdeType),
SerdeName = my_serde,
ok = create_serde(SerdeType, SerdeName),
#{
sql := SQL,
payload := #{a := PayloadA, b := PayloadB},
extra_args := ExtraArgs
} = test_params_for(SerdeType, union1),
{ok, _} = create_rule_http(#{sql => SQL}),
{ok, #{serializer := Serializer}} = emqx_ee_schema_registry:get_serde(SerdeName),
EncodedBinA = apply(Serializer, [PayloadA | ExtraArgs]),
emqx:publish(emqx_message:make(<<"t">>, EncodedBinA)),
PublishedA = receive_published(?LINE),
?assertMatch(
#{payload := #{<<"decoded">> := _}},
PublishedA
),
#{payload := #{<<"decoded">> := DecodedA}} = PublishedA,
?assertEqual(PayloadA, DecodedA),
EncodedBinB = apply(Serializer, [PayloadB | ExtraArgs]),
emqx:publish(emqx_message:make(<<"t">>, EncodedBinB)),
PublishedB = receive_published(?LINE),
?assertMatch(
#{payload := #{<<"decoded">> := _}},
PublishedB
),
#{payload := #{<<"decoded">> := DecodedB}} = PublishedB,
?assertEqual(PayloadB, DecodedB),
ok.
t_protobuf_union_decode(Config) ->
SerdeType = ?config(serde_type, Config),
?assertEqual(protobuf, SerdeType),
SerdeName = my_serde,
ok = create_serde(SerdeType, SerdeName),
#{
sql := SQL,
payload := #{a := PayloadA, b := PayloadB},
extra_args := ExtraArgs
} = test_params_for(SerdeType, union2),
{ok, _} = create_rule_http(#{sql => SQL}),
{ok, #{deserializer := Deserializer}} = emqx_ee_schema_registry:get_serde(SerdeName),
EncodedBinA = emqx_utils_json:encode(PayloadA),
emqx:publish(emqx_message:make(<<"t">>, EncodedBinA)),
PublishedA = receive_published(?LINE),
?assertMatch(
#{payload := #{<<"encoded">> := _}},
PublishedA
),
#{payload := #{<<"encoded">> := EncodedA}} = PublishedA,
?assertEqual(PayloadA, apply(Deserializer, [EncodedA | ExtraArgs])),
EncodedBinB = emqx_utils_json:encode(PayloadB),
emqx:publish(emqx_message:make(<<"t">>, EncodedBinB)),
PublishedB = receive_published(?LINE),
?assertMatch(
#{payload := #{<<"encoded">> := _}},
PublishedB
),
#{payload := #{<<"encoded">> := EncodedB}} = PublishedB,
?assertEqual(PayloadB, apply(Deserializer, [EncodedB | ExtraArgs])),
ok.
t_fail_rollback(Config) -> t_fail_rollback(Config) ->
SerdeType = ?config(serde_type, Config), SerdeType = ?config(serde_type, Config),
OkSchema = emqx_utils_maps:binary_key_map(schema_params(SerdeType)), OkSchema = emqx_utils_maps:binary_key_map(schema_params(SerdeType)),
@ -369,6 +621,10 @@ t_cluster_serde_build(Config) ->
Cluster = cluster(Config), Cluster = cluster(Config),
SerdeName = my_serde, SerdeName = my_serde,
Schema = schema_params(SerdeType), Schema = schema_params(SerdeType),
#{
payload := Payload,
extra_args := ExtraArgs
} = test_params_for(SerdeType, encode_decode1),
?check_trace( ?check_trace(
begin begin
Nodes = [N1, N2 | _] = start_cluster(Cluster), Nodes = [N1, N2 | _] = start_cluster(Cluster),
@ -385,8 +641,14 @@ t_cluster_serde_build(Config) ->
Res0 = emqx_ee_schema_registry:get_serde(SerdeName), Res0 = emqx_ee_schema_registry:get_serde(SerdeName),
?assertMatch({ok, #{}}, Res0, #{node => N}), ?assertMatch({ok, #{}}, Res0, #{node => N}),
{ok, #{serializer := Serializer, deserializer := Deserializer}} = Res0, {ok, #{serializer := Serializer, deserializer := Deserializer}} = Res0,
Payload = #{<<"i">> => 10, <<"s">> => <<"text">>}, ?assertEqual(
?assertEqual(Payload, Deserializer(Serializer(Payload)), #{node => N}), Payload,
apply(
Deserializer,
[apply(Serializer, [Payload | ExtraArgs]) | ExtraArgs]
),
#{node => N}
),
ok ok
end) end)
end, end,
@ -417,17 +679,11 @@ t_cluster_serde_build(Config) ->
end, end,
Nodes Nodes
), ),
ok #{serde_type => SerdeType, nodes => Nodes}
end, end,
fun(Trace) -> [
?assert( {"destructor is always called", fun ?MODULE:serde_deletion_calls_destructor_spec/2},
?strict_causality( {"protobuf is only built on one node", fun ?MODULE:protobuf_unique_cache_hit_spec/2}
#{?snk_kind := will_delete_schema}, ]
#{?snk_kind := serde_destroyed, type := SerdeType},
Trace
)
),
ok
end
), ),
ok. ok.

View File

@ -19,7 +19,17 @@
%%------------------------------------------------------------------------------ %%------------------------------------------------------------------------------
all() -> all() ->
emqx_common_test_helpers:all(?MODULE). [
{group, avro},
{group, protobuf}
].
groups() ->
AllTCs = emqx_common_test_helpers:all(?MODULE),
[
{avro, AllTCs},
{protobuf, AllTCs}
].
init_per_suite(Config) -> init_per_suite(Config) ->
emqx_config:save_schema_mod_and_names(emqx_ee_schema_registry_schema), emqx_config:save_schema_mod_and_names(emqx_ee_schema_registry_schema),
@ -30,6 +40,48 @@ end_per_suite(_Config) ->
emqx_mgmt_api_test_util:end_suite(lists:reverse(?APPS)), emqx_mgmt_api_test_util:end_suite(lists:reverse(?APPS)),
ok. ok.
init_per_group(avro, Config) ->
Source = #{
type => record,
fields => [
#{name => <<"i">>, type => <<"int">>},
#{name => <<"s">>, type => <<"string">>}
]
},
SourceBin = emqx_utils_json:encode(Source),
InvalidSourceBin = <<"{}">>,
[
{serde_type, avro},
{schema_source, SourceBin},
{invalid_schema_source, InvalidSourceBin}
| Config
];
init_per_group(protobuf, Config) ->
SourceBin =
<<
"message Person {\n"
" required string name = 1;\n"
" required int32 id = 2;\n"
" optional string email = 3;\n"
" }\n"
"message UnionValue {\n"
" oneof u {\n"
" int32 a = 1;\n"
" string b = 2;\n"
" }\n"
"}\n"
>>,
InvalidSourceBin = <<"xxxx">>,
[
{serde_type, protobuf},
{schema_source, SourceBin},
{invalid_schema_source, InvalidSourceBin}
| Config
].
end_per_group(_Group, _Config) ->
ok.
init_per_testcase(_TestCase, Config) -> init_per_testcase(_TestCase, Config) ->
clear_schemas(), clear_schemas(),
ok = snabbkaffe:start_trace(), ok = snabbkaffe:start_trace(),
@ -93,18 +145,14 @@ clear_schemas() ->
%% Testcases %% Testcases
%%------------------------------------------------------------------------------ %%------------------------------------------------------------------------------
t_crud(_Config) -> t_crud(Config) ->
SchemaName = <<"my_avro_schema">>, SerdeType = ?config(serde_type, Config),
Source = #{ SourceBin = ?config(schema_source, Config),
type => record, InvalidSourceBin = ?config(invalid_schema_source, Config),
fields => [ SerdeTypeBin = atom_to_binary(SerdeType),
#{name => <<"i">>, type => <<"int">>}, SchemaName = <<"my_schema">>,
#{name => <<"s">>, type => <<"string">>}
]
},
SourceBin = emqx_utils_json:encode(Source),
Params = #{ Params = #{
<<"type">> => <<"avro">>, <<"type">> => SerdeTypeBin,
<<"source">> => SourceBin, <<"source">> => SourceBin,
<<"name">> => SchemaName, <<"name">> => SchemaName,
<<"description">> => <<"My schema">> <<"description">> => <<"My schema">>
@ -138,7 +186,7 @@ t_crud(_Config) ->
%% create a schema %% create a schema
?assertMatch( ?assertMatch(
{ok, 201, #{ {ok, 201, #{
<<"type">> := <<"avro">>, <<"type">> := SerdeTypeBin,
<<"source">> := SourceBin, <<"source">> := SourceBin,
<<"name">> := SchemaName, <<"name">> := SchemaName,
<<"description">> := <<"My schema">> <<"description">> := <<"My schema">>
@ -147,7 +195,7 @@ t_crud(_Config) ->
), ),
?assertMatch( ?assertMatch(
{ok, 200, #{ {ok, 200, #{
<<"type">> := <<"avro">>, <<"type">> := SerdeTypeBin,
<<"source">> := SourceBin, <<"source">> := SourceBin,
<<"name">> := SchemaName, <<"name">> := SchemaName,
<<"description">> := <<"My schema">> <<"description">> := <<"My schema">>
@ -157,7 +205,7 @@ t_crud(_Config) ->
?assertMatch( ?assertMatch(
{ok, 200, [ {ok, 200, [
#{ #{
<<"type">> := <<"avro">>, <<"type">> := SerdeTypeBin,
<<"source">> := SourceBin, <<"source">> := SourceBin,
<<"name">> := SchemaName, <<"name">> := SchemaName,
<<"description">> := <<"My schema">> <<"description">> := <<"My schema">>
@ -168,7 +216,7 @@ t_crud(_Config) ->
UpdateParams1 = UpdateParams#{<<"description">> := <<"My new schema">>}, UpdateParams1 = UpdateParams#{<<"description">> := <<"My new schema">>},
?assertMatch( ?assertMatch(
{ok, 200, #{ {ok, 200, #{
<<"type">> := <<"avro">>, <<"type">> := SerdeTypeBin,
<<"source">> := SourceBin, <<"source">> := SourceBin,
<<"name">> := SchemaName, <<"name">> := SchemaName,
<<"description">> := <<"My new schema">> <<"description">> := <<"My new schema">>
@ -188,9 +236,9 @@ t_crud(_Config) ->
{ok, 400, #{ {ok, 400, #{
<<"code">> := <<"BAD_REQUEST">>, <<"code">> := <<"BAD_REQUEST">>,
<<"message">> := <<"message">> :=
<<"{post_config_update,emqx_ee_schema_registry,{not_found,<<\"type\">>}}">> <<"{post_config_update,emqx_ee_schema_registry,", _/binary>>
}}, }},
request({put, SchemaName, UpdateParams#{<<"source">> := <<"{}">>}}) request({put, SchemaName, UpdateParams#{<<"source">> := InvalidSourceBin}})
), ),
?assertMatch( ?assertMatch(
@ -229,9 +277,9 @@ t_crud(_Config) ->
{ok, 400, #{ {ok, 400, #{
<<"code">> := <<"BAD_REQUEST">>, <<"code">> := <<"BAD_REQUEST">>,
<<"message">> := <<"message">> :=
<<"{post_config_update,emqx_ee_schema_registry,{not_found,<<\"type\">>}}">> <<"{post_config_update,emqx_ee_schema_registry,", _/binary>>
}}, }},
request({post, Params#{<<"source">> := <<"{}">>}}) request({post, Params#{<<"source">> := InvalidSourceBin}})
), ),
%% unknown serde type %% unknown serde type

View File

@ -60,7 +60,25 @@ schema_params(avro) ->
] ]
}, },
SourceBin = emqx_utils_json:encode(Source), SourceBin = emqx_utils_json:encode(Source),
#{type => avro, source => SourceBin}. #{type => avro, source => SourceBin};
schema_params(protobuf) ->
SourceBin =
<<
"\n"
" message Person {\n"
" required string name = 1;\n"
" required int32 id = 2;\n"
" optional string email = 3;\n"
" }\n"
" message UnionValue {\n"
" oneof u {\n"
" int32 a = 1;\n"
" string b = 2;\n"
" }\n"
" }\n"
" "
>>,
#{type => protobuf, source => SourceBin}.
assert_roundtrip(SerdeName, Original) -> assert_roundtrip(SerdeName, Original) ->
Encoded = emqx_ee_schema_registry_serde:encode(SerdeName, Original), Encoded = emqx_ee_schema_registry_serde:encode(SerdeName, Original),
@ -119,3 +137,36 @@ t_serde_not_found(_Config) ->
emqx_ee_schema_registry_serde:decode(NonexistentSerde, Original) emqx_ee_schema_registry_serde:decode(NonexistentSerde, Original)
), ),
ok. ok.
t_roundtrip_protobuf(_Config) ->
SerdeName = my_serde,
Params = schema_params(protobuf),
ok = emqx_ee_schema_registry:add_schema(SerdeName, Params),
ExtraArgsPerson = [<<"Person">>],
Original0 = #{<<"name">> => <<"some name">>, <<"id">> => 10, <<"email">> => <<"emqx@emqx.io">>},
assert_roundtrip(SerdeName, Original0, ExtraArgsPerson, ExtraArgsPerson),
%% removing optional field
Original1 = #{<<"name">> => <<"some name">>, <<"id">> => 10},
assert_roundtrip(SerdeName, Original1, ExtraArgsPerson, ExtraArgsPerson),
%% `oneof' fields
ExtraArgsUnion = [<<"UnionValue">>],
Original2 = #{<<"a">> => 1},
assert_roundtrip(SerdeName, Original2, ExtraArgsUnion, ExtraArgsUnion),
Original3 = #{<<"b">> => <<"string">>},
assert_roundtrip(SerdeName, Original3, ExtraArgsUnion, ExtraArgsUnion),
ok.
t_protobuf_invalid_schema(_Config) ->
SerdeName = my_serde,
Params = schema_params(protobuf),
WrongParams = Params#{source := <<"xxxx">>},
?assertMatch(
{error, {post_config_update, _, {invalid_protobuf_schema, _}}},
emqx_ee_schema_registry:add_schema(SerdeName, WrongParams)
),
ok.

View File

@ -94,7 +94,7 @@ defmodule EMQXUmbrella.MixProject do
{:ranch, {:ranch,
github: "ninenines/ranch", ref: "a692f44567034dacf5efcaa24a24183788594eb7", override: true}, github: "ninenines/ranch", ref: "a692f44567034dacf5efcaa24a24183788594eb7", override: true},
# in conflict by grpc and eetcd # in conflict by grpc and eetcd
{:gpb, "4.19.5", override: true, runtime: false}, {:gpb, "4.19.7", override: true, runtime: false},
{:hackney, github: "emqx/hackney", tag: "1.18.1-1", override: true} {:hackney, github: "emqx/hackney", tag: "1.18.1-1", override: true}
] ++ ] ++
emqx_apps(profile_info, version) ++ emqx_apps(profile_info, version) ++

View File

@ -53,7 +53,7 @@
[ {lc, {git, "https://github.com/emqx/lc.git", {tag, "0.3.2"}}} [ {lc, {git, "https://github.com/emqx/lc.git", {tag, "0.3.2"}}}
, {redbug, "2.0.8"} , {redbug, "2.0.8"}
, {covertool, {git, "https://github.com/zmstone/covertool", {tag, "2.0.4.1"}}} , {covertool, {git, "https://github.com/zmstone/covertool", {tag, "2.0.4.1"}}}
, {gpb, "4.19.5"} %% gpb only used to build, but not for release, pin it here to avoid fetching a wrong version due to rebar plugins scattered in all the deps , {gpb, "4.19.7"}
, {typerefl, {git, "https://github.com/ieQu1/typerefl", {tag, "0.9.1"}}} , {typerefl, {git, "https://github.com/ieQu1/typerefl", {tag, "0.9.1"}}}
, {gun, {git, "https://github.com/emqx/gun", {tag, "1.3.9"}}} , {gun, {git, "https://github.com/emqx/gun", {tag, "1.3.9"}}}
, {ehttpc, {git, "https://github.com/emqx/ehttpc", {tag, "0.4.7"}}} , {ehttpc, {git, "https://github.com/emqx/ehttpc", {tag, "0.4.7"}}}

View File

@ -6,6 +6,12 @@ avro_type.desc:
avro_type.label: avro_type.label:
"""Apache Avro""" """Apache Avro"""
protobuf_type.desc:
"""[Protocol Buffers](https://protobuf.dev/) serialization format."""
protobuf_type.label:
"""Protocol Buffers"""
schema_description.desc: schema_description.desc:
"""A description for this schema.""" """A description for this schema."""

View File

@ -6,6 +6,12 @@ avro_type.desc:
avro_type.label: avro_type.label:
"""阿帕奇-阿夫罗""" """阿帕奇-阿夫罗"""
protobuf_type.desc:
"""[协议缓冲器](https://protobuf.dev/) 序列化格式。"""
protobuf_type.label:
"""协议缓冲器"""
schema_description.desc: schema_description.desc:
"""对该模式的描述。""" """对该模式的描述。"""