./ct_report/coverage/mod_mam_rdbms_arch.COVER.html

1 %%%-------------------------------------------------------------------
2 %%% @author Uvarov Michael <arcusfelis@gmail.com>
3 %%% @copyright (C) 2013, Uvarov Michael
4 %%% @doc RDBMS backend for Message Archive Management.
5 %%% @end
6 %%%-------------------------------------------------------------------
7 -module(mod_mam_rdbms_arch).
8
9 %% ----------------------------------------------------------------------
10 %% Exports
11
12 %% gen_mod handlers
13 -export([start/2, stop/1, hooks/1, supported_features/0]).
14
15 %% MAM hook handlers
16 -behaviour(ejabberd_gen_mam_archive).
17 -behaviour(gen_mod).
18 -behaviour(mongoose_module_metrics).
19
20 -callback encode(term()) -> binary().
21 -callback decode(binary()) -> term().
22
23 -export([archive_size/3,
24 archive_message/3,
25 lookup_messages/3,
26 remove_archive/3,
27 remove_domain/3,
28 get_mam_pm_gdpr_data/3]).
29
30 %% Called from mod_mam_rdbms_async_pool_writer
31 -export([prepare_message/2, retract_message/2, prepare_insert/2]).
32
33 -type host_type() :: mongooseim:host_type().
34
35 %% ----------------------------------------------------------------------
36 %% Imports
37
38 -include("mongoose.hrl").
39 -include("jlib.hrl").
40 -include("mongoose_mam.hrl").
41
42 %% ----------------------------------------------------------------------
43 %% Types
44
%% Environment map produced by env_vars/2 and handed to mam_encoder,
%% mam_decoder, mam_lookup and mam_lookup_sql. Every key is mandatory (`:=').
-type env_vars() :: #{
        host_type := host_type(),
        archive_jid := jid:jid(),
        table := atom(),
        index_hint_fn := fun((env_vars()) -> mam_lookup_sql:sql_part()),
        columns_sql_fn := fun((mam_lookup_sql:query_type()) -> mam_lookup_sql:sql_part()),
        column_to_id_fn := fun((mam_lookup_sql:column()) -> string()),
        lookup_fn := mam_lookup_sql:lookup_query_fn(),
        %% The decoded row is consumed as a map with id, jid and packet keys
        %% (see uniform_to_gdpr/1), i.e. mod_mam:message_row(), not a tuple.
        decode_row_fn := fun((Row :: tuple(), env_vars()) -> Decoded :: mod_mam:message_row()),
        has_message_retraction := boolean(),
        has_full_text_search := boolean(),
        db_jid_codec := module(),
        db_message_codec := module()
       }.
59
60 -export_type([env_vars/0]).
61
62 %% ----------------------------------------------------------------------
63 %% gen_mod callbacks
64 %% Starting and stopping functions for users' archives
65
%% gen_mod callback. Registers the prepared SQL statements of this backend;
%% the host type argument is not used.
-spec start(host_type(), gen_mod:module_opts()) -> ok.
start(_HostType, ModuleOpts) ->
    _ = register_prepared_queries(ModuleOpts),
    ok.
70
%% gen_mod callback. Nothing is torn down on stop.
-spec stop(host_type()) -> ok.
stop(_) ->
    ok.
74
%% gen_mod callback: the features this module declares support for.
-spec supported_features() -> [atom()].
supported_features() ->
    Features = [dynamic_domains],
    Features.
78
%% Hook handler collecting the archived messages of a user for GDPR export.
%% When mod_mam_pm knows no archive id for the user the accumulator is
%% returned untouched; otherwise one {MessID, RemoteJID, Packet} tuple of
%% binaries per archived row is prepended to it.
-spec get_mam_pm_gdpr_data(Acc, Params, Extra) -> {ok, Acc} when
    Acc :: ejabberd_gen_mam_archive:mam_pm_gdpr_data(),
    Params :: #{jid := jid:jid()},
    Extra :: gen_hook:extra().
get_mam_pm_gdpr_data(Acc,
                     #{jid := #jid{luser = LUser, lserver = LServer} = ArcJID},
                     #{host_type := HostType}) ->
    case mod_mam_pm:archive_id(LServer, LUser) of
        undefined ->
            {ok, Acc};
        ArcID ->
            Env = env_vars(HostType, ArcJID),
            {selected, Rows} = extract_gdpr_messages(Env, ArcID),
            Entries = [uniform_to_gdpr(row_to_uniform_format(Row, Env)) || Row <- Rows],
            {ok, Entries ++ Acc}
    end.
94
%% Converts a decoded message row into the all-binary triple used in the
%% GDPR export: message id, remote JID and serialized stanza.
-spec uniform_to_gdpr(mod_mam:message_row()) -> tuple().
uniform_to_gdpr(#{id := MessID, jid := RemoteJID, packet := Packet}) ->
    BinMessID = integer_to_binary(MessID),
    BinJID = jid:to_binary(RemoteJID),
    BinPacket = exml:to_binary(Packet),
    {BinMessID, BinJID, BinPacket}.
98
99 %% ----------------------------------------------------------------------
100 %% Add hooks for mod_mam_pm
101
%% gen_mod callback: hook handlers registered for the host type.
%% The mam_archive_message handler is left out when the no_writer module
%% option is true (presumably because another module, such as the async pool
%% writer, stores the messages then -- confirm against the configuration docs).
-spec hooks(mongooseim:host_type()) -> gen_hook:hook_list().
hooks(HostType) ->
    WriterHooks =
        case gen_mod:get_module_opt(HostType, ?MODULE, no_writer) of
            true ->
                [];
            false ->
                [{mam_archive_message, HostType, fun ?MODULE:archive_message/3, #{}, 50}]
        end,
    CommonHooks =
        [{mam_archive_size, HostType, fun ?MODULE:archive_size/3, #{}, 50},
         {mam_lookup_messages, HostType, fun ?MODULE:lookup_messages/3, #{}, 50},
         {mam_remove_archive, HostType, fun ?MODULE:remove_archive/3, #{}, 50},
         {get_mam_pm_gdpr_data, HostType, fun ?MODULE:get_mam_pm_gdpr_data/3, #{}, 50},
         {remove_domain, HostType, fun ?MODULE:remove_domain/3, #{}, 50}],
    WriterHooks ++ CommonHooks.
115
116 %% ----------------------------------------------------------------------
117 %% SQL queries
118
%% Prepares every statement this module executes later: the single-row insert,
%% archive removal, the domain-removal statements (chosen by Opts), the
%% tombstone update and the two selects used to find a message to retract.
%% Returns the result of the last mongoose_rdbms:prepare/4 call.
register_prepared_queries(Opts) ->
    prepare_insert(insert_mam_message, 1),

    RemoveArchiveSQL = <<"DELETE FROM mam_message "
                         "WHERE user_id = ?">>,
    mongoose_rdbms:prepare(mam_archive_remove, mam_message, [user_id], RemoveArchiveSQL),

    %% Domain removal
    prepare_remove_domain(Opts),

    TombstoneSQL = <<"UPDATE mam_message SET message = ?, search_body = '' "
                     "WHERE user_id = ? AND id = ?">>,
    mongoose_rdbms:prepare(mam_make_tombstone, mam_message, [message, user_id, id],
                           TombstoneSQL),

    %% Both retraction selects fetch at most one row; the limit is spliced in
    %% either right after SELECT (LimitMSSQL) or at the end (LimitSQL).
    {LimitSQL, LimitMSSQL} = rdbms_queries:get_db_specific_limits_binaries(1),
    ByOriginIdSQL = <<"SELECT ", LimitMSSQL/binary,
                      " id, message FROM mam_message"
                      " WHERE user_id = ? AND remote_bare_jid = ? "
                      " AND origin_id = ? AND direction = ?"
                      " ORDER BY id DESC ", LimitSQL/binary>>,
    mongoose_rdbms:prepare(mam_select_messages_to_retract_on_origin_id, mam_message,
                           [user_id, remote_bare_jid, origin_id, direction],
                           ByOriginIdSQL),
    ByStanzaIdSQL = <<"SELECT ", LimitMSSQL/binary,
                      " origin_id, message FROM mam_message"
                      " WHERE user_id = ? AND remote_bare_jid = ? "
                      " AND id = ? AND direction = ?"
                      " ORDER BY id DESC ", LimitSQL/binary>>,
    mongoose_rdbms:prepare(mam_select_messages_to_retract_on_stanza_id, mam_message,
                           [user_id, remote_bare_jid, id, direction],
                           ByStanzaIdSQL).
146
%% Prepares the statements used by remove_domain/3.
%% With delete_domain_limit = infinity three plain DELETEs are prepared
%% (messages, preferences, users). With a numeric limit the incremental
%% variants are prepared instead, each deleting rows selected by a limited
%% sub-query; this throws delete_domain_limit_not_supported_for_mssql when
%% mongoose_rdbms:db_type() is mssql.
prepare_remove_domain(#{delete_domain_limit := infinity}) ->
    MessagesSQL = <<"DELETE FROM mam_message "
                    "WHERE user_id IN "
                    "(SELECT id from mam_server_user WHERE server = ?)">>,
    mongoose_rdbms:prepare(mam_remove_domain, mam_message, ['mam_server_user.server'],
                           MessagesSQL),
    PrefsSQL = <<"DELETE FROM mam_config "
                 "WHERE user_id IN "
                 "(SELECT id from mam_server_user WHERE server = ?)">>,
    mongoose_rdbms:prepare(mam_remove_domain_prefs, mam_config, ['mam_server_user.server'],
                           PrefsSQL),
    UsersSQL = <<"DELETE FROM mam_server_user WHERE server = ?">>,
    mongoose_rdbms:prepare(mam_remove_domain_users, mam_server_user, [server], UsersSQL);
prepare_remove_domain(#{delete_domain_limit := Limit}) ->
    LimitSQL =
        case mongoose_rdbms:db_type() of
            mssql ->
                throw(delete_domain_limit_not_supported_for_mssql);
            _ ->
                {TrailingLimit, _} = rdbms_queries:get_db_specific_limits_binaries(Limit),
                TrailingLimit
        end,
    %% Each limited sub-select is wrapped in an outer "SELECT * FROM (...)"
    %% derived table before being used in the IN clause.
    MessagesSQL = <<"DELETE FROM mam_message WHERE (user_id, id) IN "
                    "(SELECT * FROM "
                    "(SELECT msg.user_id, msg.id FROM mam_message msg"
                    " INNER JOIN mam_server_user msu ON msu.id=msg.user_id"
                    " WHERE msu.server = ? ", LimitSQL/binary, ") AS T)">>,
    mongoose_rdbms:prepare(mam_incr_remove_domain, mam_message, ['mam_server_user.server'],
                           MessagesSQL),
    PrefsSQL = <<"DELETE FROM mam_config "
                 "WHERE (user_id, remote_jid) IN "
                 "(SELECT * FROM "
                 "(SELECT cfg.user_id, cfg.remote_jid FROM mam_config cfg"
                 " INNER JOIN mam_server_user msu ON msu.id=cfg.user_id"
                 " WHERE msu.server = ? ", LimitSQL/binary, ") AS T)">>,
    mongoose_rdbms:prepare(mam_incr_remove_domain_prefs, mam_config, ['mam_server_user.server'],
                           PrefsSQL),
    UsersSQL = <<"DELETE FROM mam_server_user WHERE id IN "
                 "(SELECT * FROM "
                 "(SELECT id FROM mam_server_user WHERE server = ? ", LimitSQL/binary, ") as t)">>,
    mongoose_rdbms:prepare(mam_incr_remove_domain_users, mam_server_user, [server],
                           UsersSQL).
181
182
183 %% ----------------------------------------------------------------------
184 %% Declarative logic
185
%% Column layout of mam_message: one entry per database field, in the order
%% used for inserts (see prepare_insert/2). Each entry names the column, the
%% archive parameter it is filled from and the encoding format.
db_mappings() ->
    Map = fun(Column, Param, Format) ->
                  #db_mapping{column = Column, param = Param, format = Format}
          end,
    [Map(id, message_id, int),
     Map(user_id, archive_id, int),
     Map(remote_bare_jid, remote_jid, bare_jid),
     Map(remote_resource, remote_jid, jid_resource),
     Map(direction, direction, direction),
     Map(from_jid, source_jid, jid),
     Map(origin_id, origin_id, maybe_string),
     Map(message, packet, xml),
     Map(search_body, packet, search)].
197
%% Every filtering option a lookup may use: comparison operator, the column
%% it applies to and the lookup parameter supplying the value.
%% Only the user_id filter is marked as required.
lookup_fields() ->
    [#lookup_field{column = user_id, op = equal, param = archive_id, required = true},
     #lookup_field{column = id, op = ge, param = start_id},
     #lookup_field{column = id, op = le, param = end_id},
     #lookup_field{column = remote_bare_jid, op = equal, param = remote_bare_jid},
     #lookup_field{column = remote_resource, op = equal, param = remote_resource},
     #lookup_field{column = search_body, op = like, param = norm_search_text,
                   value_maker = search_words}].
206
%% Builds the environment map for one archive: the target table, the SQL
%% helper funs of this module, and the feature flags and codecs read from
%% mod_mam_utils.
-spec env_vars(host_type(), jid:jid()) -> env_vars().
env_vars(HostType, ArcJID) ->
    HasRetraction = mod_mam_utils:has_message_retraction(mod_mam_pm, HostType),
    HasFullTextSearch = mod_mam_utils:has_full_text_search(mod_mam_pm, HostType),
    JidCodec = mod_mam_utils:db_jid_codec(HostType, ?MODULE),
    MessageCodec = mod_mam_utils:db_message_codec(HostType, ?MODULE),
    %% Keep uses of the host_type field to a minimum:
    %% it is only there to be passed into RDBMS calls.
    #{host_type => HostType,
      archive_jid => ArcJID,
      table => mam_message,
      index_hint_fn => fun index_hint_sql/1,
      columns_sql_fn => fun columns_sql/1,
      column_to_id_fn => fun column_to_id/1,
      lookup_fn => fun lookup_query/5,
      decode_row_fn => fun row_to_uniform_format/2,
      has_message_retraction => HasRetraction,
      has_full_text_search => HasFullTextSearch,
      db_jid_codec => JidCodec,
      db_message_codec => MessageCodec}.
223
%% Decodes one database row via mam_decoder; installed as decode_row_fn
%% in the map built by env_vars/2.
row_to_uniform_format(DbRow, Env) ->
    mam_decoder:decode_row(DbRow, Env).
226
%% SQL index hint for lookups: a USE INDEX clause on MySQL, an empty
%% string on every other engine.
-spec index_hint_sql(env_vars()) -> string().
index_hint_sql(#{host_type := HostType}) ->
    Engine = mongoose_rdbms:db_engine(HostType),
    case Engine of
        mysql ->
            "USE INDEX(PRIMARY, i_mam_message_rem) ";
        _ ->
            ""
    end.
233
%% Select list for each query type: the message columns for a lookup,
%% a row count for a count query.
columns_sql(lookup) ->
    "id, from_jid, message";
columns_sql(count) ->
    "COUNT(*)".
236
%% One-letter identifier for each distinct column named in lookup_fields().
column_to_id(id) ->
    "i";
column_to_id(user_id) ->
    "u";
column_to_id(remote_bare_jid) ->
    "b";
column_to_id(remote_resource) ->
    "r";
column_to_id(search_body) ->
    "s".
243
%% Extracts the column name of every #db_mapping{} in the list, in order.
%% Elements that are not #db_mapping{} records are skipped.
column_names(Mappings) ->
    lists:filtermap(fun(#db_mapping{column = Name}) -> {true, Name};
                       (_Other) -> false
                    end, Mappings).
246
247 %% ----------------------------------------------------------------------
248 %% Options
249
%% Asks mod_mam_utils for the retraction id carried by the packet, passing
%% along the has_message_retraction flag from the environment.
-spec get_retract_id(exml:element(), env_vars()) -> none | mod_mam_utils:retraction_id().
get_retract_id(Packet, #{has_message_retraction := IsEnabled}) ->
    mod_mam_utils:get_retract_id(IsEnabled, Packet).
253
254 %% ----------------------------------------------------------------------
255 %% Internal functions and callbacks
256
%% Hook handler returning the number of rows stored for the archive id.
%% The incoming accumulator is only checked to be an integer; the result
%% replaces it.
-spec archive_size(Acc, Params, Extra) -> {ok, Acc} when
    Acc :: integer(),
    Params :: #{archive_id := mod_mam:archive_id() | undefined, owner := jid:jid()},
    Extra :: gen_hook:extra().
archive_size(Size, #{archive_id := ArcID, owner := ArcJID}, #{host_type := HostType})
  when is_integer(Size) ->
    Env = env_vars(HostType, ArcJID),
    CountResult = lookup_query(count, Env, [{equal, user_id, ArcID}], unordered, all),
    {ok, mongoose_rdbms:selected_to_integer(CountResult)}.
266
%% Hook handler storing one message and then applying message retraction
%% if the stored packet asks for it. Exceptions of class error are logged
%% and re-raised with their original stacktrace.
-spec archive_message(Acc, Params, Extra) -> {ok, Acc} when
    Acc :: ok,
    Params :: mod_mam:archive_message_params(),
    Extra :: gen_hook:extra().
archive_message(_Result, #{local_jid := ArcJID} = Params, #{host_type := HostType}) ->
    try
        assert_archive_id_provided(Params),
        Env = env_vars(HostType, ArcJID),
        do_archive_message(HostType, Params, Env),
        retract_message(HostType, Params, Env),
        {ok, ok}
    catch
        error:Why:Trace ->
            ?LOG_ERROR(#{what => archive_message_failed,
                         host_type => HostType, mam_params => Params,
                         reason => Why, stacktrace => Trace}),
            erlang:raise(error, Why, Trace)
    end.
284
%% Encodes the message into a row and inserts it; crashes with badmatch
%% unless exactly one row was inserted.
do_archive_message(HostType, Params, Env) ->
    EncodedRow = mam_encoder:encode_message(Params, Env, db_mappings()),
    {updated, 1} = mongoose_rdbms:execute_successfully(HostType, insert_mam_message,
                                                       EncodedRow).
288
289 %% Retraction logic
290 %% Called after inserting a new message
%% Exported variant that builds the environment from the local_jid of the
%% params and delegates to retract_message/3.
-spec retract_message(host_type(), mod_mam:archive_message_params()) -> ok.
retract_message(HostType, #{local_jid := ArcJID} = Params) ->
    retract_message(HostType, Params, env_vars(HostType, ArcJID)).
295
%% Applies message retraction for a just-archived packet.
%% If the packet carries no retraction id nothing happens. Otherwise the
%% message to retract is looked up and replaced by a tombstone (or the miss
%% is logged by make_tombstone/6).
%% Always returns ok, as the spec promises: the result of the tombstone
%% UPDATE is deliberately discarded instead of leaking to the caller.
-spec retract_message(host_type(), mod_mam:archive_message_params(), env_vars()) -> ok.
retract_message(HostType, #{archive_id := ArcID, remote_jid := RemJID,
                            direction := Dir, packet := Packet} = Params, Env) ->
    case get_retract_id(Packet, Env) of
        none ->
            ok;
        RetractionId ->
            Info = get_retraction_info(HostType, ArcID, RemJID, RetractionId, Dir, Env),
            _ = make_tombstone(HostType, ArcID, RetractionId, Info, Params, Env),
            ok
    end.
305
%% Looks up the message targeted by a retraction and lets mam_decoder turn
%% the selected rows into retraction info.
get_retraction_info(HostType, ArcID, RemJID, RetractionId, Dir, Env) ->
    %% Code style notice:
    %% - The Ext prefix marks externally encoded data
    %%   (where Bin, B, S or Esc prefixes would usually be used).
    ExtDir = mam_encoder:encode_direction(Dir),
    ExtBareRemJID = mam_encoder:encode_jid(jid:to_bare(RemJID), Env),
    {selected, Rows} =
        execute_select_messages_to_retract(HostType, ArcID, ExtBareRemJID,
                                           RetractionId, ExtDir),
    mam_decoder:decode_retraction_info(Env, Rows, RetractionId).
315
%% Replaces the retracted message with a tombstone.
%% With retraction info `skip' only an info-level log entry is written.
%% Otherwise the info is passed through the mam_retraction hook, turned into
%% a tombstone packet, encoded, and written over the original row.
make_tombstone(_HostType, ArcID, RetractionId, skip, _Params, _Env) ->
    ?LOG_INFO(#{what => make_tombstone_failed,
                text => <<"Message to retract was not found">>,
                user_id => ArcID, retraction_context => RetractionId});
make_tombstone(HostType, ArcID, _RetractionId,
               #{message_id := MessID} = RetractionInfo, Params,
               #{archive_jid := ArcJID} = Env) ->
    HookedInfo = mongoose_hooks:mam_retraction(HostType, RetractionInfo, Params),
    TombstonePacket = mod_mam_utils:tombstone(HookedInfo, ArcJID),
    EncodedTombstone = mam_encoder:encode_packet(TombstonePacket, Env),
    execute_make_tombstone(HostType, EncodedTombstone, ArcID, MessID).
327
%% Runs the prepared select matching the kind of retraction id:
%% by origin id, or by stanza id (converted to a message id first).
execute_select_messages_to_retract(HostType, ArcID, BareRemJID, {origin_id, OriginID}, Dir) ->
    Args = [ArcID, BareRemJID, OriginID, Dir],
    mongoose_rdbms:execute_successfully(HostType, mam_select_messages_to_retract_on_origin_id,
                                        Args);
execute_select_messages_to_retract(HostType, ArcID, BareRemJID, {stanza_id, BinStanzaId}, Dir) ->
    MessID = mod_mam_utils:external_binary_to_mess_id(BinStanzaId),
    Args = [ArcID, BareRemJID, MessID, Dir],
    mongoose_rdbms:execute_successfully(HostType, mam_select_messages_to_retract_on_stanza_id,
                                        Args).
335
%% Executes the prepared mam_make_tombstone UPDATE for one message.
execute_make_tombstone(HostType, TombstoneData, ArcID, MessID) ->
    Args = [TombstoneData, ArcID, MessID],
    mongoose_rdbms:execute_successfully(HostType, mam_make_tombstone, Args).
339
340 %% Insert logic
%% Encodes a message into the list of column values expected by the
%% insert statement, without executing anything.
-spec prepare_message(host_type(), mod_mam:archive_message_params()) -> list().
prepare_message(HostType, #{local_jid := ArcJID} = Params) ->
    mam_encoder:encode_message(Params, env_vars(HostType, ArcJID), db_mappings()).
345
%% Prepares, under the given name, a bulk insert into mam_message for
%% NumRows rows covering every column listed in db_mappings().
-spec prepare_insert(Name :: atom(), NumRows :: pos_integer()) -> ok.
prepare_insert(Name, NumRows) ->
    Columns = column_names(db_mappings()),
    {InsertSQL, AllFields} =
        rdbms_queries:create_bulk_insert_query(mam_message, Columns, NumRows),
    mongoose_rdbms:prepare(Name, mam_message, AllFields, InsertSQL),
    ok.
353
354 %% Removal logic
%% Hook handler deleting every stored message of one archive id.
%% The accumulator is passed through unchanged.
-spec remove_archive(Acc, Params, Extra) -> {ok, Acc} when
    Acc :: term(),
    Params :: #{archive_id := mod_mam:archive_id() | undefined, owner := jid:jid()},
    Extra :: gen_hook:extra().
remove_archive(Acc, #{archive_id := ArcID}, #{host_type := HostType}) ->
    _ = mongoose_rdbms:execute_successfully(HostType, mam_archive_remove, [ArcID]),
    {ok, Acc}.
362
%% Hook handler removing all MAM data of a domain. The work is wrapped by
%% mongoose_domain_api:remove_domain_wrapper/3; depending on the
%% delete_domain_limit option everything is deleted at once or in batches.
-spec remove_domain(Acc, Params, Extra) -> {ok | stop, Acc} when
    Acc :: mongoose_domain_api:remove_domain_acc(),
    Params :: map(),
    Extra :: gen_hook:extra().
remove_domain(Acc, #{domain := Domain}, #{host_type := HostType}) ->
    Removal =
        fun() ->
            %% The option is read inside the fun, i.e. under the wrapper.
            case gen_mod:get_module_opt(HostType, ?MODULE, delete_domain_limit) of
                infinity ->
                    remove_domain_all(HostType, Domain);
                Limit ->
                    remove_domain_batch(HostType, Domain, Limit)
            end,
            Acc
        end,
    mongoose_domain_api:remove_domain_wrapper(Acc, Removal, ?MODULE).
376
%% Deletes messages, preferences and user records of a domain inside one
%% SQL transaction; crashes with badmatch unless the transaction is atomic.
-spec remove_domain_all(host_type(), jid:lserver()) -> any().
remove_domain_all(HostType, Domain) ->
    DeleteEverything =
        fun() ->
            mongoose_rdbms:execute_successfully(HostType, mam_remove_domain, [Domain]),
            mongoose_rdbms:execute_successfully(HostType, mam_remove_domain_prefs, [Domain]),
            mongoose_rdbms:execute_successfully(HostType, mam_remove_domain_users, [Domain])
        end,
    {atomic, _} = mongoose_rdbms:sql_transaction(HostType, DeleteEverything).
384
%% Deletes the MAM data of a domain through
%% mod_mam_utils:incremental_delete_domain/5 using the limited statements,
%% then logs the total number of deleted records.
-spec remove_domain_batch(host_type(), jid:lserver(), non_neg_integer()) -> any().
remove_domain_batch(HostType, Domain, Limit) ->
    Queries = [mam_incr_remove_domain,
               mam_incr_remove_domain_prefs,
               mam_incr_remove_domain_users],
    Deleted = mod_mam_utils:incremental_delete_domain(HostType, Domain, Limit, Queries, 0),
    ?LOG_INFO(#{what => mam_domain_removal_completed, total_records_deleted => Deleted,
                domain => Domain, host_type => HostType}).
391
392 %% GDPR logic
%% Selects every message of the archive id in ascending order, without
%% any offset or limit.
extract_gdpr_messages(Env, ArcID) ->
    lookup_query(lookup, Env, [{equal, user_id, ArcID}], asc, all).
396
397 %% Lookup logic
%% Hook handler performing a MAM lookup.
%% An {error, _} accumulator from an earlier handler is passed through
%% untouched; any other accumulator is ignored and replaced by the result of
%% mam_lookup:lookup/3.
-spec lookup_messages(Acc, Params, Extra) -> {ok, Acc} when
    Acc :: {ok, mod_mam:lookup_result()},
    Params :: mam_iq:lookup_params(),
    Extra :: gen_hook:extra().
lookup_messages({error, _Reason} = Failure, _Params, _Extra) ->
    {ok, Failure};
lookup_messages(_Result, #{owner_jid := ArcJID} = Params, #{host_type := HostType}) ->
    Env = env_vars(HostType, ArcJID),
    ExtendedParams = mam_encoder:extend_lookup_params(Params, Env),
    Filter = mam_filter:produce_filter(ExtendedParams, lookup_fields()),
    LookupResult = mam_lookup:lookup(Env, Filter, ExtendedParams),
    {ok, LookupResult}.
409
%% Thin wrapper around mam_lookup_sql:lookup_query/5; installed as
%% lookup_fn in the map built by env_vars/2.
lookup_query(QueryType, Env, Filters, Order, OffsetLimit) ->
    mam_lookup_sql:lookup_query(QueryType, Env,
                                Filters, Order, OffsetLimit).
412
%% Assertion: the params must carry an integer archive_id.
%% Anything else fails with function_clause.
assert_archive_id_provided(#{archive_id := ArchiveId}) when is_integer(ArchiveId) ->
    ok.
Line Hits Source