syn_test_suite_helper.erl 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378
  1. %% ==========================================================================================================
  2. %% Syn - A global Process Registry and Process Group manager.
  3. %%
  4. %% The MIT License (MIT)
  5. %%
  6. %% Copyright (c) 2015-2021 Roberto Ostinelli <roberto@ostinelli.net> and Neato Robotics, Inc.
  7. %%
  8. %% Permission is hereby granted, free of charge, to any person obtaining a copy
  9. %% of this software and associated documentation files (the "Software"), to deal
  10. %% in the Software without restriction, including without limitation the rights
  11. %% to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  12. %% copies of the Software, and to permit persons to whom the Software is
  13. %% furnished to do so, subject to the following conditions:
  14. %%
  15. %% The above copyright notice and this permission notice shall be included in
  16. %% all copies or substantial portions of the Software.
  17. %%
  18. %% THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19. %% IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20. %% FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  21. %% AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  22. %% LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  23. %% OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  24. %% THE SOFTWARE.
  25. %% ==========================================================================================================
  26. -module(syn_test_suite_helper).
  27. %% API
  28. -export([init_cluster/1, end_cluster/2]).
  29. -export([start_slave/1, stop_slave/1]).
  30. -export([connect_node/1, disconnect_node/1]).
  31. -export([clean_after_test/0]).
  32. -export([start_process/0, start_process/1, start_process/2]).
  33. -export([kill_process/1]).
  34. -export([wait_cluster_mesh_connected/1]).
  35. -export([wait_process_name_ready/1, wait_process_name_ready/2]).
  36. -export([wait_message_queue_empty/0]).
  37. -export([assert_cluster/2]).
  38. -export([assert_registry_scope_subcluster/3, assert_pg_scope_subcluster/3]).
  39. -export([assert_received_messages/1]).
  40. -export([assert_empty_queue/0]).
  41. -export([assert_wait/2]).
  42. -export([send_error_logger_to_disk/0]).
  43. %% internal
  44. -export([process_main/0]).
  45. %% macro
  46. -define(DEFAULT_WAIT_TIMEOUT, 5000).
  47. -define(UNEXPECTED_MESSAGES_WAIT_TIMEOUT, 1000).
  48. %% ===================================================================
  49. %% API
  50. %% ===================================================================
  %% Boots `NodesCount - 1' slave nodes named syn_slave_1 .. syn_slave_N.
  %% Each freshly started slave is asked (via rpc) to connect to every slave
  %% started before it; afterwards the full mesh (this node plus all slaves)
  %% is awaited.
  %%
  %% Returns the `[{NodeShortName, SlaveNode}]' list (most recently started
  %% slave first) when the mesh is connected, otherwise
  %% `{error_initializing_cluster, Reason}'.
  init_cluster(NodesCount) ->
      LastIndex = NodesCount - 1,
      StartAndConnect = fun(Index, {StartedNodes, ConfigAcc}) ->
          ShortName = list_to_atom("syn_slave_" ++ integer_to_list(Index)),
          {ok, Slave} = start_slave(ShortName),
          %% the new slave dials every slave that is already up
          lists:foreach(
              fun(Peer) -> rpc:call(Slave, syn_test_suite_helper, connect_node, [Peer]) end,
              StartedNodes
          ),
          {[Slave | StartedNodes], [{ShortName, Slave} | ConfigAcc]}
      end,
      {Slaves, SlavesConfig} = lists:foldl(StartAndConnect, {[], []}, lists:seq(1, LastIndex)),
      %% wait full cluster
      case syn_test_suite_helper:wait_cluster_mesh_connected([node() | Slaves]) of
          ok ->
              SlavesConfig;
          Failure ->
              ct:pal("*********** Could not get full cluster of ~p nodes, skipping", [NodesCount]),
              {error_initializing_cluster, Failure}
      end.
  %% Tears down a cluster created by init_cluster/1.
  %% Cleans syn on all nodes, then for each slave index looks the node up in
  %% `Config' (the list returned by init_cluster/1), connects to it and stops
  %% it. Finally sleeps for one second.
  end_cluster(NodesCount, Config) ->
      LastIndex = NodesCount - 1,
      %% clean
      clean_after_test(),
      %% shutdown
      StopSlave = fun(Index) ->
          ShortName = list_to_atom("syn_slave_" ++ integer_to_list(Index)),
          Slave = proplists:get_value(ShortName, Config),
          %% presumably reconnects nodes a test disconnected, so the stop request can reach them
          connect_node(Slave),
          stop_slave(ShortName)
      end,
      lists:foreach(StopSlave, lists:seq(1, LastIndex)),
      %% wait
      timer:sleep(1000).
  %% Starts a ct_slave node with automatic distribution connections disabled
  %% and restricts its code path to the local code path entries containing
  %% "/syn/". Returns `{ok, Node}'; crashes (badmatch) if the slave cannot be
  %% started or its code path cannot be set.
  start_slave(NodeShortName) ->
      SlaveOptions = [
          {boot_timeout, 10},
          {erl_flags, "-connect_all false -kernel dist_auto_connect never"}
      ],
      {ok, Node} = ct_slave:start(NodeShortName, SlaveOptions),
      %% add syn code path to slaves
      SynPaths = [Path || Path <- code:get_path(), string:find(Path, "/syn/") =/= nomatch],
      true = rpc:call(Node, code, set_path, [SynPaths]),
      {ok, Node}.
  %% Stops the ct_slave node with the given short name and returns the
  %% `{ok, _}' result of ct_slave:stop/1; any other result is a badmatch.
  stop_slave(NodeShortName) ->
      {ok, _StoppedNode} = ct_slave:stop(NodeShortName).
  %% Connects the calling node to `Node' and returns the result of
  %% net_kernel:connect_node/1 unchanged.
  connect_node(Node) ->
      net_kernel:connect_node(Node).
  %% Disconnects the calling node from `Node' and returns the result of
  %% erlang:disconnect_node/1 unchanged.
  disconnect_node(Node) ->
      erlang:disconnect_node(Node).
  %% Resets syn on this node and on every connected node: stops the syn
  %% application, unsets its `event_handler' environment value, and drains the
  %% caller's mailbox after each node has been handled. Returns `ok'.
  clean_after_test() ->
      CleanNode = fun(Node) ->
          %% close syn
          rpc:call(Node, application, stop, [syn]),
          %% clean env
          rpc:call(Node, application, unset_env, [syn, event_handler]),
          %% drop whatever the shutdown delivered to the calling process
          flush_inbox()
      end,
      lists:foreach(CleanNode, [node() | nodes()]).
  %% Spawns a local process running process_main/0 and returns its pid.
  start_process() ->
      spawn(fun process_main/0).
  %% With a node name: spawns process_main/0 on that node.
  %% With a fun: spawns the fun locally.
  %% Returns the pid of the spawned process in both cases.
  start_process(Node) when is_atom(Node) ->
      spawn(Node, fun process_main/0);
  start_process(Loop) when is_function(Loop) ->
      spawn(Loop).
  %% Spawns `Loop' on `Node' and returns the pid of the spawned process.
  start_process(Node, Loop) ->
      spawn(Node, Loop).
  %% Kills a process given either its locally registered name or its pid.
  %% Returns `ok' when the name is not registered, when the process is already
  %% dead, or once its 'DOWN' message has been received. Fails the test if
  %% the process does not go down within ?DEFAULT_WAIT_TIMEOUT milliseconds.
  kill_process(RegisteredName) when is_atom(RegisteredName) ->
      case whereis(RegisteredName) of
          undefined -> ok;
          Pid -> kill_process(Pid)
      end;
  kill_process(Pid) when is_pid(Pid) ->
      %% liveness is checked on the node that owns the pid
      case rpc:call(node(Pid), erlang, is_process_alive, [Pid]) of
          false -> ok;
          true -> kill_and_await_down(Pid)
      end.

  %% Monitors `Pid', sends it an untrappable kill signal and waits for the
  %% matching 'DOWN' message.
  kill_and_await_down(Pid) ->
      MonitorRef = monitor(process, Pid),
      exit(Pid, kill),
      receive
          {'DOWN', MonitorRef, process, Pid, _Reason} -> ok
      after ?DEFAULT_WAIT_TIMEOUT ->
          ct:fail("~n\tCould not kill process ~p~n", [Pid])
      end.
  %% Waits until every node in `Nodes' sees exactly the other nodes of `Nodes'
  %% (a fully connected mesh), polling every 50 ms.
  %%
  %% Returns `ok' once the mesh is complete, or
  %% `{error, {could_not_init_cluster, Nodes}}' when it has not formed within
  %% ?DEFAULT_WAIT_TIMEOUT milliseconds.
  wait_cluster_mesh_connected(Nodes) ->
      %% monotonic time: the elapsed-time check must not be affected by wall clock adjustments
      wait_cluster_mesh_connected(Nodes, erlang:monotonic_time(millisecond)).

  wait_cluster_mesh_connected(Nodes, StartAt) ->
      ExpectedNodes = lists:sort(Nodes),
      SeesFullMesh = fun(Node) ->
          case rpc:call(Node, erlang, nodes, []) of
              RemoteNodes when is_list(RemoteNodes) ->
                  lists:sort([Node | RemoteNodes]) =:= ExpectedNodes;
              {badrpc, _Reason} ->
                  %% node not reachable (yet): treat as "not connected" and keep polling
                  false
          end
      end,
      case lists:all(SeesFullMesh, Nodes) of
          true ->
              ok;
          false ->
              case erlang:monotonic_time(millisecond) - StartAt > ?DEFAULT_WAIT_TIMEOUT of
                  true ->
                      {error, {could_not_init_cluster, Nodes}};
                  false ->
                      timer:sleep(50),
                      wait_cluster_mesh_connected(Nodes, StartAt)
              end
      end.
  %% Waits until a process is registered locally under `Name' and its status
  %% is `waiting'. Polls every 50 ms (the sleep happens before each check).
  %% Returns `ok' when ready; fails the test once more than
  %% ?DEFAULT_WAIT_TIMEOUT milliseconds have elapsed since `StartAt'.
  %%
  %% `StartAt' is a timestamp in milliseconds as returned by
  %% os:system_time(millisecond).
  wait_process_name_ready(Name) ->
      wait_process_name_ready(Name, os:system_time(millisecond)).

  wait_process_name_ready(Name, StartAt) ->
      timer:sleep(50),
      Probe =
          case whereis(Name) of
              undefined -> not_registered;
              Pid -> process_info(Pid, status)
          end,
      case Probe of
          {status, waiting} ->
              ok;
          _NotReady ->
              TimedOut = os:system_time(millisecond) - StartAt > ?DEFAULT_WAIT_TIMEOUT,
              case {TimedOut, Probe} of
                  {false, _} ->
                      wait_process_name_ready(Name, StartAt);
                  {true, not_registered} ->
                      ct:fail("~n\tProcess with name ~p didn't come alive~n", [Name]);
                  {true, Status} ->
                      ct:fail("~n\tProcess with name ~p didn't come ready~n\tStatus: ~p~n", [Name, Status])
              end
      end.
  %% Sleeps 500 ms, then drains the caller's mailbox and asserts that no
  %% further message shows up (see assert_empty_queue/0). Returns `ok'.
  wait_message_queue_empty() ->
      timer:sleep(500),
      syn_test_suite_helper:assert_wait(
          ok,
          fun() ->
              flush_inbox(),
              %% assert_empty_queue/0 is the exported arity and inspects the caller's own
              %% mailbox; the previous call passed self() to a non-exported /1 (undef)
              syn_test_suite_helper:assert_empty_queue()
          end
      ).
  %% Asserts that the nodes `Node' is connected to (erlang:nodes/0 evaluated
  %% on `Node') are exactly `ExpectedNodes', retrying until
  %% do_assert_cluster/3 either accepts the list or fails the test on timeout.
  %% Returns `ok'.
  assert_cluster(Node, ExpectedNodes) ->
      assert_cluster(Node, ExpectedNodes, os:system_time(millisecond)).

  assert_cluster(Node, ExpectedNodes, StartAt) ->
      ConnectedNodes = rpc:call(Node, erlang, nodes, []),
      case do_assert_cluster(ConnectedNodes, ExpectedNodes, StartAt) of
          continue ->
              %% not matching yet and still within the timeout: poll again
              assert_cluster(Node, ExpectedNodes, StartAt);
          _Done ->
              ok
      end.
  %% Asserts that the `registry' subcluster of `Scope', as seen from `Node',
  %% consists of exactly `ExpectedNodes'.
  assert_registry_scope_subcluster(Node, Scope, ExpectedNodes) ->
      do_assert_scope_subcluster(registry, Node, Scope, ExpectedNodes).
  %% Asserts that the `pg' subcluster of `Scope', as seen from `Node',
  %% consists of exactly `ExpectedNodes'.
  assert_pg_scope_subcluster(Node, Scope, ExpectedNodes) ->
      do_assert_scope_subcluster(pg, Node, Scope, ExpectedNodes).
  %% Asserts that the calling process receives exactly the messages in
  %% `Messages', in any order. Each received message that is listed is ticked
  %% off once; anything else is collected as unexpected. When all expected
  %% messages have arrived, a short extra wait catches stray messages. If no
  %% message arrives for ?DEFAULT_WAIT_TIMEOUT milliseconds the outcome is
  %% evaluated with whatever is still missing.
  assert_received_messages(Messages) ->
      assert_received_messages(Messages, []).

  assert_received_messages([], UnexpectedMessages) ->
      assert_received_messages_wait([], UnexpectedMessages);
  assert_received_messages(Messages, UnexpectedMessages) ->
      receive
          Message ->
              {StillMissing, Strays} =
                  case lists:member(Message, Messages) of
                      true -> {lists:delete(Message, Messages), UnexpectedMessages};
                      false -> {Messages, [Message | UnexpectedMessages]}
                  end,
              assert_received_messages(StillMissing, Strays)
      after ?DEFAULT_WAIT_TIMEOUT ->
          assert_received_messages_evaluate(Messages, UnexpectedMessages)
      end.
  %% Keeps collecting every incoming message as unexpected until the mailbox
  %% stays quiet for ?UNEXPECTED_MESSAGES_WAIT_TIMEOUT milliseconds, then
  %% evaluates the outcome.
  assert_received_messages_wait(MissingMessages, UnexpectedMessages) ->
      receive
          Stray ->
              assert_received_messages_wait(MissingMessages, [Stray | UnexpectedMessages])
      after ?UNEXPECTED_MESSAGES_WAIT_TIMEOUT ->
          assert_received_messages_evaluate(MissingMessages, UnexpectedMessages)
      end.
  %% Final verdict of assert_received_messages/1: `ok' when nothing is missing
  %% and nothing unexpected arrived, otherwise fails the test reporting both
  %% lists (reversed) and the caller's line taken from the stacktrace.
  assert_received_messages_evaluate([], []) ->
      ok;
  assert_received_messages_evaluate(MissingMessages, UnexpectedMessages) ->
      Line = get_line_from_stacktrace(),
      Missing = lists:reverse(MissingMessages),
      Unexpected = lists:reverse(UnexpectedMessages),
      ct:fail(
          "~n\tReceive messages error (line ~p)~n\tMissing: ~p~n\tUnexpected: ~p~n",
          [Line, Missing, Unexpected]
      ).
  %% Asserts that the calling process receives no message: every message that
  %% arrives is collected, and once the mailbox has been quiet for
  %% ?UNEXPECTED_MESSAGES_WAIT_TIMEOUT milliseconds the test fails if anything
  %% was collected. Returns `ok' otherwise.
  assert_empty_queue() ->
      assert_empty_queue([]).

  assert_empty_queue(UnexpectedMessages) ->
      receive
          Stray ->
              assert_empty_queue([Stray | UnexpectedMessages])
      after ?UNEXPECTED_MESSAGES_WAIT_TIMEOUT ->
          assert_nothing_collected(UnexpectedMessages)
      end.

  %% `ok' for an empty collection, test failure listing the messages otherwise
  %% (most recently received first).
  assert_nothing_collected([]) ->
      ok;
  assert_nothing_collected(Collected) ->
      ct:fail("~n\tMessage queue was not empty, got:~n\t~p~n", [Collected]).
  %% Repeatedly evaluates `Fun' (every 50 ms) until it returns a value matching
  %% `ExpectedResult'. Returns `ok' on a match; fails the test, reporting the
  %% expected and the last actual value, once more than ?DEFAULT_WAIT_TIMEOUT
  %% milliseconds have elapsed.
  assert_wait(ExpectedResult, Fun) ->
      %% monotonic time: elapsed-time measurement must not depend on wall clock adjustments
      assert_wait(ExpectedResult, Fun, erlang:monotonic_time(millisecond)).

  assert_wait(ExpectedResult, Fun, StartAt) ->
      case Fun() of
          ExpectedResult ->
              ok;
          Result ->
              case erlang:monotonic_time(millisecond) - StartAt > ?DEFAULT_WAIT_TIMEOUT of
                  true ->
                      ct:fail("~n\tExpected: ~p~n\tActual: ~p~n", [ExpectedResult, Result]);
                  false ->
                      timer:sleep(50),
                      assert_wait(ExpectedResult, Fun, StartAt)
              end
      end.
  %% Opens an error_logger log file named after the current node and returns
  %% the result of error_logger:logfile/1.
  send_error_logger_to_disk() ->
      LogFile = atom_to_list(node()),
      error_logger:logfile({open, LogFile}).
  275. %% ===================================================================
  276. %% Internal
  277. %% ===================================================================
  %% Body of the processes spawned by start_process/0,1: discards every
  %% message it receives and never terminates on its own.
  process_main() ->
      receive
          _Ignored -> process_main()
      end.
  %% Asserts that syn:subcluster_nodes(Type, Scope), evaluated on `Node',
  %% yields exactly `ExpectedNodes', retrying until do_assert_cluster/3 either
  %% accepts the list or fails the test on timeout. Returns `ok'.
  do_assert_scope_subcluster(Type, Node, Scope, ExpectedNodes) ->
      do_assert_scope_subcluster(Type, Node, Scope, ExpectedNodes, os:system_time(millisecond)).

  do_assert_scope_subcluster(Type, Node, Scope, ExpectedNodes, StartAt) ->
      SubclusterNodes = rpc:call(Node, syn, subcluster_nodes, [Type, Scope]),
      case do_assert_cluster(SubclusterNodes, ExpectedNodes, StartAt) of
          continue ->
              %% not matching yet and still within the timeout: poll again
              do_assert_scope_subcluster(Type, Node, Scope, ExpectedNodes, StartAt);
          _Done ->
              ok
      end.
  %% Single polling step shared by the cluster assertions.
  %% `Nodes' is accepted when it has as many elements as `ExpectedNodes' and
  %% each of its elements is a member of `ExpectedNodes'.
  %%
  %% Returns `ok' when accepted. Otherwise, if more than ?DEFAULT_WAIT_TIMEOUT
  %% milliseconds have elapsed since `StartAt' (an os:system_time(millisecond)
  %% timestamp) the test is failed; if not, sleeps 50 ms and returns
  %% `continue' so the caller can fetch a fresh node list and retry.
  do_assert_cluster(Nodes, ExpectedNodes, StartAt) ->
      ExpectedCount = length(ExpectedNodes),
      IsExpected = fun(N) -> lists:member(N, ExpectedNodes) end,
      Accepted = length(Nodes) =:= ExpectedCount andalso lists:all(IsExpected, Nodes),
      case Accepted of
          true ->
              ok;
          false ->
              case os:system_time(millisecond) - StartAt > ?DEFAULT_WAIT_TIMEOUT of
                  true ->
                      ct:fail("~n\tInvalid subcluster~n\tExpected: ~p~n\tActual: ~p~n\tLine: ~p~n",
                          [ExpectedNodes, Nodes, get_line_from_stacktrace()]
                      );
                  false ->
                      timer:sleep(50),
                      continue
              end
      end.
  %% Removes every message currently in the caller's mailbox without blocking
  %% and returns `ok'.
  flush_inbox() ->
      receive
          _Discarded -> flush_inbox()
      after 0 ->
          %% nothing left in the mailbox
          ok
      end.
  %% Returns the line number recorded for the first frame of the current
  %% stacktrace that does not belong to this module, i.e. the place outside
  %% the helper from which the helper was entered.
  %%
  %% Returns `undefined' when that frame carries no line information or when
  %% every visible frame belongs to this module, so that building a failure
  %% message can never crash and hide the actual assertion failure.
  get_line_from_stacktrace() ->
      {current_stacktrace, Stacktrace} = process_info(self(), current_stacktrace),
      IsHelperFrame = fun({Module, _Function, _Arity, _Location}) -> Module =:= ?MODULE end,
      case lists:dropwhile(IsHelperFrame, Stacktrace) of
          [{_Module, _Function, _Arity, Location} | _] ->
              proplists:get_value(line, Location);
          [] ->
              undefined
      end.