syn_test_suite_helper.erl 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364
  1. %% ==========================================================================================================
  2. %% Syn - A global Process Registry and Process Group manager.
  3. %%
  4. %% The MIT License (MIT)
  5. %%
  6. %% Copyright (c) 2015-2021 Roberto Ostinelli <roberto@ostinelli.net> and Neato Robotics, Inc.
  7. %%
  8. %% Permission is hereby granted, free of charge, to any person obtaining a copy
  9. %% of this software and associated documentation files (the "Software"), to deal
  10. %% in the Software without restriction, including without limitation the rights
  11. %% to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  12. %% copies of the Software, and to permit persons to whom the Software is
  13. %% furnished to do so, subject to the following conditions:
  14. %%
  15. %% The above copyright notice and this permission notice shall be included in
  16. %% all copies or substantial portions of the Software.
  17. %%
  18. %% THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19. %% IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20. %% FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  21. %% AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  22. %% LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  23. %% OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  24. %% THE SOFTWARE.
  25. %% ==========================================================================================================
  26. -module(syn_test_suite_helper).
  27. %% API
  28. -export([init_cluster/1, end_cluster/2]).
  29. -export([start_slave/1, stop_slave/1]).
  30. -export([connect_node/1, disconnect_node/1]).
  31. -export([clean_after_test/0]).
  32. -export([start_process/0, start_process/1, start_process/2]).
  33. -export([kill_process/1]).
  34. -export([wait_cluster_mesh_connected/1]).
  35. -export([wait_process_name_ready/1, wait_process_name_ready/2]).
  36. -export([wait_message_queue_empty/0]).
  37. -export([assert_cluster/2]).
  38. -export([assert_registry_scope_subcluster/3, assert_pg_scope_subcluster/3]).
  39. -export([assert_received_messages/1]).
  40. -export([assert_empty_queue/1]).
  41. -export([assert_wait/2]).
  42. -export([send_error_logger_to_disk/0]).
  43. %% internal
  44. -export([process_main/0]).
  45. %% macro
  46. -define(TIMEOUT, 5000).
  47. %% ===================================================================
  48. %% API
  49. %% ===================================================================
  %% Boots `NodesCount - 1' slave nodes named syn_slave_1..N, asks every new
  %% slave to connect to all slaves started before it, then waits until the
  %% local node and all slaves see each other.
  %%
  %% Returns the list of `{NodeShortName, SlaveNode}' pairs on success, or
  %% `{error_initializing_cluster, Reason}' when the mesh did not form.
  init_cluster(NodesCount) ->
      %% Starts one slave and records it in both accumulators.
      BootSlave = fun(Index, {StartedNodes, ConfigEntries}) ->
          ShortName = list_to_atom("syn_slave_" ++ integer_to_list(Index)),
          {ok, Slave} = start_slave(ShortName),
          %% connect the fresh slave to every slave started so far
          _ = [
              rpc:call(Slave, syn_test_suite_helper, connect_node, [Peer])
           || Peer <- StartedNodes
          ],
          {[Slave | StartedNodes], [{ShortName, Slave} | ConfigEntries]}
      end,
      {Slaves, SlavesConfig} =
          lists:foldl(BootSlave, {[], []}, lists:seq(1, NodesCount - 1)),
      %% wait for the full mesh, local node included
      case syn_test_suite_helper:wait_cluster_mesh_connected([node() | Slaves]) of
          ok ->
              SlavesConfig;
          Failure ->
              ct:pal("*********** Could not get full cluster of ~p nodes, skipping", [NodesCount]),
              {error_initializing_cluster, Failure}
      end.
  %% Tears down a cluster created for `NodesCount' nodes: for each slave
  %% syn_slave_1..N-1 the node name is looked up in `Config', the local node
  %% (re)connects to it and the slave is stopped. Afterwards syn is cleaned up
  %% on the remaining nodes and the caller is paused for one second.
  end_cluster(NodesCount, Config) ->
      ShutdownSlave = fun(Index) ->
          ShortName = list_to_atom("syn_slave_" ++ integer_to_list(Index)),
          %% make sure the slave is reachable before asking it to stop
          connect_node(proplists:get_value(ShortName, Config)),
          stop_slave(ShortName)
      end,
      lists:foreach(ShutdownSlave, lists:seq(1, NodesCount - 1)),
      %% clean
      clean_after_test(),
      %% give the nodes time to settle
      timer:sleep(1000).
  %% Starts a ct_slave node with the given short name and replaces its code
  %% path with the local code path entries that contain "/syn/".
  %% The slave is started with automatic distribution connections disabled.
  %%
  %% Returns `{ok, Node}'; crashes (badmatch) if the slave cannot be started
  %% or its code path cannot be set.
  start_slave(NodeShortName) ->
      SlaveOptions = [
          {boot_timeout, 10},
          {erl_flags, "-connect_all false -kernel dist_auto_connect never"}
      ],
      {ok, Node} = ct_slave:start(NodeShortName, SlaveOptions),
      %% only the syn-related entries of the local code path are pushed
      SynPaths = [
          Path
       || Path <- code:get_path(), string:find(Path, "/syn/") =/= nomatch
      ],
      true = rpc:call(Node, code, set_path, [SynPaths]),
      {ok, Node}.
  %% Stops the ct_slave node with the given short name.
  %% Returns the `{ok, _}' tuple from ct_slave:stop/1; any other result
  %% crashes with badmatch.
  stop_slave(NodeShortName) ->
      {ok, _StoppedNode} = StopResult = ct_slave:stop(NodeShortName),
      StopResult.
  %% Connects the local node to `Node' and returns the result of
  %% net_kernel:connect_node/1 unchanged.
  connect_node(Node) ->
      ConnectResult = net_kernel:connect_node(Node),
      ConnectResult.
  %% Disconnects the local node from `Node' and returns the result of
  %% erlang:disconnect_node/1 unchanged.
  disconnect_node(Node) ->
      DisconnectResult = erlang:disconnect_node(Node),
      DisconnectResult.
  %% Stops the syn application and unsets its `event_handler' environment
  %% variable on the local node and on every currently connected node.
  %% The rpc results are ignored. Always returns `ok'.
  clean_after_test() ->
      _ = [
          begin
              %% close syn
              rpc:call(Target, application, stop, [syn]),
              %% clean env
              rpc:call(Target, application, unset_env, [syn, event_handler])
          end
       || Target <- [node() | nodes()]
      ],
      ok.
  %% Spawns a local process running process_main/0 and returns its pid.
  start_process() ->
      spawn(fun process_main/0).
  %% Spawns a process and returns its pid.
  %% Given a fun, runs that fun in a local process; given a node name (atom),
  %% runs process_main/0 in a process on that node.
  start_process(Loop) when is_function(Loop) ->
      spawn(Loop);
  start_process(Node) when is_atom(Node) ->
      spawn(Node, fun process_main/0).
  %% Spawns a process running `Loop' on `Node' and returns its pid.
  start_process(Node, Loop) ->
      spawn(Node, Loop).
  %% Kills a process given either its pid or its locally registered name and
  %% waits until it is confirmed dead.
  %%
  %% Returns `ok' when the process is gone (or was not alive / not registered
  %% to begin with). Fails the test case if no 'DOWN' message arrives within
  %% ?TIMEOUT milliseconds.
  kill_process(Pid) when is_pid(Pid) ->
      %% liveness is checked on the node that owns the pid
      case rpc:call(node(Pid), erlang, is_process_alive, [Pid]) of
          false ->
              ok;
          true ->
              Monitor = monitor(process, Pid),
              exit(Pid, kill),
              receive
                  {'DOWN', Monitor, process, Pid, _Why} -> ok
              after ?TIMEOUT ->
                  ct:fail("~n\tCould not kill process ~p~n", [Pid])
              end
      end;
  kill_process(RegisteredName) when is_atom(RegisteredName) ->
      case whereis(RegisteredName) of
          undefined -> ok;
          Registered -> kill_process(Registered)
      end.
  %% Waits until every node in `Nodes' reports exactly the other nodes of
  %% `Nodes' as its connected nodes (i.e. the nodes form a full mesh).
  %%
  %% Returns `ok' once the mesh is complete, or
  %% `{error, {could_not_init_cluster, Nodes}}' if that did not happen within
  %% ?TIMEOUT milliseconds. Polls every 50 ms.
  wait_cluster_mesh_connected(Nodes) ->
      %% monotonic time: the elapsed-time check must not be affected by
      %% wall-clock adjustments
      wait_cluster_mesh_connected(Nodes, erlang:monotonic_time(millisecond)).

  wait_cluster_mesh_connected(Nodes, StartAt) ->
      ExpectedMesh = lists:sort(Nodes),
      SeesFullMesh = fun(Node) ->
          case rpc:call(Node, erlang, nodes, []) of
              RemoteNodes when is_list(RemoteNodes) ->
                  lists:sort([Node | RemoteNodes]) =:= ExpectedMesh;
              {badrpc, _Reason} ->
                  %% node not reachable (yet): treat as "not synced" and
                  %% retry instead of crashing on an improper list
                  false
          end
      end,
      case lists:all(SeesFullMesh, Nodes) of
          true ->
              ok;
          false ->
              case erlang:monotonic_time(millisecond) - StartAt > ?TIMEOUT of
                  true ->
                      {error, {could_not_init_cluster, Nodes}};
                  false ->
                      timer:sleep(50),
                      wait_cluster_mesh_connected(Nodes, StartAt)
              end
      end.
  %% Waits until a process is registered locally under `Name' and its status
  %% is `waiting'.
  %%
  %% `StartAt' is the os:system_time(millisecond) value at which waiting
  %% began. Each attempt first sleeps 50 ms. Returns `ok' when the process is
  %% ready; fails the test case once more than ?TIMEOUT milliseconds have
  %% elapsed since `StartAt'.
  wait_process_name_ready(Name) ->
      wait_process_name_ready(Name, os:system_time(millisecond)).

  wait_process_name_ready(Name, StartAt) ->
      timer:sleep(50),
      %% Tries again while within the deadline, otherwise fails the test case
      %% with the given report.
      RetryOrFail = fun(Format, Args) ->
          case os:system_time(millisecond) - StartAt > ?TIMEOUT of
              false -> wait_process_name_ready(Name, StartAt);
              true -> ct:fail(Format, Args)
          end
      end,
      case whereis(Name) of
          undefined ->
              RetryOrFail("~n\tProcess with name ~p didn't come alive~n", [Name]);
          Pid ->
              case process_info(Pid, status) of
                  {status, waiting} ->
                      ok;
                  Other ->
                      RetryOrFail(
                          "~n\tProcess with name ~p didn't come ready~n\tStatus: ~p~n",
                          [Name, Other]
                      )
              end
      end.
  %% Sleeps 500 ms, then repeatedly drains the calling process' mailbox and
  %% checks that it is empty, via assert_wait/2.
  wait_message_queue_empty() ->
      timer:sleep(500),
      DrainAndCheck = fun() ->
          flush_inbox(),
          syn_test_suite_helper:assert_empty_queue(self())
      end,
      syn_test_suite_helper:assert_wait(ok, DrainAndCheck).
  %% Asserts that the nodes connected to `Node' (as reported by
  %% erlang:nodes/0 on that node) are `ExpectedNodes'. The comparison, the
  %% retry pacing and the failure report are delegated to do_assert_cluster/3;
  %% this function loops for as long as it answers `continue'.
  assert_cluster(Node, ExpectedNodes) ->
      assert_cluster(Node, ExpectedNodes, os:system_time(millisecond)).

  assert_cluster(Node, ExpectedNodes, StartAt) ->
      ConnectedNodes = rpc:call(Node, erlang, nodes, []),
      Outcome = do_assert_cluster(ConnectedNodes, ExpectedNodes, StartAt),
      if
          Outcome =:= continue -> assert_cluster(Node, ExpectedNodes, StartAt);
          true -> ok
      end.
  %% Asserts that, on `Node', the registry subcluster of `Scope' is made of
  %% `ExpectedNodes'. Delegates to do_assert_scope_subcluster/4.
  assert_registry_scope_subcluster(Node, Scope, ExpectedNodes) ->
      SubclusterType = registry,
      do_assert_scope_subcluster(SubclusterType, Node, Scope, ExpectedNodes).
  %% Asserts that, on `Node', the process-group (pg) subcluster of `Scope' is
  %% made of `ExpectedNodes'. Delegates to do_assert_scope_subcluster/4.
  assert_pg_scope_subcluster(Node, Scope, ExpectedNodes) ->
      SubclusterType = pg,
      do_assert_scope_subcluster(SubclusterType, Node, Scope, ExpectedNodes).
  %% Consumes messages from the calling process' mailbox until every message
  %% in `Messages' has been received (in any order), or until no message
  %% arrives for ?TIMEOUT milliseconds.
  %%
  %% Messages that are not expected are collected; the final verdict
  %% (ok or test failure) is produced by do_assert_received_messages/2.
  assert_received_messages(Messages) ->
      assert_received_messages(Messages, []).

  assert_received_messages([], UnexpectedMessages) ->
      %% nothing left to wait for
      do_assert_received_messages([], UnexpectedMessages);
  assert_received_messages(Messages, UnexpectedMessages) ->
      receive
          Received ->
              case lists:member(Received, Messages) of
                  false ->
                      assert_received_messages(Messages, [Received | UnexpectedMessages]);
                  true ->
                      %% tick off one occurrence of the expected message
                      StillExpected = lists:delete(Received, Messages),
                      assert_received_messages(StillExpected, UnexpectedMessages)
              end
      after ?TIMEOUT ->
          do_assert_received_messages(Messages, UnexpectedMessages)
      end.
  %% Asserts that the message queue of `Pid' is empty.
  %% Returns `ok' when it is; otherwise fails the test case, reporting the
  %% queued messages.
  assert_empty_queue(Pid) when is_pid(Pid) ->
      QueueInfo = process_info(Pid, message_queue_len),
      if
          QueueInfo =:= {message_queue_len, 0} ->
              ok;
          true ->
              {messages, Pending} = process_info(Pid, messages),
              ct:fail("~n\tMessage queue was not empty, got:~n\t~p~n", [Pending])
      end.
  %% Repeatedly evaluates `Fun' (every 50 ms) until it returns a term matching
  %% `ExpectedResult'.
  %%
  %% Returns `ok' on a match. Fails the test case, reporting the expected and
  %% the last actual value, once more than ?TIMEOUT milliseconds have elapsed.
  assert_wait(ExpectedResult, Fun) ->
      %% monotonic time: the elapsed-time check must not be affected by
      %% wall-clock adjustments
      assert_wait(ExpectedResult, Fun, erlang:monotonic_time(millisecond)).

  assert_wait(ExpectedResult, Fun, StartAt) ->
      case Fun() of
          ExpectedResult ->
              ok;
          Result ->
              case erlang:monotonic_time(millisecond) - StartAt > ?TIMEOUT of
                  true ->
                      ct:fail("~n\tExpected: ~p~n\tActual: ~p~n", [ExpectedResult, Result]);
                  false ->
                      timer:sleep(50),
                      assert_wait(ExpectedResult, Fun, StartAt)
              end
      end.
  %% Opens an error_logger log file whose file name is the current node name.
  send_error_logger_to_disk() ->
      LogFile = atom_to_list(node()),
      error_logger:logfile({open, LogFile}).
  255. %% ===================================================================
  256. %% Internal
  257. %% ===================================================================
  %% Loop of the dummy test processes: discards every message it receives,
  %% forever.
  process_main() ->
      receive
          _AnyMessage -> ok
      end,
      process_main().
  %% Asserts that syn:subcluster_nodes(Type, Scope), evaluated on `Node',
  %% yields `ExpectedNodes'. The comparison, the retry pacing and the failure
  %% report are delegated to do_assert_cluster/3; this function loops for as
  %% long as it answers `continue'.
  do_assert_scope_subcluster(Type, Node, Scope, ExpectedNodes) ->
      Now = os:system_time(millisecond),
      do_assert_scope_subcluster(Type, Node, Scope, ExpectedNodes, Now).

  do_assert_scope_subcluster(Type, Node, Scope, ExpectedNodes, StartAt) ->
      SubclusterNodes = rpc:call(Node, syn, subcluster_nodes, [Type, Scope]),
      Outcome = do_assert_cluster(SubclusterNodes, ExpectedNodes, StartAt),
      if
          Outcome =:= continue ->
              do_assert_scope_subcluster(Type, Node, Scope, ExpectedNodes, StartAt);
          true ->
              ok
      end.
  %% Single step of a cluster assertion.
  %%
  %% `Nodes' is the node list actually observed, `ExpectedNodes' the wanted
  %% one, `StartAt' the os:system_time(millisecond) value at which the
  %% assertion started.
  %%
  %% Returns `ok' when `Nodes' has as many elements as `ExpectedNodes' and
  %% every element of `Nodes' is a member of `ExpectedNodes'. Otherwise sleeps
  %% 50 ms and returns `continue' (the caller is expected to re-fetch the
  %% nodes and call again), or fails the test case once more than ?TIMEOUT
  %% milliseconds have elapsed.
  do_assert_cluster(Nodes, ExpectedNodes, StartAt) ->
      %% A non-list value (e.g. a `{badrpc, _}' handed over by a caller) is
      %% treated as a mismatch, so that it is retried and eventually reported
      %% as `Actual' instead of crashing in length/1.
      Matches =
          is_list(Nodes) andalso
              length(Nodes) =:= length(ExpectedNodes) andalso
              lists:all(fun(N) -> lists:member(N, ExpectedNodes) end, Nodes),
      case Matches of
          true ->
              ok;
          false ->
              case os:system_time(millisecond) - StartAt > ?TIMEOUT of
                  true ->
                      ct:fail(
                          "~n\tInvalid subcluster~n\tExpected: ~p~n\tActual: ~p~n\tLine: ~p~n",
                          [ExpectedNodes, Nodes, get_line_from_stacktrace()]
                      );
                  false ->
                      timer:sleep(50),
                      continue
              end
      end.
  %% Final verdict of assert_received_messages: `ok' when nothing is missing
  %% and nothing unexpected was received, otherwise fails the test case with
  %% a report of both lists.
  %%
  %% `MissingMessages' is what is left of the caller's expected list and is
  %% already in the caller's order, so it is reported as is.
  %% `UnexpectedMessages' was built by prepending, so it is reversed to show
  %% the messages in arrival order.
  do_assert_received_messages([], []) ->
      ok;
  do_assert_received_messages(MissingMessages, UnexpectedMessages) ->
      ct:fail(
          "~n\tReceive messages error~n\tMissing: ~p~n\tUnexpected: ~p~n",
          [MissingMessages, lists:reverse(UnexpectedMessages)]
      ).
  %% Discards every message currently in the calling process' mailbox without
  %% blocking. Returns `ok'.
  flush_inbox() ->
      MailboxEmpty =
          receive
              _Discarded -> false
          after 0 ->
              true
          end,
      case MailboxEmpty of
          true -> ok;
          false -> flush_inbox()
      end.
  %% Returns the `line' entry of the first frame of the current stacktrace
  %% that does not belong to this module, or `undefined' if that frame
  %% carries no line information.
  get_line_from_stacktrace() ->
      {current_stacktrace, Frames} = process_info(self(), current_stacktrace),
      IsOwnFrame = fun({Mod, _Fun, _Arity, _Location}) -> Mod =:= ?MODULE end,
      %% skip the leading frames of this helper module
      [{_, _, _, Location} | _] = lists:dropwhile(IsOwnFrame, Frames),
      proplists:get_value(line, Location).