syn_benchmark.erl 9.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246
  1. %% ==========================================================================================================
  2. %% Syn - A global Process Registry and Process Group manager.
  3. %%
  4. %% The MIT License (MIT)
  5. %%
  6. %% Copyright (c) 2019-2021 Roberto Ostinelli <roberto@ostinelli.net> and Neato Robotics, Inc.
  7. %%
  8. %% Permission is hereby granted, free of charge, to any person obtaining a copy
  9. %% of this software and associated documentation files (the "Software"), to deal
  10. %% in the Software without restriction, including without limitation the rights
  11. %% to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  12. %% copies of the Software, and to permit persons to whom the Software is
  13. %% furnished to do so, subject to the following conditions:
  14. %%
  15. %% The above copyright notice and this permission notice shall be included in
  16. %% all copies or substantial portions of the Software.
  17. %%
  18. %% THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19. %% IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20. %% FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  21. %% AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  22. %% LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  23. %% OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  24. %% THE SOFTWARE.
  25. %% ==========================================================================================================
  26. -module(syn_benchmark).
  27. %% API
  28. -export([
  29. start/0,
  30. start_processes/1,
  31. process_loop/0,
  32. register_on_node/3,
  33. do_register_on_node/2,
  34. unregister_on_node/3,
  35. do_unregister_on_node/2,
  36. wait_registration_propagation/1,
  37. wait_unregistration_propagation/1
  38. ]).
  39. -export([
  40. start_profiling/0,
  41. stop_profiling/0
  42. ]).
  43. %% ===================================================================
  44. %% API
  45. %% ===================================================================
  46. %% example run: `PROCESS_COUNT=100000 NODES_COUNT=2 make bench`
  47. start() ->
  48. %% init
  49. SlavesCount = list_to_integer(os:getenv("NODES_COUNT", "1")),
  50. ProcessCount = list_to_integer(os:getenv("PROCESS_COUNT", "100000")),
  51. ProcessesPerNode = round(ProcessCount / SlavesCount),
  52. io:format("-----> Starting benchmark on ~w nodes (~w slaves) (for ~w processes total (~w / slave node)~n",
  53. [SlavesCount + 1, SlavesCount, ProcessCount, ProcessesPerNode]
  54. ),
  55. %% start nodes
  56. NodesInfo = lists:foldl(fun(I, Acc) ->
  57. %% start slave
  58. CountBin = integer_to_binary(I),
  59. NodeShortName = binary_to_atom(<<"slave_", CountBin/binary>>),
  60. {ok, Node} = ct_slave:start(NodeShortName, [
  61. {boot_timeout, 10},
  62. {monitor_master, true}
  63. ]),
  64. %% add code path
  65. CodePath = code:get_path(),
  66. true = rpc:call(Node, code, set_path, [CodePath]),
  67. %% start syn
  68. rpc:call(Node, syn, start, []),
  69. %% gather data
  70. FromName = (I - 1) * ProcessesPerNode + 1,
  71. ToName = FromName + ProcessesPerNode - 1,
  72. %% fold
  73. [{Node, FromName, ToName} | Acc]
  74. end, [], lists:seq(1, SlavesCount)),
  75. %% start syn locally
  76. ok = syn:start(),
  77. timer:sleep(1000),
  78. CollectorPid = self(),
  79. %% start processes
  80. PidsMap = lists:foldl(fun({Node, _FromName, _ToName}, Acc) ->
  81. Pids = rpc:call(Node, ?MODULE, start_processes, [ProcessesPerNode]),
  82. maps:put(Node, Pids, Acc)
  83. end, #{}, NodesInfo),
  84. %% start registration
  85. lists:foreach(fun({Node, FromName, _ToName}) ->
  86. Pids = maps:get(Node, PidsMap),
  87. rpc:cast(Node, ?MODULE, register_on_node, [CollectorPid, FromName, Pids])
  88. end, NodesInfo),
  89. %% wait
  90. RegRemoteNodesTimes = wait_from_all_remote_nodes(nodes(), []),
  91. io:format("----> Remote registration times:~n"),
  92. io:format(" --> MIN: ~p secs.~n", [lists:min(RegRemoteNodesTimes)]),
  93. io:format(" --> MAX: ~p secs.~n", [lists:max(RegRemoteNodesTimes)]),
  94. {RegPropagationTimeMs, _} = timer:tc(?MODULE, wait_registration_propagation, [NodesInfo]),
  95. RegPropagationTime = RegPropagationTimeMs / 1000000,
  96. io:format("----> Eventual additional time to propagate all to master: ~p secs.~n", [RegPropagationTime]),
  97. %% sum
  98. RegTakenTime = (lists:max(RegRemoteNodesTimes) + RegPropagationTime),
  99. RegistrationRate = ProcessCount / RegTakenTime,
  100. io:format("====> Registeration rate (with propagation): ~p/sec.~n~n", [RegistrationRate]),
  101. timer:sleep(1000),
  102. %% start unregistration
  103. lists:foreach(fun({Node, FromName, ToName}) ->
  104. rpc:cast(Node, ?MODULE, unregister_on_node, [CollectorPid, FromName, ToName])
  105. end, NodesInfo),
  106. %% wait
  107. UnregRemoteNodesTimes = wait_from_all_remote_nodes(nodes(), []),
  108. io:format("----> Remote unregistration times:~n"),
  109. io:format(" --> MIN: ~p secs.~n", [lists:min(UnregRemoteNodesTimes)]),
  110. io:format(" --> MAX: ~p secs.~n", [lists:max(UnregRemoteNodesTimes)]),
  111. {UnregPropagationTimeMs, _} = timer:tc(?MODULE, wait_unregistration_propagation, [NodesInfo]),
  112. UnregPropagationTime = UnregPropagationTimeMs / 1000000,
  113. io:format("----> Eventual additional time to propagate all to master: ~p secs.~n", [UnregPropagationTime]),
  114. %% sum
  115. UnregTakenTime = (lists:max(UnregRemoteNodesTimes) + UnregPropagationTime),
  116. UnregistrationRate = ProcessCount / UnregTakenTime,
  117. io:format("====> Unregisteration rate (with propagation): ~p/sec.~n~n", [UnregistrationRate]),
  118. %% start re-registration
  119. lists:foreach(fun({Node, FromName, _ToName}) ->
  120. Pids = maps:get(Node, PidsMap),
  121. rpc:cast(Node, ?MODULE, register_on_node, [CollectorPid, FromName, Pids])
  122. end, NodesInfo),
  123. %% wait
  124. ReRegRemoteNodesTimes = wait_from_all_remote_nodes(nodes(), []),
  125. io:format("----> Remote re-registration times:~n"),
  126. io:format(" --> MIN: ~p secs.~n", [lists:min(ReRegRemoteNodesTimes)]),
  127. io:format(" --> MAX: ~p secs.~n", [lists:max(ReRegRemoteNodesTimes)]),
  128. {ReRegPropagationTimeMs, _} = timer:tc(?MODULE, wait_registration_propagation, [NodesInfo]),
  129. ReRegPropagationTime = ReRegPropagationTimeMs / 1000000,
  130. io:format("----> Eventual additional time to propagate all to master: ~p secs.~n", [ReRegPropagationTime]),
  131. %% sum
  132. ReRegTakenTime = (lists:max(ReRegRemoteNodesTimes) + ReRegPropagationTime),
  133. ReRegistrationRate = ProcessCount / ReRegTakenTime,
  134. io:format("====> Re-registeration rate (with propagation): ~p/sec.~n~n", [ReRegistrationRate]),
  135. %% kill all processes
  136. maps:foreach(fun(_Node, Pids) ->
  137. lists:foreach(fun(Pid) -> exit(Pid, kill) end, Pids)
  138. end, PidsMap),
  139. %% wait all unregistered
  140. {KillPropagationTimeMs, _} = timer:tc(?MODULE, wait_unregistration_propagation, [NodesInfo]),
  141. KillPropagationTime = KillPropagationTimeMs / 1000000,
  142. io:format("----> Time to propagate killed process to to master: ~p secs.~n", [KillPropagationTime]),
  143. KillRate = ProcessCount / KillPropagationTime,
  144. io:format("====> Unregistered after kill rate (with propagation): ~p/sec.~n~n", [KillRate]),
  145. %% stop node
  146. init:stop().
  147. register_on_node(CollectorPid, FromName, Pids) ->
  148. {TimeMs, _} = timer:tc(?MODULE, do_register_on_node, [FromName, Pids]),
  149. Time = TimeMs / 1000000,
  150. io:format("----> Registered on node ~p on ~p secs.~n", [node(), Time]),
  151. CollectorPid ! {done, node(), Time}.
  152. do_register_on_node(_Name, []) -> ok;
  153. do_register_on_node(Name, [Pid | PidsTail]) ->
  154. ok = syn:register(Name, Pid),
  155. do_register_on_node(Name + 1, PidsTail).
  156. unregister_on_node(CollectorPid, FromName, ToName) ->
  157. {TimeMs, _} = timer:tc(?MODULE, do_unregister_on_node, [FromName, ToName]),
  158. Time = TimeMs / 1000000,
  159. io:format("----> Unregistered on node ~p on ~p secs.~n", [node(), Time]),
  160. CollectorPid ! {done, node(), Time}.
  161. do_unregister_on_node(FromName, ToName) when FromName > ToName -> ok;
  162. do_unregister_on_node(Name, ToName) ->
  163. ok = syn:unregister(Name),
  164. do_unregister_on_node(Name + 1, ToName).
  165. start_processes(Count) ->
  166. start_processes(Count, []).
  167. start_processes(0, Pids) ->
  168. Pids;
  169. start_processes(Count, Pids) ->
  170. Pid = spawn(fun process_loop/0),
  171. start_processes(Count - 1, [Pid | Pids]).
  172. process_loop() ->
  173. receive
  174. _ -> ok
  175. end.
  176. wait_from_all_remote_nodes([], Times) -> Times;
  177. wait_from_all_remote_nodes([RemoteNode | Tail], Times) ->
  178. receive
  179. {done, RemoteNode, Time} ->
  180. wait_from_all_remote_nodes(Tail, [Time | Times])
  181. end.
  182. wait_registration_propagation([]) -> ok;
  183. wait_registration_propagation([{_Node, _FromName, ToName} | NodeInfosTail] = NodesInfo) ->
  184. case syn:lookup(ToName) of
  185. undefined ->
  186. timer:sleep(50),
  187. wait_registration_propagation(NodesInfo);
  188. {_Pid, undefined} ->
  189. wait_registration_propagation(NodeInfosTail)
  190. end.
  191. wait_unregistration_propagation([]) -> ok;
  192. wait_unregistration_propagation([{_Node, _FromName, ToName} | NodeInfosTail] = NodesInfo) ->
  193. case syn:lookup(ToName) of
  194. undefined ->
  195. wait_unregistration_propagation(NodeInfosTail);
  196. {_Pid, undefined} ->
  197. timer:sleep(50),
  198. wait_unregistration_propagation(NodesInfo)
  199. end.
  200. start_profiling() ->
  201. {ok, P} = eprof:start(),
  202. eprof:start_profiling(erlang:processes() -- [P]).
  203. stop_profiling() ->
  204. eprof:stop_profiling(),
  205. eprof:analyze(total).