syn_benchmark.erl 8.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224
  1. %% ==========================================================================================================
  2. %% Syn - A global Process Registry and Process Group manager.
  3. %%
  4. %% The MIT License (MIT)
  5. %%
  6. %% Copyright (c) 2019-2021 Roberto Ostinelli <roberto@ostinelli.net> and Neato Robotics, Inc.
  7. %%
  8. %% Permission is hereby granted, free of charge, to any person obtaining a copy
  9. %% of this software and associated documentation files (the "Software"), to deal
  10. %% in the Software without restriction, including without limitation the rights
  11. %% to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  12. %% copies of the Software, and to permit persons to whom the Software is
  13. %% furnished to do so, subject to the following conditions:
  14. %%
  15. %% The above copyright notice and this permission notice shall be included in
  16. %% all copies or substantial portions of the Software.
  17. %%
  18. %% THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19. %% IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20. %% FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  21. %% AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  22. %% LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  23. %% OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  24. %% THE SOFTWARE.
  25. %% ==========================================================================================================
  26. -module(syn_benchmark).
  27. %% API
  28. -compile([export_all]).
  29. %% ===================================================================
  30. %% API
  31. %% ===================================================================
  32. %% example run: `PROCESS_COUNT=100000 NODES_COUNT=2 make bench`
  %% Runs the whole benchmark from the master node and then stops the local VM.
  %%
  %% Configuration is read from the environment:
  %%   NODES_COUNT   - number of slave nodes to start (default "1")
  %%   PROCESS_COUNT - total number of processes to register (default "100000")
  %%
  %% Slave nodes named `slave_N' are started through ct_slave, syn is started on
  %% every node, and four phases are timed and printed with io:format/2:
  %% registration, unregistration, re-registration and unregistration caused by
  %% killing the registered processes. Every phase is measured as the slowest
  %% remote node plus the extra time until the master sees the change.
  %%
  %% Any unexpected result (slave fails to boot, syn fails to start, ...) crashes
  %% the benchmark through an assertive match.
  start() ->
      %% init
      SlavesCount = list_to_integer(os:getenv("NODES_COUNT", "1")),
      ProcessCount = list_to_integer(os:getenv("PROCESS_COUNT", "100000")),
      ProcessesPerNode = round(ProcessCount / SlavesCount),
      io:format("-----> Starting benchmark on ~w nodes (~w slaves) (for ~w processes total (~w / slave node)~n",
          [SlavesCount + 1, SlavesCount, ProcessCount, ProcessesPerNode]
      ),
      %% start nodes
      NodesInfo = lists:foldl(fun(I, Acc) ->
          %% start slave
          CountBin = integer_to_binary(I),
          NodeShortName = binary_to_atom(<<"slave_", CountBin/binary>>),
          {ok, Node} = ct_slave:start(NodeShortName, [
              {boot_timeout, 10},
              {monitor_master, true}
          ]),
          %% add code path
          CodePath = code:get_path(),
          true = rpc:call(Node, code, set_path, [CodePath]),
          %% start syn; asserted like the local start below so that a failed
          %% remote start (or a badrpc) stops the benchmark instead of leaving
          %% it waiting for registrations that will never happen
          ok = rpc:call(Node, syn, start, []),
          %% gather data: every node owns a contiguous range of integer names
          FromName = (I - 1) * ProcessesPerNode + 1,
          ToName = FromName + ProcessesPerNode - 1,
          %% fold
          [{Node, FromName, ToName} | Acc]
      end, [], lists:seq(1, SlavesCount)),
      %% Only the nodes started above ever send a `done' message. Waiting on
      %% nodes() instead would block forever if any other node is connected.
      SlaveNodes = [SlaveNode || {SlaveNode, _From, _To} <- NodesInfo],
      %% start syn locally
      ok = syn:start(),
      timer:sleep(1000),
      CollectorPid = self(),
      %% start processes
      PidsMap = lists:foldl(fun({Node, _FromName, _ToName}, Acc) ->
          Pids = rpc:call(Node, ?MODULE, start_processes, [ProcessesPerNode]),
          maps:put(Node, Pids, Acc)
      end, #{}, NodesInfo),
      %% start registration
      lists:foreach(fun({Node, FromName, _ToName}) ->
          Pids = maps:get(Node, PidsMap),
          rpc:cast(Node, ?MODULE, register_on_node, [CollectorPid, FromName, Pids])
      end, NodesInfo),
      %% wait
      RegRemoteNodesTimes = wait_from_all_remote_nodes(SlaveNodes, []),
      io:format("----> Remote registration times:~n"),
      io:format(" --> MIN: ~p secs.~n", [lists:min(RegRemoteNodesTimes)]),
      io:format(" --> MAX: ~p secs.~n", [lists:max(RegRemoteNodesTimes)]),
      %% timer:tc/3 reports microseconds
      {RegPropagationMicros, _} = timer:tc(?MODULE, wait_registration_propagation, [NodesInfo]),
      RegPropagationTime = RegPropagationMicros / 1000000,
      io:format("----> Eventual additional time to propagate all to master: ~p secs.~n", [RegPropagationTime]),
      %% sum
      RegTakenTime = (lists:max(RegRemoteNodesTimes) + RegPropagationTime),
      RegistrationRate = ProcessCount / RegTakenTime,
      io:format("====> Registeration rate (with propagation): ~p/sec.~n~n", [RegistrationRate]),
      timer:sleep(1000),
      %% start unregistration
      lists:foreach(fun({Node, FromName, ToName}) ->
          rpc:cast(Node, ?MODULE, unregister_on_node, [CollectorPid, FromName, ToName])
      end, NodesInfo),
      %% wait
      UnregRemoteNodesTimes = wait_from_all_remote_nodes(SlaveNodes, []),
      io:format("----> Remote unregistration times:~n"),
      io:format(" --> MIN: ~p secs.~n", [lists:min(UnregRemoteNodesTimes)]),
      io:format(" --> MAX: ~p secs.~n", [lists:max(UnregRemoteNodesTimes)]),
      {UnregPropagationMicros, _} = timer:tc(?MODULE, wait_unregistration_propagation, [NodesInfo]),
      UnregPropagationTime = UnregPropagationMicros / 1000000,
      io:format("----> Eventual additional time to propagate all to master: ~p secs.~n", [UnregPropagationTime]),
      %% sum
      UnregTakenTime = (lists:max(UnregRemoteNodesTimes) + UnregPropagationTime),
      UnregistrationRate = ProcessCount / UnregTakenTime,
      io:format("====> Unregisteration rate (with propagation): ~p/sec.~n~n", [UnregistrationRate]),
      %% start re-registration
      lists:foreach(fun({Node, FromName, _ToName}) ->
          Pids = maps:get(Node, PidsMap),
          rpc:cast(Node, ?MODULE, register_on_node, [CollectorPid, FromName, Pids])
      end, NodesInfo),
      %% wait
      ReRegRemoteNodesTimes = wait_from_all_remote_nodes(SlaveNodes, []),
      io:format("----> Remote re-registration times:~n"),
      io:format(" --> MIN: ~p secs.~n", [lists:min(ReRegRemoteNodesTimes)]),
      io:format(" --> MAX: ~p secs.~n", [lists:max(ReRegRemoteNodesTimes)]),
      {ReRegPropagationMicros, _} = timer:tc(?MODULE, wait_registration_propagation, [NodesInfo]),
      ReRegPropagationTime = ReRegPropagationMicros / 1000000,
      io:format("----> Eventual additional time to propagate all to master: ~p secs.~n", [ReRegPropagationTime]),
      %% sum
      ReRegTakenTime = (lists:max(ReRegRemoteNodesTimes) + ReRegPropagationTime),
      ReRegistrationRate = ProcessCount / ReRegTakenTime,
      io:format("====> Re-registeration rate (with propagation): ~p/sec.~n~n", [ReRegistrationRate]),
      %% kill all processes
      maps:foreach(fun(_Node, Pids) ->
          lists:foreach(fun(Pid) -> exit(Pid, kill) end, Pids)
      end, PidsMap),
      %% wait all unregistered
      {KillPropagationMicros, _} = timer:tc(?MODULE, wait_unregistration_propagation, [NodesInfo]),
      KillPropagationTime = KillPropagationMicros / 1000000,
      io:format("----> Time to propagate killed process to to master: ~p secs.~n", [KillPropagationTime]),
      KillRate = ProcessCount / KillPropagationTime,
      io:format("====> Unregistered after kill rate (with propagation): ~p/sec.~n~n", [KillRate]),
      %% stop node
      init:stop().
  %% Registers `Pids' on the local node, starting at name `FromName', and
  %% reports how long it took.
  %%
  %% The duration in seconds is printed and also sent to `CollectorPid' as
  %% `{done, node(), Seconds}'. Returns the message that was sent.
  register_on_node(CollectorPid, FromName, Pids) ->
      %% timer:tc/3 measures in microseconds
      {ElapsedMicros, _Result} = timer:tc(?MODULE, do_register_on_node, [FromName, Pids]),
      Seconds = ElapsedMicros / 1000000,
      ThisNode = node(),
      io:format("----> Registered on node ~p on ~p secs.~n", [ThisNode, Seconds]),
      CollectorPid ! {done, ThisNode, Seconds}.
  %% Registers every pid in `Pids' with syn under consecutive integer names:
  %% the first pid gets `Name', the next one `Name + 1', and so on.
  %% Crashes on the first registration that does not return `ok'.
  %% Returns `ok' (also for an empty list).
  do_register_on_node(Name, Pids) ->
      _NextFreeName = lists:foldl(fun(Pid, CurrentName) ->
          ok = syn:register(CurrentName, Pid),
          CurrentName + 1
      end, Name, Pids),
      ok.
  %% Unregisters the names `FromName'..`ToName' on the local node and reports
  %% how long it took.
  %%
  %% The duration in seconds is printed and also sent to `CollectorPid' as
  %% `{done, node(), Seconds}'. Returns the message that was sent.
  unregister_on_node(CollectorPid, FromName, ToName) ->
      %% timer:tc/3 measures in microseconds
      {ElapsedMicros, _Result} = timer:tc(?MODULE, do_unregister_on_node, [FromName, ToName]),
      Seconds = ElapsedMicros / 1000000,
      ThisNode = node(),
      io:format("----> Unregistered on node ~p on ~p secs.~n", [ThisNode, Seconds]),
      CollectorPid ! {done, ThisNode, Seconds}.
  %% Unregisters every name from `Name' up to and including `ToName', one by
  %% one in ascending order. Crashes on the first call to syn:unregister/1 that
  %% does not return `ok'. Returns `ok' once the range is exhausted, which is
  %% immediately when the range is empty (`Name' greater than `ToName').
  do_unregister_on_node(Name, ToName) when Name =< ToName ->
      ok = syn:unregister(Name),
      do_unregister_on_node(Name + 1, ToName);
  do_unregister_on_node(_PastEnd, _ToName) ->
      ok.
  %% Spawns `Count' idle processes (each running process_loop/0) on the local
  %% node and returns their pids.
  start_processes(Count) ->
      start_processes(Count, []).

  %% Accumulator version: `Count' is the number of processes still to spawn and
  %% `Pids' the pids spawned so far. New pids are prepended, so the most
  %% recently spawned process is at the head of the returned list.
  start_processes(Count, Pids) when Count =/= 0 ->
      NewPid = spawn(fun process_loop/0),
      start_processes(Count - 1, [NewPid | Pids]);
  start_processes(_Done, Pids) ->
      Pids.
  %% Body of the benchmark's placeholder processes: blocks until any message
  %% arrives, then returns `ok' (which ends a process spawned on this function).
  process_loop() ->
      receive
          _AnyMessage ->
              ok
      end.
  %% Collects one `{done, Node, Time}' message for every node in the given list
  %% and returns the reported times prepended to `Times'.
  %%
  %% Nodes are awaited in list order with a selective receive, so messages may
  %% arrive in any order. There is no timeout: the call blocks until every
  %% listed node has reported.
  wait_from_all_remote_nodes(RemoteNodes, Times) ->
      lists:foldl(fun(RemoteNode, Collected) ->
          receive
              {done, RemoteNode, Time} ->
                  [Time | Collected]
          end
      end, Times, RemoteNodes).
  %% Blocks until the local syn can see the last name (`ToName') of every entry
  %% in `NodesInfo', handling the entries one after the other.
  %%
  %% Only that last name is probed per entry. While syn:lookup/1 returns
  %% `undefined' the name is polled again after 50 ms; a `{Pid, undefined}'
  %% result counts as propagated. Any other lookup result crashes. Returns `ok'.
  wait_registration_propagation(NodesInfo) ->
      AwaitVisible = fun Poll(Name) ->
          case syn:lookup(Name) of
              {_Pid, undefined} ->
                  ok;
              undefined ->
                  timer:sleep(50),
                  Poll(Name)
          end
      end,
      lists:foreach(fun({_Node, _FromName, ToName}) ->
          AwaitVisible(ToName)
      end, NodesInfo).
  %% Blocks until the local syn no longer sees the last name (`ToName') of any
  %% entry in `NodesInfo', handling the entries one after the other.
  %%
  %% Only that last name is probed per entry. While syn:lookup/1 still returns
  %% `{Pid, undefined}' the name is polled again after 50 ms; `undefined' counts
  %% as gone. Any other lookup result crashes. Returns `ok'.
  wait_unregistration_propagation(NodesInfo) ->
      AwaitGone = fun Poll(Name) ->
          case syn:lookup(Name) of
              {_Pid, undefined} ->
                  timer:sleep(50),
                  Poll(Name);
              undefined ->
                  ok
          end
      end,
      lists:foreach(fun({_Node, _FromName, ToName}) ->
          AwaitGone(ToName)
      end, NodesInfo).