pooler_tests.erl 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581
  1. -module(pooler_tests).
  2. -include_lib("eunit/include/eunit.hrl").
  3. -compile([export_all]).
  4. % The `user' processes represent users of the pooler library. A user
  5. % process will take a pid, report details on the pid it has, release
  6. % and take a new pid, stop cleanly, and crash.
  % Spawn an unlinked user process. It enters user_loop/1 in the `start'
  % state, so its first action is to take a member from test_pool_1.
  % Returns the pid of the new user process.
  start_user() ->
      Body = fun() -> user_loop(start) end,
      erlang:spawn(Body).
  % Ask the user process Pid for the id of the member it currently holds.
  % Sends {get_tc_id, self()} and blocks (no timeout) until a two-element
  % tuple shows up in the caller's mailbox, which is returned unchanged.
  user_id(Pid) ->
      erlang:send(Pid, {get_tc_id, self()}),
      receive
          {_Type, _Id} = Reply ->
              Reply
      end.
  % Tell the user process Pid to return its member and take a new one.
  % Fire-and-forget: returns the message that was sent (new_tc).
  user_new_tc(Pid) ->
      erlang:send(Pid, new_tc).
  % Tell the user process Pid to return its member and exit normally.
  % Fire-and-forget: returns the message that was sent (stop).
  user_stop(Pid) ->
      erlang:send(Pid, stop).
  % Tell the user process Pid to crash (it raises {user_loop, kaboom}).
  % Fire-and-forget: returns the message that was sent (crash).
  user_crash(Pid) ->
      erlang:send(Pid, crash).
  % Main loop of a simulated pooler consumer.
  %
  % The argument is either a marker atom (`start' or `error_no_members'),
  % in which case the loop (re)tries to take a member from test_pool_1, or
  % the member currently held. While holding a member the process serves:
  %   {get_tc_id, From}  - reply with pooled_gs:get_id/1 of the member
  %   {ping_tc, From}    - reply with pooled_gs:ping/1 of the member
  %   {ping_count, From} - reply with pooled_gs:ping_count/1 of the member
  %   new_tc             - return the member with status ok, take another
  %   stop               - return the member with status ok, finish (stopped)
  %   crash              - raise {user_loop, kaboom}
  user_loop(start) ->
      user_loop(pooler:take_member(test_pool_1));
  user_loop(error_no_members) ->
      %% pool had nothing to hand out; keep asking until it does
      user_loop(pooler:take_member(test_pool_1));
  user_loop(Member) ->
      receive
          {get_tc_id, Caller} ->
              IdReply = pooled_gs:get_id(Member),
              Caller ! IdReply,
              user_loop(Member);
          {ping_tc, Caller} ->
              PingReply = pooled_gs:ping(Member),
              Caller ! PingReply,
              user_loop(Member);
          {ping_count, Caller} ->
              CountReply = pooled_gs:ping_count(Member),
              Caller ! CountReply,
              user_loop(Member);
          new_tc ->
              pooler:return_member(test_pool_1, Member, ok),
              user_loop(pooler:take_member(test_pool_1));
          stop ->
              pooler:return_member(test_pool_1, Member, ok),
              stopped;
          crash ->
              erlang:error({user_loop, kaboom})
      end.
  44. % The `tc' processes represent the pids tracked by pooler for testing.
  45. % They have a type and an ID and can report their type and ID and
  46. % stop.
  % Receive loop of a hand-rolled test member identified by {Type, Id}.
  %   {get_id, From} - reply {ok, Type, Id} to From and keep looping
  %   stop           - leave the loop, returning stopped
  %   crash          - raise {tc_loop, kaboom}
  tc_loop({Type, Id} = Identity) ->
      receive
          {get_id, Requester} ->
              Requester ! {ok, Type, Id},
              tc_loop(Identity);
          stop ->
              stopped;
          crash ->
              erlang:error({tc_loop, kaboom})
      end.
  % Query a tc process for its identity.
  % Sends {get_id, self()} to Pid and waits up to 200 ms for an
  % {ok, Type, Id} reply. Returns {Type, Id}, or the atom timeout when no
  % such reply arrives in time.
  get_tc_id(Pid) ->
      erlang:send(Pid, {get_id, self()}),
      receive
          {ok, Type, Id} ->
              {Type, Id}
      after 200 ->
          timeout
      end.
  % Ask the tc process Pid to leave its loop. Fire-and-forget: returns the
  % message that was sent (stop).
  stop_tc(Pid) ->
      erlang:send(Pid, stop).
  % Start a tc process linked to the caller. Its identity is {Type, Ref},
  % where Ref is a fresh reference created here. Returns the new pid.
  tc_starter(Type) ->
      Identity = {Type, make_ref()},
      spawn_link(fun() -> tc_loop(Identity) end).
  % Assert that Pid answers get_tc_id/1 with a two-element tuple (and not
  % with timeout). Returns ok when the assertion holds.
  assert_tc_valid(Pid) ->
      Reported = get_tc_id(Pid),
      ?assertMatch({_Type, _Ref}, Reported),
      ok.
  72. % tc_sanity_test() ->
  73. % Pid1 = tc_starter("1"),
  74. % {"1", Id1} = get_tc_id(Pid1),
  75. % Pid2 = tc_starter("1"),
  76. % {"1", Id2} = get_tc_id(Pid2),
  77. % ?assertNot(Id1 == Id2),
  78. % stop_tc(Pid1),
  79. % stop_tc(Pid2).
  80. % user_sanity_test() ->
  81. % Pid1 = tc_starter("1"),
  82. % User = spawn(fun() -> user_loop(Pid1) end),
  83. % ?assertMatch({"1", _Ref}, user_id(User)),
  84. % user_crash(User),
  85. % stop_tc(Pid1).
  % EUnit generator covering the single-pool API of pooler.
  %
  % The outer `setup' fixture points pooler's metrics_module at fake_metrics
  % and starts/stops fake_metrics once for the whole group. The inner
  % `foreach' fixture configures one pool (test_pool_1, init_count 2,
  % max_count 3, members started through pooled_gs:start_link/1) and starts
  % and stops the pooler application around every individual test.
  pooler_basics_test_() ->
      {setup,
       fun() ->
               application:set_env(pooler, metrics_module, fake_metrics),
               fake_metrics:start_link()
       end,
       fun(_X) ->
               fake_metrics:stop()
       end,
       {foreach,
        % setup
        fun() ->
                Pools = [[{name, test_pool_1},
                          {max_count, 3},
                          {init_count, 2},
                          {start_mfa,
                           {pooled_gs, start_link, [{"type-0"}]}}]],
                application:set_env(pooler, pools, Pools),
                error_logger:delete_report_handler(error_logger_tty_h),
                application:start(crypto),
                application:start(pooler)
        end,
        % cleanup
        fun(_X) ->
                application:stop(pooler)
        end,
        [
         {"there are init_count members at start",
          fun() ->
                  Stats = [ P || {P, {_, free, _}} <- pooler:pool_stats(test_pool_1) ],
                  ?assertEqual(2, length(Stats))
          end},

         {"take and return one",
          fun() ->
                  P = pooler:take_member(test_pool_1),
                  ?assertMatch({"type-0", _Id}, pooled_gs:get_id(P)),
                  ok = pooler:return_member(test_pool_1, P, ok)
          end},

         {"take and return one, named pool",
          fun() ->
                  P = pooler:take_member(test_pool_1),
                  ?assertMatch({"type-0", _Id}, pooled_gs:get_id(P)),
                  %% match on the result so a failed return fails the test
                  %% (this used to read `ok, ...', which checked nothing)
                  ok = pooler:return_member(test_pool_1, P)
          end},

         {"attempt to take form unknown pool",
          fun() ->
                  %% since pools are now servers, calling an unknown pool
                  %% exits with noproc
                  ?assertExit({noproc, _}, pooler:take_member(bad_pool_name))
          end},

         {"members creation is triggered after pool exhaustion until max",
          fun() ->
                  %% init count is 2
                  Pids0 = [pooler:take_member(test_pool_1), pooler:take_member(test_pool_1)],
                  %% since new member creation is async, can only assert
                  %% that we will get a pid, but may not be first try.
                  Pids = get_n_pids(1, Pids0),
                  %% pool is at max now, requests should give error
                  ?assertEqual(error_no_members, pooler:take_member(test_pool_1)),
                  ?assertEqual(error_no_members, pooler:take_member(test_pool_1)),
                  PRefs = [ R || {_T, R} <- [ pooled_gs:get_id(P) || P <- Pids ] ],
                  % no duplicates
                  ?assertEqual(length(PRefs), length(lists:usort(PRefs)))
          end
         },

         {"pids are reused most recent return first",
          fun() ->
                  P1 = pooler:take_member(test_pool_1),
                  P2 = pooler:take_member(test_pool_1),
                  ?assertNot(P1 == P2),
                  ok = pooler:return_member(test_pool_1, P1, ok),
                  ok = pooler:return_member(test_pool_1, P2, ok),
                  % pids are reused most recent first
                  ?assertEqual(P2, pooler:take_member(test_pool_1)),
                  ?assertEqual(P1, pooler:take_member(test_pool_1))
          end},

         {"if an in-use pid crashes it is replaced",
          fun() ->
                  Pids0 = get_n_pids(3, []),
                  Ids0 = [ pooled_gs:get_id(P) || P <- Pids0 ],
                  % crash them all
                  [ pooled_gs:crash(P) || P <- Pids0 ],
                  Pids1 = get_n_pids(3, []),
                  Ids1 = [ pooled_gs:get_id(P) || P <- Pids1 ],
                  [ ?assertNot(lists:member(I, Ids0)) || I <- Ids1 ]
          end
         },

         {"if a free pid crashes it is replaced",
          fun() ->
                  FreePids = [ P || {P, {_, free, _}} <- pooler:pool_stats(test_pool_1) ],
                  [ exit(P, kill) || P <- FreePids ],
                  Pids1 = get_n_pids(3, []),
                  ?assertEqual(3, length(Pids1))
          end},

         {"if a pid is returned with bad status it is replaced",
          fun() ->
                  Pids0 = get_n_pids(3, []),
                  Ids0 = [ pooled_gs:get_id(P) || P <- Pids0 ],
                  % return them all marking as bad
                  [ pooler:return_member(test_pool_1, P, fail) || P <- Pids0 ],
                  Pids1 = get_n_pids(3, []),
                  Ids1 = [ pooled_gs:get_id(P) || P <- Pids1 ],
                  [ ?assertNot(lists:member(I, Ids0)) || I <- Ids1 ]
          end
         },

         {"if a consumer crashes, pid is replaced",
          fun() ->
                  Consumer = start_user(),
                  StartId = user_id(Consumer),
                  user_crash(Consumer),
                  NewPid = hd(get_n_pids(1, [])),
                  NewId = pooled_gs:get_id(NewPid),
                  ?assertNot(NewId == StartId)
          end
         },

         {"it is ok to return an unknown pid",
          fun() ->
                  Bogus1 = spawn(fun() -> ok end),
                  Bogus2 = spawn(fun() -> ok end),
                  ?assertEqual(ok, pooler:return_member(test_pool_1, Bogus1, ok)),
                  ?assertEqual(ok, pooler:return_member(test_pool_1, Bogus2, fail))
          end
         },

         {"calling return_member on error_no_members is ignored",
          fun() ->
                  ?assertEqual(ok, pooler:return_member(test_pool_1, error_no_members)),
                  ?assertEqual(ok, pooler:return_member(test_pool_1, error_no_members, ok)),
                  ?assertEqual(ok, pooler:return_member(test_pool_1, error_no_members, fail))
          end
         },

         {"metrics have been called",
          fun() ->
                  %% exercise the API to ensure we have certain keys reported as metrics
                  fake_metrics:reset_metrics(),
                  Pids = [ pooler:take_member(test_pool_1) || _I <- lists:seq(1, 10) ],
                  [ pooler:return_member(test_pool_1, P) || P <- Pids ],
                  catch pooler:take_member(bad_pool_name),
                  %% kill an unused member
                  exit(hd(Pids), kill),
                  %% kill a used member
                  KillMe = pooler:take_member(test_pool_1),
                  exit(KillMe, kill),
                  %% FIXME: We need to wait for pooler to process the
                  %% exit message. This is ugly, will fix later.
                  timer:sleep(200),                   % :(
                  ExpectKeys = lists:sort([<<"pooler.test_pool_1.error_no_members_count">>,
                                           <<"pooler.test_pool_1.events">>,
                                           <<"pooler.test_pool_1.free_count">>,
                                           <<"pooler.test_pool_1.in_use_count">>,
                                           <<"pooler.test_pool_1.killed_free_count">>,
                                           <<"pooler.test_pool_1.killed_in_use_count">>,
                                           <<"pooler.test_pool_1.take_rate">>]),
                  Metrics = fake_metrics:get_metrics(),
                  GotKeys = lists:usort([ Name || {Name, _, _} <- Metrics ]),
                  ?assertEqual(ExpectKeys, GotKeys)
          end}
        ]}}.
  % EUnit generator for the pool-group API.
  %
  % fake_metrics is started once around the whole group. Before every test
  % three pools are configured (init_count 2, max_count 3 each): test_pool_1
  % and test_pool_2 belong to group_1 and hand out members of type
  % "type-1-1" / "type-1-2"; test_pool_3 has group `undefined'. crypto, pg2
  % and pooler are then started; pooler is stopped after every test.
  pooler_groups_test_() ->
      StartMetrics =
          fun() ->
                  application:set_env(pooler, metrics_module, fake_metrics),
                  fake_metrics:start_link()
          end,
      StopMetrics =
          fun(_X) ->
                  fake_metrics:stop()
          end,
      StartPools =
          fun() ->
                  GroupPoolA = [{name, test_pool_1},
                                {group, group_1},
                                {max_count, 3},
                                {init_count, 2},
                                {start_mfa,
                                 {pooled_gs, start_link, [{"type-1-1"}]}}],
                  GroupPoolB = [{name, test_pool_2},
                                {group, group_1},
                                {max_count, 3},
                                {init_count, 2},
                                {start_mfa,
                                 {pooled_gs, start_link, [{"type-1-2"}]}}],
                  %% test_pool_3 not part of the group
                  LonePool = [{name, test_pool_3},
                              {group, undefined},
                              {max_count, 3},
                              {init_count, 2},
                              {start_mfa,
                               {pooled_gs, start_link, [{"type-3"}]}}],
                  application:set_env(pooler, pools,
                                      [GroupPoolA, GroupPoolB, LonePool]),
                  application:start(crypto),
                  pg2:start(),
                  application:start(pooler)
          end,
      StopPools =
          fun(_X) ->
                  application:stop(pooler)
          end,
      GroupTests =
          [
           {"take and return one group member (repeated)",
            fun() ->
                    TakeAndReturn =
                        fun(_I) ->
                                Member = pooler:take_group_member(group_1),
                                {Type, _} = pooled_gs:get_id(Member),
                                ?assertMatch("type-1" ++ _, Type),
                                ok = pooler:return_group_member(group_1, Member, ok),
                                Type
                        end,
                    Types = lists:map(TakeAndReturn, lists:seq(1, 50)),
                    %% over 50 rounds both pools of the group must be hit
                    FromPoolA = [ T || T <- Types, T =:= "type-1-1" ],
                    FromPoolB = [ T || T <- Types, T =:= "type-1-2" ],
                    ?assert(length(FromPoolA) > 0),
                    ?assert(length(FromPoolB) > 0)
            end},

           {"take member from unknown group",
            fun() ->
                    Result = pooler:take_group_member(not_a_group),
                    ?assertEqual({error, {no_such_group, not_a_group}}, Result)
            end},

           {"return member to group, implied ok",
            fun() ->
                    Member = pooler:take_group_member(group_1),
                    ?assertEqual(ok, pooler:return_group_member(group_1, Member))
            end},

           {"return error_no_member to group",
            fun() ->
                    Result = pooler:return_group_member(group_1, error_no_members),
                    ?assertEqual(ok, Result)
            end},

           {"exhaust pools in group",
            fun() ->
                    Members = get_n_pids_group(group_1, 6, []),
                    %% they should all be pids
                    lists:foreach(
                      fun(Member) ->
                              {Type, _} = pooled_gs:get_id(Member),
                              ?assertMatch("type-1" ++ _, Type),
                              ok
                      end, Members),
                    %% further attempts should be error
                    Attempts = lists:map(
                                 fun(_I) -> pooler:take_group_member(group_1) end,
                                 lists:seq(1, 3)),
                    [error_no_members,
                     error_no_members,
                     error_no_members] = Attempts
            end}
          ],
      {setup, StartMetrics, StopMetrics,
       {foreach, StartPools, StopPools, GroupTests}}.
  % EUnit generator for a pool whose members are started with
  % pooled_gs:start_link(crash) (init_count and max_count both 10).
  % NOTE(review): presumably pooled_gs fails to start when given `crash';
  % confirm against pooled_gs. The test starts pooler and asserts that
  % take_member/1 answers error_no_members on two consecutive calls.
  % pooler is stopped in the cleanup.
  pooler_limit_failed_adds_test_() ->
      Configure =
          fun() ->
                  CrashingPool = [{name, test_pool_1},
                                  {max_count, 10},
                                  {init_count, 10},
                                  {start_mfa,
                                   {pooled_gs, start_link, [crash]}}],
                  application:set_env(pooler, pools, [CrashingPool])
          end,
      Teardown =
          fun(_) ->
                  application:stop(pooler)
          end,
      NoMembersTwice =
          fun() ->
                  application:start(pooler),
                  FirstTry = pooler:take_member(test_pool_1),
                  ?assertEqual(error_no_members, FirstTry),
                  SecondTry = pooler:take_member(test_pool_1),
                  ?assertEqual(error_no_members, SecondTry)
          end,
      {setup, Configure, Teardown, NoMembersTwice}.
  % EUnit generator for scheduled culling.
  %
  % A single setup starts fake_metrics and a pool (test_pool_1, init_count
  % 2, max_count 10) configured with cull_interval {200, ms}. Each test
  % compares the number of entries in pooler:pool_stats/1 before and after
  % sleeping 250 ms, i.e. slightly longer than the cull interval.
  pooler_scheduled_cull_test_() ->
      %% number of members pooler currently reports for the pool
      PoolSize =
          fun() ->
                  length(pooler:pool_stats(test_pool_1))
          end,
      ReturnAll =
          fun(Members) ->
                  [ pooler:return_member(test_pool_1, M) || M <- Members ]
          end,
      %% grow the pool to 10, hand everything back, and expect the pool
      %% to be back at 2 members after the cull delay has passed
      GrowReturnAndWait =
          fun() ->
                  %% take all members
                  Taken = get_n_pids(test_pool_1, 10, []),
                  %% return all
                  ReturnAll(Taken),
                  ?assertEqual(10, PoolSize()),
                  %% wait for longer than cull delay
                  timer:sleep(250),
                  ?assertEqual(2, PoolSize())
          end,
      Start =
          fun() ->
                  application:set_env(pooler, metrics_module, fake_metrics),
                  fake_metrics:start_link(),
                  CulledPool = [{name, test_pool_1},
                                {max_count, 10},
                                {init_count, 2},
                                {start_mfa, {pooled_gs, start_link, [{"type-0"}]}},
                                {cull_interval, {200, ms}}],
                  application:set_env(pooler, pools, [CulledPool]),
                  application:start(pooler)
          end,
      Stop =
          fun(_X) ->
                  fake_metrics:stop(),
                  application:stop(pooler)
          end,
      {setup, Start, Stop,
       [{"excess members are culled repeatedly",
         fun() ->
                 GrowReturnAndWait(),
                 %% repeat the test to verify that culling gets rescheduled.
                 GrowReturnAndWait()
         end
        },

        {"non-excess members are not culled",
         fun() ->
                 First = pooler:take_member(test_pool_1),
                 Second = pooler:take_member(test_pool_1),
                 ReturnAll([First, Second]),
                 ?assertEqual(2, PoolSize()),
                 timer:sleep(250),
                 ?assertEqual(2, PoolSize())
         end
        },

        {"in-use members are not culled",
         fun() ->
                 %% take all members
                 Held = get_n_pids(test_pool_1, 10, []),
                 %% don't return any
                 ?assertEqual(10, PoolSize()),
                 %% wait for longer than cull delay
                 timer:sleep(250),
                 ?assertEqual(10, PoolSize()),
                 ReturnAll(Held)
         end}
       ]}.
  % EUnit generator checking that a pool keeps serving after receiving
  % messages it does not understand.
  %
  % Setup starts pooler with one pool (test_pool_1, init_count 1, max_count
  % 2) and then delivers {unexpected_garbage_msg, N} to the pool process
  % three ways: as a gen_server call (from a throw-away process), as a
  % gen_server cast, and as a plain message. The single test then takes a
  % member and checks that its type is "type-0".
  random_message_test_() ->
      Start =
          fun() ->
                  SmallPool = [{name, test_pool_1},
                               {max_count, 2},
                               {init_count, 1},
                               {start_mfa,
                                {pooled_gs, start_link, [{"type-0"}]}}],
                  application:set_env(pooler, pools, [SmallPool]),
                  error_logger:delete_report_handler(error_logger_tty_h),
                  application:start(pooler),
                  %% now send some bogus messages
                  %% do the call in a throw-away process to avoid timeout error
                  BogusCall =
                      fun() ->
                              catch gen_server:call(test_pool_1, {unexpected_garbage_msg, 5})
                      end,
                  spawn(BogusCall),
                  gen_server:cast(test_pool_1, {unexpected_garbage_msg, 6}),
                  whereis(test_pool_1) ! {unexpected_garbage_msg, 7},
                  ok
          end,
      Stop =
          fun(_) ->
                  application:stop(pooler)
          end,
      StillServesMembers =
          fun() ->
                  Member = pooler:take_member(test_pool_1),
                  {Type, _} = pooled_gs:get_id(Member),
                  ?assertEqual("type-0", Type)
          end,
      {setup, Start, Stop, [StillServesMembers]}.
  % EUnit generator driving pooler through ten concurrent user processes.
  %
  % Before every test pooler is started with one pool (test_pool_1,
  % init_count 10, max_count 10) and ten user processes are spawned via
  % start_user/0; the list of user pids is handed to each test. Afterwards
  % every user is sent `stop' and pooler is stopped.
  pooler_integration_test_() ->
      %% sorted list of the member ids reported by the given users
      SortedIds =
          fun(UserPids) ->
                  lists:sort([ user_id(U) || U <- UserPids ])
          end,
      Start =
          fun() ->
                  FullPool = [{name, test_pool_1},
                              {max_count, 10},
                              {init_count, 10},
                              {start_mfa,
                               {pooled_gs, start_link, [{"type-0"}]}}],
                  application:set_env(pooler, pools, [FullPool]),
                  error_logger:delete_report_handler(error_logger_tty_h),
                  application:start(pooler),
                  [ start_user() || _X <- lists:seq(1, 10) ]
          end,
      Stop =
          fun(Users) ->
                  [ user_stop(U) || U <- Users ],
                  application:stop(pooler)
          end,
      EachUserHasOwnMember =
          fun(Users) ->
                  fun() ->
                          % each user has a different tc ID
                          Ids = SortedIds(Users),
                          ?assertEqual(lists:usort(Ids), Ids)
                  end
          end,
      UniqueAfterRenew =
          fun(Users) ->
                  fun() ->
                          % users still unique after a renew cycle
                          [ user_new_tc(U) || U <- Users ],
                          Ids = SortedIds(Users),
                          ?assertEqual(lists:usort(Ids), Ids)
                  end
          end,
      ReplacedAfterCrash =
          fun(Users) ->
                  fun() ->
                          % all users crash, pids are replaced
                          IdsBefore = SortedIds(Users),
                          [ user_crash(U) || U <- Users ],
                          FreshUsers = [ start_user() || _X <- lists:seq(1, 5) ],
                          IdsAfter = SortedIds(FreshUsers),
                          SetBefore = sets:from_list(IdsBefore),
                          SetAfter = sets:from_list(IdsAfter),
                          Shared = sets:to_list(
                                     sets:intersection([SetBefore, SetAfter])),
                          ?assertEqual([], Shared)
                  end
          end,
      {foreach, Start, Stop,
       [EachUserHasOwnMember, UniqueAfterRenew, ReplacedAfterCrash]}.
  % EUnit generator for pooler:time_as_millis/1: one lazy assertion per
  % {Input, Expected} pair. Inputs are {Amount, Unit} tuples with Unit one
  % of min, sec, ms, mu; the expected values show sub-millisecond inputs
  % giving 0 ({1, mu} -> 0) and {3000, mu} giving 3.
  time_as_millis_test_() ->
      Units = [min, sec, ms, mu],
      ZeroCases = lists:map(fun(Unit) -> {{0, Unit}, 0} end, Units),
      UnitCases = [{{1, min}, 60000},
                   {{1, sec}, 1000},
                   {{1, ms}, 1},
                   {{1, mu}, 0}],
      MiscCases = [{{3000, mu}, 3}],
      ToAssertion =
          fun({Input, Expected}) ->
                  ?_assertEqual(Expected, pooler:time_as_millis(Input))
          end,
      lists:map(ToAssertion, ZeroCases ++ UnitCases ++ MiscCases).
  % EUnit generator for pooler:time_as_micros/1: one lazy assertion per
  % {Input, Expected} pair. Inputs are {Amount, Unit} tuples with Unit one
  % of min, sec, ms, mu; expected values are in microseconds.
  time_as_micros_test_() ->
      Units = [min, sec, ms, mu],
      ZeroCases = lists:map(fun(Unit) -> {{0, Unit}, 0} end, Units),
      UnitCases = [{{1, min}, 60000000},
                   {{1, sec}, 1000000},
                   {{1, ms}, 1000},
                   {{1, mu}, 1}],
      MiscCases = [{{3000, mu}, 3000}],
      ToAssertion =
          fun({Input, Expected}) ->
                  ?_assertEqual(Expected, pooler:time_as_micros(Input))
          end,
      lists:map(ToAssertion, ZeroCases ++ UnitCases ++ MiscCases).
  508. % testing crash recovery means race conditions when either pids
  509. % haven't yet crashed or pooler hasn't recovered. So this helper loops
  510. % forever until N pids are obtained, ignoring error_no_members.
  % Convenience form of get_n_pids/3 that always draws from test_pool_1.
  % Returns Acc with N newly taken members prepended.
  get_n_pids(N, Acc) ->
      DefaultPool = test_pool_1,
      get_n_pids(DefaultPool, N, Acc).
  % Take N members from Pool, prepending each one to Acc.
  % An error_no_members answer is ignored and the take is retried
  % immediately, so this loops without bound until N members have been
  % obtained. Returns the extended accumulator (most recent take first).
  get_n_pids(_Pool, 0, Acc) ->
      Acc;
  get_n_pids(Pool, N, Acc) ->
      Taken = pooler:take_member(Pool),
      case Taken =:= error_no_members of
          true ->
              get_n_pids(Pool, N, Acc);
          false ->
              get_n_pids(Pool, N - 1, [Taken | Acc])
      end.
  % Take N members from the pools of Group, prepending each one to Acc.
  % An error_no_members answer is ignored and the take is retried
  % immediately, so this loops without bound until N members have been
  % obtained. Returns the extended accumulator (most recent take first).
  %
  % Only pids are accepted as members. Any other answer from
  % pooler:take_group_member/1, such as {error, {no_such_group, Group}},
  % crashes with case_clause instead of being collected as if it were a
  % member.
  get_n_pids_group(_Group, 0, Acc) ->
      Acc;
  get_n_pids_group(Group, N, Acc) ->
      case pooler:take_group_member(Group) of
          error_no_members ->
              get_n_pids_group(Group, N, Acc);
          Pid when is_pid(Pid) ->
              get_n_pids_group(Group, N - 1, [Pid|Acc])
      end.