sam_test_agent.c 30 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252
  1. /*
  2. * Copyright (c) 2009-2011 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Jan Friesse (jfriesse@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of the Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. /*
  35. * Provides test of SAM API
  36. */
  37. #include <config.h>
  38. #include <stdio.h>
  39. #include <stdint.h>
  40. #include <stdlib.h>
  41. #include <unistd.h>
  42. #include <pthread.h>
  43. #include <limits.h>
  44. #include <sys/types.h>
  45. #include <sys/socket.h>
  46. #include <netinet/in.h>
  47. #include <arpa/inet.h>
  48. #include <netdb.h>
  49. #include <sys/un.h>
  50. #include <corosync/corotypes.h>
  51. #include <corosync/sam.h>
  52. #include <signal.h>
  53. #include <string.h>
  54. #include <sys/wait.h>
  55. #include <corosync/cmap.h>
  56. #include "common_test_agent.h"
  57. extern const char *__progname;
  58. static int test2_sig_delivered = 0;
  59. static int test5_hc_cb_count = 0;
  60. static int test6_sig_delivered = 0;
  61. /*
  62. * First test will just register SAM, with policy restart. First instance will
  63. * sleep one second, send hc and sleep another 3 seconds. This should force restart.
  64. * Second instance will sleep one second, send hc, stop hc and sleep 3 seconds.
  65. * Then start hc again and sleep 3 seconds. This should force restart again.
  66. * Last instance just calls initialize again. This should end with error.
  67. * Then call start, followed by stop and start again. Finally, we will call finalize
  68. * twice. One should succeed, second should fail. After this, we will call every function
  69. * (none should succeed).
  70. */
  71. static int test1 (void)
  72. {
  73. cs_error_t error;
  74. unsigned int instance_id;
  75. int i;
  76. qb_enter();
  77. error = sam_initialize (2000, SAM_RECOVERY_POLICY_RESTART);
  78. if (error != CS_OK) {
  79. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  80. return 1;
  81. }
  82. qb_log (LOG_INFO, "register");
  83. error = sam_register (&instance_id);
  84. if (error != CS_OK) {
  85. qb_log (LOG_ERR, "Can't register. Error %d", error);
  86. return 1;
  87. }
  88. if (instance_id == 1 || instance_id == 2) {
  89. qb_log (LOG_INFO, "iid %d: start", instance_id);
  90. error = sam_start ();
  91. if (error != CS_OK) {
  92. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  93. return 1;
  94. }
  95. for (i = 0; i < 10; i++) {
  96. qb_log (LOG_INFO, "iid %d: sleep 1", instance_id);
  97. sleep (1);
  98. qb_log (LOG_INFO, "iid %d: hc send", instance_id);
  99. error = sam_hc_send ();
  100. if (error != CS_OK) {
  101. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  102. return 1;
  103. }
  104. }
  105. if (instance_id == 2) {
  106. qb_log (LOG_INFO, "iid %d: stop", instance_id);
  107. error = sam_stop ();
  108. if (error != CS_OK) {
  109. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  110. return 1;
  111. }
  112. }
  113. qb_log (LOG_INFO, "iid %d: sleep 3", instance_id);
  114. sleep (3);
  115. qb_log (LOG_INFO, "iid %d: start", instance_id);
  116. error = sam_start ();
  117. if (error != CS_OK) {
  118. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  119. return 1;
  120. }
  121. qb_log (LOG_INFO, "iid %d: sleep 3", instance_id);
  122. sleep (3);
  123. return 0;
  124. }
  125. if (instance_id == 3) {
  126. error = sam_initialize (2000, SAM_RECOVERY_POLICY_RESTART);
  127. if (error == CS_OK) {
  128. qb_log (LOG_ERR, "Can initialize SAM API after initialization");
  129. return 1;
  130. }
  131. error = sam_start ();
  132. if (error != CS_OK) {
  133. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  134. return 1;
  135. }
  136. error = sam_stop ();
  137. if (error != CS_OK) {
  138. qb_log (LOG_ERR, "Can't stop hc. Error %d", error);
  139. return 1;
  140. }
  141. error = sam_finalize ();
  142. if (error != CS_OK) {
  143. qb_log (LOG_ERR, "Can't finalize sam. Error %d", error);
  144. return 1;
  145. }
  146. error = sam_finalize ();
  147. if (error == CS_OK) {
  148. qb_log (LOG_ERR, "Can finalize sam after finalization!");
  149. return 1;
  150. }
  151. if (sam_initialize (2, SAM_RECOVERY_POLICY_RESTART) == CS_OK ||
  152. sam_start () == CS_OK || sam_stop () == CS_OK ||
  153. sam_register (NULL) == CS_OK || sam_hc_send () == CS_OK ||
  154. sam_hc_callback_register (NULL) == CS_OK) {
  155. qb_log (LOG_ERR, "Can call one of function after finalization!");
  156. return 1;
  157. }
  158. return 0;
  159. }
  160. return 1;
  161. }
  162. static void test2_signal (int sig)
  163. {
  164. qb_enter();
  165. test2_sig_delivered = 1;
  166. }
  167. /*
  168. * This tests recovery policy quit and callback.
  169. */
  170. static int test2 (void) {
  171. cs_error_t error;
  172. unsigned int instance_id;
  173. qb_enter();
  174. error = sam_initialize (2000, SAM_RECOVERY_POLICY_QUIT);
  175. if (error != CS_OK) {
  176. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  177. return 1;
  178. }
  179. qb_log (LOG_INFO, "register");
  180. error = sam_register (&instance_id);
  181. if (error != CS_OK) {
  182. qb_log (LOG_ERR, "Can't register. Error %d", error);
  183. return 1;
  184. }
  185. if (instance_id == 1) {
  186. signal (SIGTERM, test2_signal);
  187. qb_log (LOG_INFO, "iid %d: start", instance_id);
  188. error = sam_start ();
  189. if (error != CS_OK) {
  190. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  191. return 1;
  192. }
  193. qb_log (LOG_INFO, "iid %d: sleep 1", instance_id);
  194. sleep (1);
  195. qb_log (LOG_INFO, "iid %d: hc send", instance_id);
  196. error = sam_hc_send ();
  197. if (error != CS_OK) {
  198. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  199. return 1;
  200. }
  201. qb_log (LOG_INFO, "iid %d: wait for delivery of signal", instance_id);
  202. while (!test2_sig_delivered) {
  203. sleep (1);
  204. }
  205. qb_log (LOG_INFO, "iid %d: wait for real kill", instance_id);
  206. sleep (3);
  207. }
  208. return 1;
  209. }
  210. /*
  211. * Smoke test. Better to turn off coredump ;) This has no time limit, just restart process
  212. * when it dies.
  213. */
  214. static int test3 (void) {
  215. cs_error_t error;
  216. unsigned int instance_id;
  217. qb_log (LOG_INFO, "initialize");
  218. error = sam_initialize (0, SAM_RECOVERY_POLICY_RESTART);
  219. if (error != CS_OK) {
  220. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  221. return 1;
  222. }
  223. qb_log (LOG_INFO, "register");
  224. error = sam_register (&instance_id);
  225. if (error != CS_OK) {
  226. qb_log (LOG_ERR, "Can't register. Error %d", error);
  227. return 1;
  228. }
  229. if (instance_id < 100) {
  230. qb_log (LOG_INFO, "iid %d: start", instance_id);
  231. error = sam_start ();
  232. if (error != CS_OK) {
  233. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  234. return 1;
  235. }
  236. qb_log (LOG_INFO, "iid %d: Sending signal", instance_id);
  237. kill(getpid(), SIGSEGV);
  238. return 1;
  239. }
  240. return 0;
  241. }
  242. /*
  243. * Test sam_data_store, sam_data_restore and sam_data_getsize
  244. */
  245. static int test4 (void)
  246. {
  247. size_t size;
  248. cs_error_t err;
  249. int i;
  250. unsigned int instance_id;
  251. char saved_data[128];
  252. char saved_data2[128];
  253. qb_log (LOG_INFO, "sam_data_getsize 1");
  254. err = sam_data_getsize (&size);
  255. if (err != CS_ERR_BAD_HANDLE) {
  256. qb_log (LOG_ERR, "Test should return CS_ERR_BAD_HANDLE. Error returned %d", err);
  257. return 1;
  258. }
  259. qb_log (LOG_INFO, "sam_data_getsize 2");
  260. err = sam_data_getsize (NULL);
  261. if (err != CS_ERR_INVALID_PARAM) {
  262. qb_log (LOG_ERR, "Test should return CS_ERR_INVALID_PARAM. Error returned %d", err);
  263. return 1;
  264. }
  265. qb_log (LOG_INFO, "sam_data_store 1");
  266. err = sam_data_store (NULL, 0);
  267. if (err != CS_ERR_BAD_HANDLE) {
  268. qb_log (LOG_ERR, "Test should return CS_ERR_BAD_HANDLE. Error returned %d", err);
  269. return 1;
  270. }
  271. qb_log (LOG_INFO, "sam_data_restore 1");
  272. err = sam_data_restore (saved_data, sizeof (saved_data));
  273. if (err != CS_ERR_BAD_HANDLE) {
  274. qb_log (LOG_ERR, "Test should return CS_ERR_BAD_HANDLE. Error returned %d", err);
  275. return 1;
  276. }
  277. qb_log (LOG_INFO, "sam_initialize");
  278. err = sam_initialize (0, SAM_RECOVERY_POLICY_RESTART);
  279. if (err != CS_OK) {
  280. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", err);
  281. return 1;
  282. }
  283. qb_log (LOG_INFO, "sam_data_getsize 3");
  284. err = sam_data_getsize (&size);
  285. if (err != CS_OK) {
  286. qb_log (LOG_ERR, "Test should return CS_ERR_BAD_HANDLE. Error returned %d", err);
  287. return 1;
  288. }
  289. if (size != 0) {
  290. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  291. return 1;
  292. }
  293. qb_log (LOG_INFO, "sam_data_restore 2");
  294. err = sam_data_restore (NULL, sizeof (saved_data));
  295. if (err != CS_ERR_INVALID_PARAM) {
  296. qb_log (LOG_ERR, "Test should return CS_ERR_INVALID_PARAM. Error returned %d", err);
  297. return 1;
  298. }
  299. /*
  300. * Store some real data
  301. */
  302. for (i = 0; i < sizeof (saved_data); i++) {
  303. saved_data[i] = (char)(i + 5);
  304. }
  305. qb_log (LOG_INFO, "sam_data_store 2");
  306. err = sam_data_store (saved_data, sizeof (saved_data));
  307. if (err != CS_OK) {
  308. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  309. return 1;
  310. }
  311. qb_log (LOG_INFO, " sam_data_getsize 4");
  312. err = sam_data_getsize (&size);
  313. if (err != CS_OK) {
  314. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  315. return 1;
  316. }
  317. if (size != sizeof (saved_data)) {
  318. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  319. return 1;
  320. }
  321. qb_log (LOG_INFO, " sam_data_restore 3");
  322. err = sam_data_restore (saved_data2, sizeof (saved_data2) - 1);
  323. if (err != CS_ERR_INVALID_PARAM) {
  324. qb_log (LOG_ERR, "Test should return CS_ERR_INVALID_PARAM. Error returned %d", err);
  325. return 1;
  326. }
  327. qb_log (LOG_INFO, " sam_data_restore 4");
  328. err = sam_data_restore (saved_data2, sizeof (saved_data2));
  329. if (err != CS_OK) {
  330. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  331. return 1;
  332. }
  333. if (memcmp (saved_data, saved_data2, sizeof (saved_data2)) != 0) {
  334. qb_log (LOG_ERR, "Retored data are not same");
  335. return 1;
  336. }
  337. memset (saved_data2, 0, sizeof (saved_data2));
  338. qb_log (LOG_INFO, " sam_data_store 3");
  339. err = sam_data_store (NULL, 1);
  340. if (err != CS_OK) {
  341. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  342. return 1;
  343. }
  344. qb_log (LOG_INFO, " sam_data_getsize 5");
  345. err = sam_data_getsize (&size);
  346. if (err != CS_OK) {
  347. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  348. return 1;
  349. }
  350. if (size != 0) {
  351. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  352. return 1;
  353. }
  354. qb_log (LOG_INFO, " sam_data_store 4");
  355. err = sam_data_store (saved_data, sizeof (saved_data));
  356. if (err != CS_OK) {
  357. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  358. return 1;
  359. }
  360. qb_log (LOG_INFO, " register");
  361. err = sam_register (&instance_id);
  362. if (err != CS_OK) {
  363. qb_log (LOG_ERR, "Can't register. Error %d", err);
  364. return 1;
  365. }
  366. if (instance_id == 1) {
  367. qb_log (LOG_INFO, "iid %d: sam_start", instance_id);
  368. err = sam_start ();
  369. if (err != CS_OK) {
  370. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  371. return 1;
  372. }
  373. qb_log (LOG_INFO, "iid %d: sam_data_getsize 6", instance_id);
  374. err = sam_data_getsize (&size);
  375. if (err != CS_OK) {
  376. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  377. return 1;
  378. }
  379. if (size != sizeof (saved_data2)) {
  380. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  381. return 1;
  382. }
  383. qb_log (LOG_INFO, "iid %d: sam_data_restore 5", instance_id);
  384. err = sam_data_restore (saved_data2, sizeof (saved_data2));
  385. if (err != CS_OK) {
  386. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  387. return 1;
  388. }
  389. if (memcmp (saved_data, saved_data2, sizeof (saved_data2)) != 0) {
  390. qb_log (LOG_ERR, "Retored data are not same");
  391. return 1;
  392. }
  393. for (i = 0; i < sizeof (saved_data); i++) {
  394. saved_data[i] = (char)(i - 5);
  395. }
  396. qb_log (LOG_INFO, "iid %d: sam_data_store 5", instance_id);
  397. err = sam_data_store (saved_data, sizeof (saved_data) - 7);
  398. if (err != CS_OK) {
  399. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  400. return 1;
  401. }
  402. exit (1);
  403. }
  404. if (instance_id == 2) {
  405. qb_log (LOG_INFO, "iid %d: sam_start", instance_id);
  406. err = sam_start ();
  407. if (err != CS_OK) {
  408. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  409. return 1;
  410. }
  411. qb_log (LOG_INFO, "iid %d: sam_data_getsize 7", instance_id);
  412. err = sam_data_getsize (&size);
  413. if (err != CS_OK) {
  414. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  415. return 1;
  416. }
  417. if (size != sizeof (saved_data2) - 7) {
  418. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  419. return 1;
  420. }
  421. qb_log (LOG_INFO, "iid %d: sam_data_restore 6", instance_id);
  422. err = sam_data_restore (saved_data2, sizeof (saved_data2));
  423. if (err != CS_OK) {
  424. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  425. return 1;
  426. }
  427. for (i = 0; i < sizeof (saved_data); i++) {
  428. saved_data[i] = (char)(i - 5);
  429. }
  430. if (memcmp (saved_data, saved_data2, sizeof (saved_data2) - 7) != 0) {
  431. qb_log (LOG_ERR, "Retored data are not same");
  432. return 1;
  433. }
  434. qb_log (LOG_INFO, "iid %d: sam_data_store 6", instance_id);
  435. err = sam_data_store (NULL, 0);
  436. if (err != CS_OK) {
  437. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  438. return 1;
  439. }
  440. exit (1);
  441. }
  442. if (instance_id == 3) {
  443. qb_log (LOG_INFO, "iid %d: sam_data_getsize 8", instance_id);
  444. err = sam_data_getsize (&size);
  445. if (err != CS_OK) {
  446. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  447. return 1;
  448. }
  449. if (size != 0) {
  450. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  451. return 1;
  452. }
  453. }
  454. return (0);
  455. }
  456. static int test5_hc_cb (void)
  457. {
  458. cs_error_t res;
  459. qb_log (LOG_INFO, "%d", ++test5_hc_cb_count);
  460. res = sam_data_store (&test5_hc_cb_count, sizeof (test5_hc_cb_count));
  461. if (res != CS_OK)
  462. return 1;
  463. if (test5_hc_cb_count > 10)
  464. return 1;
  465. return 0;
  466. }
  467. /*
  468. * Test event driven healtchecking.
  469. */
  470. static int test5 (void)
  471. {
  472. cs_error_t error;
  473. unsigned int instance_id;
  474. int hc_cb_count;
  475. qb_log (LOG_INFO, " initialize");
  476. error = sam_initialize (100, SAM_RECOVERY_POLICY_RESTART);
  477. if (error != CS_OK) {
  478. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  479. return 1;
  480. }
  481. qb_log (LOG_INFO, " register");
  482. error = sam_register (&instance_id);
  483. if (error != CS_OK) {
  484. qb_log (LOG_ERR, "Can't register. Error %d", error);
  485. return 1;
  486. }
  487. if (instance_id == 1) {
  488. qb_log (LOG_INFO, "iid %d: hc callback register", instance_id);
  489. error = sam_hc_callback_register (test5_hc_cb);
  490. if (error != CS_OK) {
  491. qb_log (LOG_ERR, "Can't register hc cb. Error %d", error);
  492. return 1;
  493. }
  494. qb_log (LOG_INFO, "iid %d: start", instance_id);
  495. error = sam_start ();
  496. if (error != CS_OK) {
  497. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  498. return 1;
  499. }
  500. sleep (2);
  501. qb_log (LOG_INFO, "iid %d: Failed. Wasn't killed.", instance_id);
  502. return 1;
  503. }
  504. if (instance_id == 2) {
  505. error = sam_data_restore (&hc_cb_count, sizeof (hc_cb_count));
  506. if (error != CS_OK) {
  507. qb_log (LOG_ERR, "sam_data_restore should return CS_OK. Error returned %d", error);
  508. return 1;
  509. }
  510. if (hc_cb_count != 11) {
  511. qb_log (LOG_ERR, "iid %d: Premature killed. hc_cb_count should be 11 and it is %d",
  512. __FUNCTION__, instance_id - 1, hc_cb_count);
  513. return 1;
  514. }
  515. return 0;
  516. }
  517. return 1;
  518. }
  519. static void test6_signal (int sig) {
  520. cs_error_t error;
  521. qb_enter();
  522. test6_sig_delivered++;
  523. if ((error = sam_data_store (&test6_sig_delivered, sizeof (test6_sig_delivered))) != CS_OK) {
  524. qb_log (LOG_ERR, "Can't store data! Error : %d", error);
  525. }
  526. }
  527. /*
  528. * Test warn signal set.
  529. */
  530. static int test6 (void) {
  531. cs_error_t error;
  532. unsigned int instance_id;
  533. int test6_sig_del;
  534. qb_log (LOG_INFO, " initialize");
  535. error = sam_initialize (2000, SAM_RECOVERY_POLICY_RESTART);
  536. if (error != CS_OK) {
  537. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  538. return 1;
  539. }
  540. qb_log (LOG_INFO, " register");
  541. error = sam_register (&instance_id);
  542. if (error != CS_OK) {
  543. qb_log (LOG_ERR, "Can't register. Error %d", error);
  544. return 1;
  545. }
  546. if (instance_id == 1) {
  547. error = sam_warn_signal_set (SIGUSR1);
  548. if (error != CS_OK) {
  549. qb_log (LOG_ERR, "Can't set warn signal. Error %d", error);
  550. return 1;
  551. }
  552. signal (SIGUSR1, test6_signal);
  553. qb_log (LOG_INFO, " iid %d: start", instance_id);
  554. error = sam_start ();
  555. if (error != CS_OK) {
  556. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  557. return 1;
  558. }
  559. qb_log (LOG_INFO, "iid %d: sleep 1", instance_id);
  560. sleep (1);
  561. qb_log (LOG_INFO, "iid %d: hc send", instance_id);
  562. error = sam_hc_send ();
  563. if (error != CS_OK) {
  564. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  565. return 1;
  566. }
  567. qb_log (LOG_INFO, "iid %d: wait for delivery of signal", instance_id);
  568. while (!test6_sig_delivered) {
  569. sleep (1);
  570. }
  571. qb_log (LOG_INFO, "iid %d: wait for real kill", instance_id);
  572. sleep (3);
  573. qb_log (LOG_INFO, "iid %d: wasn't killed", instance_id);
  574. return (1);
  575. }
  576. if (instance_id == 2) {
  577. error = sam_data_restore (&test6_sig_del, sizeof (test6_sig_del));
  578. if (error != CS_OK) {
  579. qb_log (LOG_ERR, "Can't restore data. Error %d", error);
  580. return 1;
  581. }
  582. if (test6_sig_del != 1) {
  583. qb_log (LOG_ERR, "Previous test failed. Signal was not delivered");
  584. return 1;
  585. }
  586. error = sam_warn_signal_set (SIGKILL);
  587. if (error != CS_OK) {
  588. qb_log (LOG_ERR, "Can't set warn signal. Error %d", error);
  589. return 1;
  590. }
  591. signal (SIGUSR1, test6_signal);
  592. qb_log (LOG_INFO, "iid %d: start", instance_id);
  593. error = sam_start ();
  594. if (error != CS_OK) {
  595. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  596. return 1;
  597. }
  598. qb_log (LOG_INFO, "iid %d: sleep 1", instance_id);
  599. sleep (1);
  600. qb_log (LOG_INFO, "iid %d: hc send", instance_id);
  601. error = sam_hc_send ();
  602. if (error != CS_OK) {
  603. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  604. return 1;
  605. }
  606. qb_log (LOG_INFO, "iid %d: wait for delivery of signal", instance_id);
  607. while (!test6_sig_delivered) {
  608. sleep (1);
  609. }
  610. qb_log (LOG_INFO, "iid %d: wasn't killed", instance_id);
  611. return (1);
  612. }
  613. if (instance_id == 3) {
  614. error = sam_data_restore (&test6_sig_del, sizeof (test6_sig_del));
  615. if (error != CS_OK) {
  616. qb_log (LOG_ERR, "Can't restore data. Error %d", error);
  617. return 1;
  618. }
  619. if (test6_sig_del != 1) {
  620. qb_log (LOG_ERR, "Previous test failed. Signal WAS delivered");
  621. return 1;
  622. }
  623. return (0);
  624. }
  625. return 1;
  626. }
  627. /*
  628. * Test cmap integration + quit policy
  629. */
  630. static int test8 (pid_t pid, pid_t old_pid, int test_n) {
  631. cmap_handle_t cmap_handle;
  632. cs_error_t err;
  633. uint64_t tstamp1, tstamp2;
  634. int32_t msec_diff;
  635. unsigned int instance_id;
  636. char key_name[CMAP_KEYNAME_MAXLEN];
  637. char *str;
  638. err = cmap_initialize (&cmap_handle);
  639. if (err != CS_OK) {
  640. qb_log (LOG_INFO, "Could not initialize Cluster Map API instance error %d. Test skipped", err);
  641. return (1);
  642. }
  643. qb_log (LOG_INFO, "test %d", test_n);
  644. if (test_n == 2) {
  645. /*
  646. * Object should not exist
  647. */
  648. qb_log (LOG_INFO, "Testing if object exists (it shouldn't)");
  649. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  650. err = cmap_get_string(cmap_handle, key_name, &str);
  651. if (err == CS_OK) {
  652. qb_log (LOG_INFO, "Could find key \"%s\": %d.", key_name, err);
  653. free(str);
  654. return (2);
  655. }
  656. }
  657. if (test_n == 1 || test_n == 2) {
  658. qb_log (LOG_INFO, " initialize");
  659. err = sam_initialize (2000, SAM_RECOVERY_POLICY_QUIT | SAM_RECOVERY_POLICY_CMAP);
  660. if (err != CS_OK) {
  661. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", err);
  662. return 2;
  663. }
  664. qb_log (LOG_INFO, " register");
  665. err = sam_register (&instance_id);
  666. if (err != CS_OK) {
  667. qb_log (LOG_ERR, "Can't register. Error %d", err);
  668. return 2;
  669. }
  670. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.recovery", pid);
  671. err = cmap_get_string(cmap_handle, key_name, &str);
  672. if (err != CS_OK) {
  673. qb_log (LOG_INFO, "Could not get \"recovery\" key: %d.", err);
  674. return (2);
  675. }
  676. if (strcmp(str, "quit") != 0) {
  677. qb_log (LOG_INFO, "Recovery key \"%s\" is not \"quit\".", key_name);
  678. free(str);
  679. return (2);
  680. }
  681. free(str);
  682. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  683. err = cmap_get_string(cmap_handle, key_name, &str);
  684. if (err != CS_OK) {
  685. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  686. return (2);
  687. }
  688. if (strcmp(str, "stopped") != 0) {
  689. qb_log (LOG_INFO, "State key is not \"stopped\".");
  690. free(str);
  691. return (2);
  692. }
  693. free(str);
  694. qb_log (LOG_INFO, "iid %d: start", instance_id);
  695. err = sam_start ();
  696. if (err != CS_OK) {
  697. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  698. return 2;
  699. }
  700. err = cmap_get_string(cmap_handle, key_name, &str);
  701. if (err != CS_OK) {
  702. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  703. return (2);
  704. }
  705. if (strcmp(str, "running") != 0) {
  706. qb_log (LOG_INFO, "State key is not \"running\".");
  707. free(str);
  708. return (2);
  709. }
  710. free(str);
  711. qb_log (LOG_INFO, "iid %d: stop", instance_id);
  712. err = sam_stop ();
  713. if (err != CS_OK) {
  714. qb_log (LOG_ERR, "Can't stop hc. Error %d", err);
  715. return 2;
  716. }
  717. err = cmap_get_string(cmap_handle, key_name, &str);
  718. if (err != CS_OK) {
  719. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  720. return (2);
  721. }
  722. if (strcmp(str, "stopped") != 0) {
  723. qb_log (LOG_INFO, "State key is not \"stopped\".");
  724. free(str);
  725. return (2);
  726. }
  727. free(str);
  728. qb_log (LOG_INFO, "iid %d: sleeping 5", instance_id);
  729. sleep (5);
  730. err = cmap_get_string(cmap_handle, key_name, &str);
  731. if (err != CS_OK) {
  732. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  733. return (2);
  734. }
  735. if (strcmp(str, "stopped") != 0) {
  736. qb_log (LOG_INFO, "State key is not \"stopped\".");
  737. free(str);
  738. return (2);
  739. }
  740. free(str);
  741. qb_log (LOG_INFO, "iid %d: start 2", instance_id);
  742. err = sam_start ();
  743. if (err != CS_OK) {
  744. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  745. return 2;
  746. }
  747. err = cmap_get_string(cmap_handle, key_name, &str);
  748. if (err != CS_OK) {
  749. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  750. return (2);
  751. }
  752. if (strcmp(str, "running") != 0) {
  753. qb_log (LOG_INFO, "State key is not \"running\".");
  754. free(str);
  755. return (2);
  756. }
  757. free(str);
  758. if (test_n == 2) {
  759. qb_log (LOG_INFO, "iid %d: sleeping 5. Should be killed", instance_id);
  760. sleep (5);
  761. return (2);
  762. } else {
  763. qb_log (LOG_INFO, "iid %d: Test HC", instance_id);
  764. err = sam_hc_send ();
  765. if (err != CS_OK) {
  766. qb_log (LOG_ERR, "Can't send hc. Error %d", err);
  767. return 2;
  768. }
  769. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.last_updated", pid);
  770. err = cmap_get_uint64(cmap_handle, key_name, &tstamp1);
  771. if (err != CS_OK) {
  772. qb_log (LOG_INFO, "Could not get \"last_updated\" key: %d.", err);
  773. return (2);
  774. }
  775. qb_log (LOG_INFO, "iid %d: Sleep 1", instance_id);
  776. sleep (1);
  777. err = sam_hc_send ();
  778. if (err != CS_OK) {
  779. qb_log (LOG_ERR, "Can't send hc. Error %d", err);
  780. return 2;
  781. }
  782. sleep (1);
  783. err = cmap_get_uint64(cmap_handle, key_name, &tstamp2);
  784. if (err != CS_OK) {
  785. qb_log (LOG_INFO, "Could not get \"last_updated\" key: %d.", err);
  786. return (2);
  787. }
  788. msec_diff = (tstamp2 - tstamp1)/CS_TIME_NS_IN_MSEC;
  789. if (msec_diff < 500 || msec_diff > 2000) {
  790. qb_log (LOG_INFO, "Difference %d is not within <500, 2000> interval.", msec_diff);
  791. return (2);
  792. }
  793. qb_log (LOG_INFO, "iid %d: stop 2", instance_id);
  794. err = sam_stop ();
  795. if (err != CS_OK) {
  796. qb_log (LOG_ERR, "Can't stop hc. Error %d", err);
  797. return 2;
  798. }
  799. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  800. err = cmap_get_string(cmap_handle, key_name, &str);
  801. if (err != CS_OK) {
  802. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  803. return (2);
  804. }
  805. if (strcmp(str, "stopped") != 0) {
  806. qb_log (LOG_INFO, "State key is not \"stopped\".");
  807. free(str);
  808. return (2);
  809. }
  810. free(str);
  811. qb_log (LOG_INFO, "iid %d: exiting", instance_id);
  812. return (0);
  813. }
  814. }
  815. if (test_n == 3) {
  816. qb_log (LOG_INFO, "Testing if status is failed");
  817. /*
  818. * Previous should be FAILED
  819. */
  820. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  821. err = cmap_get_string(cmap_handle, key_name, &str);
  822. if (err != CS_OK) {
  823. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  824. return (2);
  825. }
  826. if (strcmp(str, "failed") != 0) {
  827. qb_log (LOG_INFO, "State key is not \"failed\".");
  828. free(str);
  829. return (2);
  830. }
  831. free(str);
  832. return (0);
  833. }
  834. return (2);
  835. }
  836. /*
  837. * Test cmap integration + restart policy
  838. */
  839. static int test9 (pid_t pid, pid_t old_pid, int test_n) {
  840. cs_error_t err;
  841. cmap_handle_t cmap_handle;
  842. unsigned int instance_id;
  843. char *str;
  844. char key_name[CMAP_KEYNAME_MAXLEN];
  845. err = cmap_initialize (&cmap_handle);
  846. if (err != CS_OK) {
  847. qb_log (LOG_INFO, "Could not initialize Cluster Map API instance error %d. Test skipped", err);
  848. return (1);
  849. }
  850. qb_log (LOG_INFO, "test %d", test_n);
  851. if (test_n == 1) {
  852. qb_log (LOG_INFO, " initialize");
  853. err = sam_initialize (2000, SAM_RECOVERY_POLICY_RESTART | SAM_RECOVERY_POLICY_CMAP);
  854. if (err != CS_OK) {
  855. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", err);
  856. return 2;
  857. }
  858. qb_log (LOG_INFO, " register");
  859. err = sam_register (&instance_id);
  860. if (err != CS_OK) {
  861. qb_log (LOG_ERR, "Can't register. Error %d", err);
  862. return 2;
  863. }
  864. qb_log (LOG_INFO, " iid %d", instance_id);
  865. if (instance_id < 3) {
  866. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.recovery", pid);
  867. err = cmap_get_string(cmap_handle, key_name, &str);
  868. if (err != CS_OK) {
  869. qb_log (LOG_INFO, "Could not get \"recovery\" key: %d.", err);
  870. return (2);
  871. }
  872. if (strcmp(str, "restart") != 0) {
  873. qb_log (LOG_INFO, "Recovery key \"%s\" is not \"restart\".", str);
  874. free(str);
  875. return (2);
  876. }
  877. free(str);
  878. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  879. err = cmap_get_string(cmap_handle, key_name, &str);
  880. if (err != CS_OK) {
  881. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  882. return (2);
  883. }
  884. if (strcmp(str, "stopped") != 0) {
  885. qb_log (LOG_INFO, "State key is not \"stopped\".");
  886. free(str);
  887. return (2);
  888. }
  889. free(str);
  890. qb_log (LOG_INFO, "iid %d: start", instance_id);
  891. err = sam_start ();
  892. if (err != CS_OK) {
  893. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  894. return 2;
  895. }
  896. err = cmap_get_string(cmap_handle, key_name, &str);
  897. if (err != CS_OK) {
  898. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  899. return (2);
  900. }
  901. if (strcmp(str, "running") != 0) {
  902. qb_log (LOG_INFO, "State key is not \"running\".");
  903. free(str);
  904. return (2);
  905. }
  906. free(str);
  907. qb_log (LOG_INFO, "iid %d: waiting for kill", instance_id);
  908. sleep (10);
  909. return (2);
  910. }
  911. if (instance_id == 3) {
  912. qb_log (LOG_INFO, "iid %d: mark failed", instance_id);
  913. err = sam_mark_failed ();
  914. if (err != CS_OK) {
  915. qb_log (LOG_ERR, "Can't mark failed. Error %d", err);
  916. return 2;
  917. }
  918. sleep (10);
  919. return (2);
  920. }
  921. return (2);
  922. }
  923. if (test_n == 2) {
  924. qb_log (LOG_INFO, "Testing if status is failed");
  925. /*
  926. * Previous should be FAILED
  927. */
  928. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  929. err = cmap_get_string(cmap_handle, key_name, &str);
  930. if (err != CS_OK) {
  931. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  932. return (2);
  933. }
  934. if (strcmp(str, "failed") != 0) {
  935. qb_log (LOG_INFO, "State key is not \"failed\".");
  936. free(str);
  937. return (2);
  938. }
  939. free(str);
  940. return (0);
  941. }
  942. return (2);
  943. }
  944. static int hc_allways_respond_cb(void)
  945. {
  946. qb_log (LOG_INFO, "health check OK.");
  947. return 0;
  948. }
  949. static int setup_hc (void)
  950. {
  951. cs_error_t err;
  952. unsigned int instance_id;
  953. err = sam_initialize (1000, SAM_RECOVERY_POLICY_QUIT | SAM_RECOVERY_POLICY_CMAP);
  954. if (err != CS_OK) {
  955. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", err);
  956. return 2;
  957. }
  958. qb_log (LOG_INFO, " register");
  959. err = sam_register (&instance_id);
  960. if (err != CS_OK) {
  961. qb_log (LOG_ERR, "Can't register. Error %d", err);
  962. return 2;
  963. }
  964. err = sam_hc_callback_register (hc_allways_respond_cb);
  965. qb_log (LOG_INFO, "instance id %d: start", instance_id);
  966. err = sam_start ();
  967. if (err != CS_OK) {
  968. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  969. return 2;
  970. }
  971. return (0);
  972. }
  973. static int do_test_command(int sock, char* func, char*args[], int num_args)
  974. {
  975. int err = 0;
  976. pid_t pid;
  977. int stat;
  978. pid = fork ();
  979. if (pid == -1) {
  980. qb_log (LOG_ERR, "Can't fork");
  981. return -1;
  982. }
  983. if (pid == 0) {
  984. if (strcmp ("test1", func) == 0) {
  985. err = test1 ();
  986. } else if (strcmp ("test2", func) == 0) {
  987. err = test2 ();
  988. } else if (strcmp ("test3", func) == 0) {
  989. err = test3 ();
  990. } else if (strcmp ("test4", func) == 0) {
  991. err = test4 ();
  992. } else if (strcmp ("test5", func) == 0) {
  993. err = test5 ();
  994. } else if (strcmp ("test6", func) == 0) {
  995. err = test6 ();
  996. } else if (strcmp ("test8", func) == 0) {
  997. err = test8 (getpid(), 0, 1);
  998. } else if (strcmp ("test9", func) == 0) {
  999. err = test9 (getpid(), 0, 1);
  1000. }
  1001. sam_finalize ();
  1002. exit(err);
  1003. }
  1004. if (pid > 0) {
  1005. waitpid (pid, &stat, 0);
  1006. return WEXITSTATUS (stat);
  1007. }
  1008. return -1;
  1009. }
  1010. static void do_command (int sock, char* func, char*args[], int num_args)
  1011. {
  1012. char response[100];
  1013. int err = 0;
  1014. ssize_t rc;
  1015. size_t send_len;
  1016. qb_log (LOG_INFO, "RPC:%s() called.", func);
  1017. if (strncmp ("test", func, 4) == 0) {
  1018. err = do_test_command(sock, func, args, num_args);
  1019. } else if (strcmp ("setup_hc", func) == 0) {
  1020. err = setup_hc ();
  1021. } else if (strcmp ("sam_stop", func) == 0) {
  1022. err = sam_stop ();
  1023. if (err != CS_OK) {
  1024. err = -1;
  1025. qb_log (LOG_ERR,"RPC:%s sam_stop failed!", func);
  1026. snprintf (response, 100, "%s", FAIL_STR);
  1027. }
  1028. err = sam_finalize();
  1029. } else {
  1030. err = -1;
  1031. qb_log (LOG_ERR,"RPC:%s not supported!", func);
  1032. snprintf (response, 100, "%s", NOT_SUPPORTED_STR);
  1033. }
  1034. if (err == 0) {
  1035. snprintf (response, 100, "%s", OK_STR);
  1036. } else if (err == 1) {
  1037. snprintf (response, 100, "%s", FAIL_STR);
  1038. qb_log (LOG_ERR, "%s() test skipped?! (%d).", func, err);
  1039. } else {
  1040. snprintf (response, 100, "%s", FAIL_STR);
  1041. qb_log (LOG_ERR, "%s() failed (%d).", func, err);
  1042. }
  1043. send_len = strlen (response);
  1044. rc = send (sock, response, send_len, 0);
  1045. assert(rc == send_len);
  1046. }
  1047. int
  1048. main (int argc, char *argv[])
  1049. {
  1050. return test_agent_run ("sam_test_agent", 9036, do_command, NULL);
  1051. }