sam_test_agent.c 30 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251
  1. /*
  2. * Copyright (c) 2009-2011 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Jan Friesse (jfriesse@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of the Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. /*
  35. * Provides test of SAM API
  36. */
  37. #include <config.h>
  38. #include <stdio.h>
  39. #include <stdint.h>
  40. #include <stdlib.h>
  41. #include <unistd.h>
  42. #include <pthread.h>
  43. #include <limits.h>
  44. #include <sys/types.h>
  45. #include <sys/socket.h>
  46. #include <netinet/in.h>
  47. #include <arpa/inet.h>
  48. #include <netdb.h>
  49. #include <sys/un.h>
  50. #include <corosync/corotypes.h>
  51. #include <corosync/sam.h>
  52. #include <signal.h>
  53. #include <string.h>
  54. #include <sys/wait.h>
  55. #include <corosync/cmap.h>
  56. #include "common_test_agent.h"
  extern const char *__progname;

  /*
   * Set by the SIGTERM handler (test2_signal) and polled by test2, so it must
   * be volatile sig_atomic_t to be shared safely with a signal handler.
   */
  static volatile sig_atomic_t test2_sig_delivered = 0;

  /*
   * Number of invocations of the health-check callback test5_hc_cb.
   */
  static int test5_hc_cb_count = 0;

  /*
   * Number of warn signals seen by test6_signal. Kept as a plain int because
   * its address and size are passed to sam_data_store and the stored value is
   * restored into an int by test6.
   */
  static int test6_sig_delivered = 0;
  61. /*
  62. * First test will just register SAM, with policy restart. First instance will
  63. * sleep one second, send hc and sleep another 3 seconds. This should force restart.
  64. * Second instance will sleep one second, send hc, stop hc and sleep 3 seconds.
  65. * Then start hc again and sleep 3 seconds. This should force restart again.
  66. * Last instance just calls initialize again. This should end with error.
  67. * Then call start, followed by stop and start again. Finally, we will call finalize
  68. * twice. One should succeed, second should fail. After this, we will call every function
  69. * (none should succeed).
  70. */
  71. static int test1 (void)
  72. {
  73. cs_error_t error;
  74. unsigned int instance_id;
  75. int i;
  76. qb_enter();
  77. error = sam_initialize (2000, SAM_RECOVERY_POLICY_RESTART);
  78. if (error != CS_OK) {
  79. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  80. return 1;
  81. }
  82. qb_log (LOG_INFO, "register");
  83. error = sam_register (&instance_id);
  84. if (error != CS_OK) {
  85. qb_log (LOG_ERR, "Can't register. Error %d", error);
  86. return 1;
  87. }
  88. if (instance_id == 1 || instance_id == 2) {
  89. qb_log (LOG_INFO, "iid %d: start", instance_id);
  90. error = sam_start ();
  91. if (error != CS_OK) {
  92. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  93. return 1;
  94. }
  95. for (i = 0; i < 10; i++) {
  96. qb_log (LOG_INFO, "iid %d: sleep 1", instance_id);
  97. sleep (1);
  98. qb_log (LOG_INFO, "iid %d: hc send", instance_id);
  99. error = sam_hc_send ();
  100. if (error != CS_OK) {
  101. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  102. return 1;
  103. }
  104. }
  105. if (instance_id == 2) {
  106. qb_log (LOG_INFO, "iid %d: stop", instance_id);
  107. error = sam_stop ();
  108. if (error != CS_OK) {
  109. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  110. return 1;
  111. }
  112. }
  113. qb_log (LOG_INFO, "iid %d: sleep 3", instance_id);
  114. sleep (3);
  115. qb_log (LOG_INFO, "iid %d: start", instance_id);
  116. error = sam_start ();
  117. if (error != CS_OK) {
  118. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  119. return 1;
  120. }
  121. qb_log (LOG_INFO, "iid %d: sleep 3", instance_id);
  122. sleep (3);
  123. return 0;
  124. }
  125. if (instance_id == 3) {
  126. error = sam_initialize (2000, SAM_RECOVERY_POLICY_RESTART);
  127. if (error == CS_OK) {
  128. qb_log (LOG_ERR, "Can initialize SAM API after initialization");
  129. return 1;
  130. }
  131. error = sam_start ();
  132. if (error != CS_OK) {
  133. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  134. return 1;
  135. }
  136. error = sam_stop ();
  137. if (error != CS_OK) {
  138. qb_log (LOG_ERR, "Can't stop hc. Error %d", error);
  139. return 1;
  140. }
  141. error = sam_finalize ();
  142. if (error != CS_OK) {
  143. qb_log (LOG_ERR, "Can't finalize sam. Error %d", error);
  144. return 1;
  145. }
  146. error = sam_finalize ();
  147. if (error == CS_OK) {
  148. qb_log (LOG_ERR, "Can finalize sam after finalization!");
  149. return 1;
  150. }
  151. if (sam_initialize (2, SAM_RECOVERY_POLICY_RESTART) == CS_OK ||
  152. sam_start () == CS_OK || sam_stop () == CS_OK ||
  153. sam_register (NULL) == CS_OK || sam_hc_send () == CS_OK ||
  154. sam_hc_callback_register (NULL) == CS_OK) {
  155. qb_log (LOG_ERR, "Can call one of function after finalization!");
  156. return 1;
  157. }
  158. return 0;
  159. }
  160. return 1;
  161. }
  162. static void test2_signal (int sig)
  163. {
  164. qb_enter();
  165. test2_sig_delivered = 1;
  166. }
  167. /*
  168. * This tests recovery policy quit and callback.
  169. */
  170. static int test2 (void) {
  171. cs_error_t error;
  172. unsigned int instance_id;
  173. qb_enter();
  174. error = sam_initialize (2000, SAM_RECOVERY_POLICY_QUIT);
  175. if (error != CS_OK) {
  176. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  177. return 1;
  178. }
  179. qb_log (LOG_INFO, "register");
  180. error = sam_register (&instance_id);
  181. if (error != CS_OK) {
  182. qb_log (LOG_ERR, "Can't register. Error %d", error);
  183. return 1;
  184. }
  185. if (instance_id == 1) {
  186. signal (SIGTERM, test2_signal);
  187. qb_log (LOG_INFO, "iid %d: start", instance_id);
  188. error = sam_start ();
  189. if (error != CS_OK) {
  190. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  191. return 1;
  192. }
  193. qb_log (LOG_INFO, "iid %d: sleep 1", instance_id);
  194. sleep (1);
  195. qb_log (LOG_INFO, "iid %d: hc send", instance_id);
  196. error = sam_hc_send ();
  197. if (error != CS_OK) {
  198. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  199. return 1;
  200. }
  201. qb_log (LOG_INFO, "iid %d: wait for delivery of signal", instance_id);
  202. while (!test2_sig_delivered) {
  203. sleep (1);
  204. }
  205. qb_log (LOG_INFO, "iid %d: wait for real kill", instance_id);
  206. sleep (3);
  207. }
  208. return 1;
  209. }
  210. /*
  211. * Smoke test. Better to turn off coredump ;) This has no time limit, just restart process
  212. * when it dies.
  213. */
  214. static int test3 (void) {
  215. cs_error_t error;
  216. unsigned int instance_id;
  217. qb_log (LOG_INFO, "initialize");
  218. error = sam_initialize (0, SAM_RECOVERY_POLICY_RESTART);
  219. if (error != CS_OK) {
  220. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  221. return 1;
  222. }
  223. qb_log (LOG_INFO, "register");
  224. error = sam_register (&instance_id);
  225. if (error != CS_OK) {
  226. qb_log (LOG_ERR, "Can't register. Error %d", error);
  227. return 1;
  228. }
  229. if (instance_id < 100) {
  230. qb_log (LOG_INFO, "iid %d: start", instance_id);
  231. error = sam_start ();
  232. if (error != CS_OK) {
  233. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  234. return 1;
  235. }
  236. qb_log (LOG_INFO, "iid %d: Sending signal", instance_id);
  237. kill(getpid(), SIGSEGV);
  238. return 1;
  239. }
  240. return 0;
  241. }
  242. /*
  243. * Test sam_data_store, sam_data_restore and sam_data_getsize
  244. */
  245. static int test4 (void)
  246. {
  247. size_t size;
  248. cs_error_t err;
  249. int i;
  250. unsigned int instance_id;
  251. char saved_data[128];
  252. char saved_data2[128];
  253. qb_log (LOG_INFO, "sam_data_getsize 1");
  254. err = sam_data_getsize (&size);
  255. if (err != CS_ERR_BAD_HANDLE) {
  256. qb_log (LOG_ERR, "Test should return CS_ERR_BAD_HANDLE. Error returned %d", err);
  257. return 1;
  258. }
  259. qb_log (LOG_INFO, "sam_data_getsize 2");
  260. err = sam_data_getsize (NULL);
  261. if (err != CS_ERR_INVALID_PARAM) {
  262. qb_log (LOG_ERR, "Test should return CS_ERR_INVALID_PARAM. Error returned %d", err);
  263. return 1;
  264. }
  265. qb_log (LOG_INFO, "sam_data_store 1");
  266. err = sam_data_store (NULL, 0);
  267. if (err != CS_ERR_BAD_HANDLE) {
  268. qb_log (LOG_ERR, "Test should return CS_ERR_BAD_HANDLE. Error returned %d", err);
  269. return 1;
  270. }
  271. qb_log (LOG_INFO, "sam_data_restore 1");
  272. err = sam_data_restore (saved_data, sizeof (saved_data));
  273. if (err != CS_ERR_BAD_HANDLE) {
  274. qb_log (LOG_ERR, "Test should return CS_ERR_BAD_HANDLE. Error returned %d", err);
  275. return 1;
  276. }
  277. qb_log (LOG_INFO, "sam_initialize");
  278. err = sam_initialize (0, SAM_RECOVERY_POLICY_RESTART);
  279. if (err != CS_OK) {
  280. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", err);
  281. return 1;
  282. }
  283. qb_log (LOG_INFO, "sam_data_getsize 3");
  284. err = sam_data_getsize (&size);
  285. if (err != CS_OK) {
  286. qb_log (LOG_ERR, "Test should return CS_ERR_BAD_HANDLE. Error returned %d", err);
  287. return 1;
  288. }
  289. if (size != 0) {
  290. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  291. return 1;
  292. }
  293. qb_log (LOG_INFO, "sam_data_restore 2");
  294. err = sam_data_restore (NULL, sizeof (saved_data));
  295. if (err != CS_ERR_INVALID_PARAM) {
  296. qb_log (LOG_ERR, "Test should return CS_ERR_INVALID_PARAM. Error returned %d", err);
  297. return 1;
  298. }
  299. /*
  300. * Store some real data
  301. */
  302. for (i = 0; i < sizeof (saved_data); i++) {
  303. saved_data[i] = (char)(i + 5);
  304. }
  305. qb_log (LOG_INFO, "sam_data_store 2");
  306. err = sam_data_store (saved_data, sizeof (saved_data));
  307. if (err != CS_OK) {
  308. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  309. return 1;
  310. }
  311. qb_log (LOG_INFO, " sam_data_getsize 4");
  312. err = sam_data_getsize (&size);
  313. if (err != CS_OK) {
  314. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  315. return 1;
  316. }
  317. if (size != sizeof (saved_data)) {
  318. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  319. return 1;
  320. }
  321. qb_log (LOG_INFO, " sam_data_restore 3");
  322. err = sam_data_restore (saved_data2, sizeof (saved_data2) - 1);
  323. if (err != CS_ERR_INVALID_PARAM) {
  324. qb_log (LOG_ERR, "Test should return CS_ERR_INVALID_PARAM. Error returned %d", err);
  325. return 1;
  326. }
  327. qb_log (LOG_INFO, " sam_data_restore 4");
  328. err = sam_data_restore (saved_data2, sizeof (saved_data2));
  329. if (err != CS_OK) {
  330. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  331. return 1;
  332. }
  333. if (memcmp (saved_data, saved_data2, sizeof (saved_data2)) != 0) {
  334. qb_log (LOG_ERR, "Retored data are not same");
  335. return 1;
  336. }
  337. memset (saved_data2, 0, sizeof (saved_data2));
  338. qb_log (LOG_INFO, " sam_data_store 3");
  339. err = sam_data_store (NULL, 1);
  340. if (err != CS_OK) {
  341. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  342. return 1;
  343. }
  344. qb_log (LOG_INFO, " sam_data_getsize 5");
  345. err = sam_data_getsize (&size);
  346. if (err != CS_OK) {
  347. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  348. return 1;
  349. }
  350. if (size != 0) {
  351. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  352. return 1;
  353. }
  354. qb_log (LOG_INFO, " sam_data_store 4");
  355. err = sam_data_store (saved_data, sizeof (saved_data));
  356. if (err != CS_OK) {
  357. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  358. return 1;
  359. }
  360. qb_log (LOG_INFO, " register");
  361. err = sam_register (&instance_id);
  362. if (err != CS_OK) {
  363. qb_log (LOG_ERR, "Can't register. Error %d", err);
  364. return 1;
  365. }
  366. if (instance_id == 1) {
  367. qb_log (LOG_INFO, "iid %d: sam_start", instance_id);
  368. err = sam_start ();
  369. if (err != CS_OK) {
  370. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  371. return 1;
  372. }
  373. qb_log (LOG_INFO, "iid %d: sam_data_getsize 6", instance_id);
  374. err = sam_data_getsize (&size);
  375. if (err != CS_OK) {
  376. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  377. return 1;
  378. }
  379. if (size != sizeof (saved_data2)) {
  380. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  381. return 1;
  382. }
  383. qb_log (LOG_INFO, "iid %d: sam_data_restore 5", instance_id);
  384. err = sam_data_restore (saved_data2, sizeof (saved_data2));
  385. if (err != CS_OK) {
  386. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  387. return 1;
  388. }
  389. if (memcmp (saved_data, saved_data2, sizeof (saved_data2)) != 0) {
  390. qb_log (LOG_ERR, "Retored data are not same");
  391. return 1;
  392. }
  393. for (i = 0; i < sizeof (saved_data); i++) {
  394. saved_data[i] = (char)(i - 5);
  395. }
  396. qb_log (LOG_INFO, "iid %d: sam_data_store 5", instance_id);
  397. err = sam_data_store (saved_data, sizeof (saved_data) - 7);
  398. if (err != CS_OK) {
  399. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  400. return 1;
  401. }
  402. exit (1);
  403. }
  404. if (instance_id == 2) {
  405. qb_log (LOG_INFO, "iid %d: sam_start", instance_id);
  406. err = sam_start ();
  407. if (err != CS_OK) {
  408. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  409. return 1;
  410. }
  411. qb_log (LOG_INFO, "iid %d: sam_data_getsize 7", instance_id);
  412. err = sam_data_getsize (&size);
  413. if (err != CS_OK) {
  414. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  415. return 1;
  416. }
  417. if (size != sizeof (saved_data2) - 7) {
  418. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  419. return 1;
  420. }
  421. qb_log (LOG_INFO, "iid %d: sam_data_restore 6", instance_id);
  422. err = sam_data_restore (saved_data2, sizeof (saved_data2));
  423. if (err != CS_OK) {
  424. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  425. return 1;
  426. }
  427. for (i = 0; i < sizeof (saved_data); i++) {
  428. saved_data[i] = (char)(i - 5);
  429. }
  430. if (memcmp (saved_data, saved_data2, sizeof (saved_data2) - 7) != 0) {
  431. qb_log (LOG_ERR, "Retored data are not same");
  432. return 1;
  433. }
  434. qb_log (LOG_INFO, "iid %d: sam_data_store 6", instance_id);
  435. err = sam_data_store (NULL, 0);
  436. if (err != CS_OK) {
  437. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  438. return 1;
  439. }
  440. exit (1);
  441. }
  442. if (instance_id == 3) {
  443. qb_log (LOG_INFO, "iid %d: sam_data_getsize 8", instance_id);
  444. err = sam_data_getsize (&size);
  445. if (err != CS_OK) {
  446. qb_log (LOG_ERR, "Test should return CS_OK. Error returned %d", err);
  447. return 1;
  448. }
  449. if (size != 0) {
  450. qb_log (LOG_ERR, "Test should return size of 0. Returned %zx", size);
  451. return 1;
  452. }
  453. }
  454. return (0);
  455. }
  456. static int test5_hc_cb (void)
  457. {
  458. cs_error_t res;
  459. qb_log (LOG_INFO, "%d", ++test5_hc_cb_count);
  460. res = sam_data_store (&test5_hc_cb_count, sizeof (test5_hc_cb_count));
  461. if (res != CS_OK)
  462. return 1;
  463. if (test5_hc_cb_count > 10)
  464. return 1;
  465. return 0;
  466. }
  467. /*
  468. * Test event driven healtchecking.
  469. */
  470. static int test5 (void)
  471. {
  472. cs_error_t error;
  473. unsigned int instance_id;
  474. int hc_cb_count;
  475. qb_log (LOG_INFO, " initialize");
  476. error = sam_initialize (100, SAM_RECOVERY_POLICY_RESTART);
  477. if (error != CS_OK) {
  478. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  479. return 1;
  480. }
  481. qb_log (LOG_INFO, " register");
  482. error = sam_register (&instance_id);
  483. if (error != CS_OK) {
  484. qb_log (LOG_ERR, "Can't register. Error %d", error);
  485. return 1;
  486. }
  487. if (instance_id == 1) {
  488. qb_log (LOG_INFO, "iid %d: hc callback register", instance_id);
  489. error = sam_hc_callback_register (test5_hc_cb);
  490. if (error != CS_OK) {
  491. qb_log (LOG_ERR, "Can't register hc cb. Error %d", error);
  492. return 1;
  493. }
  494. qb_log (LOG_INFO, "iid %d: start", instance_id);
  495. error = sam_start ();
  496. if (error != CS_OK) {
  497. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  498. return 1;
  499. }
  500. sleep (2);
  501. qb_log (LOG_INFO, "iid %d: Failed. Wasn't killed.", instance_id);
  502. return 1;
  503. }
  504. if (instance_id == 2) {
  505. error = sam_data_restore (&hc_cb_count, sizeof (hc_cb_count));
  506. if (error != CS_OK) {
  507. qb_log (LOG_ERR, "sam_data_restore should return CS_OK. Error returned %d", error);
  508. return 1;
  509. }
  510. if (hc_cb_count != 11) {
  511. qb_log (LOG_ERR, "iid %d: Premature killed. hc_cb_count should be 11 and it is %d",
  512. __FUNCTION__, instance_id - 1, hc_cb_count);
  513. return 1;
  514. }
  515. return 0;
  516. }
  517. return 1;
  518. }
  519. static void test6_signal (int sig) {
  520. cs_error_t error;
  521. qb_enter();
  522. test6_sig_delivered++;
  523. if ((error = sam_data_store (&test6_sig_delivered, sizeof (test6_sig_delivered))) != CS_OK) {
  524. qb_log (LOG_ERR, "Can't store data! Error : %d", error);
  525. }
  526. }
  527. /*
  528. * Test warn signal set.
  529. */
  530. static int test6 (void) {
  531. cs_error_t error;
  532. unsigned int instance_id;
  533. int test6_sig_del;
  534. qb_log (LOG_INFO, " initialize");
  535. error = sam_initialize (2000, SAM_RECOVERY_POLICY_RESTART);
  536. if (error != CS_OK) {
  537. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", error);
  538. return 1;
  539. }
  540. qb_log (LOG_INFO, " register");
  541. error = sam_register (&instance_id);
  542. if (error != CS_OK) {
  543. qb_log (LOG_ERR, "Can't register. Error %d", error);
  544. return 1;
  545. }
  546. if (instance_id == 1) {
  547. error = sam_warn_signal_set (SIGUSR1);
  548. if (error != CS_OK) {
  549. qb_log (LOG_ERR, "Can't set warn signal. Error %d", error);
  550. return 1;
  551. }
  552. signal (SIGUSR1, test6_signal);
  553. qb_log (LOG_INFO, " iid %d: start", instance_id);
  554. error = sam_start ();
  555. if (error != CS_OK) {
  556. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  557. return 1;
  558. }
  559. qb_log (LOG_INFO, "iid %d: sleep 1", instance_id);
  560. sleep (1);
  561. qb_log (LOG_INFO, "iid %d: hc send", instance_id);
  562. error = sam_hc_send ();
  563. if (error != CS_OK) {
  564. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  565. return 1;
  566. }
  567. qb_log (LOG_INFO, "iid %d: wait for delivery of signal", instance_id);
  568. while (!test6_sig_delivered) {
  569. sleep (1);
  570. }
  571. qb_log (LOG_INFO, "iid %d: wait for real kill", instance_id);
  572. sleep (3);
  573. qb_log (LOG_INFO, "iid %d: wasn't killed", instance_id);
  574. return (1);
  575. }
  576. if (instance_id == 2) {
  577. error = sam_data_restore (&test6_sig_del, sizeof (test6_sig_del));
  578. if (error != CS_OK) {
  579. qb_log (LOG_ERR, "Can't restore data. Error %d", error);
  580. return 1;
  581. }
  582. if (test6_sig_del != 1) {
  583. qb_log (LOG_ERR, "Previous test failed. Signal was not delivered");
  584. return 1;
  585. }
  586. error = sam_warn_signal_set (SIGKILL);
  587. if (error != CS_OK) {
  588. qb_log (LOG_ERR, "Can't set warn signal. Error %d", error);
  589. return 1;
  590. }
  591. signal (SIGUSR1, test6_signal);
  592. qb_log (LOG_INFO, "iid %d: start", instance_id);
  593. error = sam_start ();
  594. if (error != CS_OK) {
  595. qb_log (LOG_ERR, "Can't start hc. Error %d", error);
  596. return 1;
  597. }
  598. qb_log (LOG_INFO, "iid %d: sleep 1", instance_id);
  599. sleep (1);
  600. qb_log (LOG_INFO, "iid %d: hc send", instance_id);
  601. error = sam_hc_send ();
  602. if (error != CS_OK) {
  603. qb_log (LOG_ERR, "Can't send hc. Error %d", error);
  604. return 1;
  605. }
  606. qb_log (LOG_INFO, "iid %d: wait for delivery of signal", instance_id);
  607. while (!test6_sig_delivered) {
  608. sleep (1);
  609. }
  610. qb_log (LOG_INFO, "iid %d: wasn't killed", instance_id);
  611. return (1);
  612. }
  613. if (instance_id == 3) {
  614. error = sam_data_restore (&test6_sig_del, sizeof (test6_sig_del));
  615. if (error != CS_OK) {
  616. qb_log (LOG_ERR, "Can't restore data. Error %d", error);
  617. return 1;
  618. }
  619. if (test6_sig_del != 1) {
  620. qb_log (LOG_ERR, "Previous test failed. Signal WAS delivered");
  621. return 1;
  622. }
  623. return (0);
  624. }
  625. return 1;
  626. }
  627. /*
  628. * Test cmap integration + quit policy
  629. */
  630. static int test8 (pid_t pid, pid_t old_pid, int test_n) {
  631. cmap_handle_t cmap_handle;
  632. cs_error_t err;
  633. uint64_t tstamp1, tstamp2;
  634. int32_t msec_diff;
  635. unsigned int instance_id;
  636. char key_name[CMAP_KEYNAME_MAXLEN];
  637. char *str;
  638. err = cmap_initialize (&cmap_handle);
  639. if (err != CS_OK) {
  640. qb_log (LOG_INFO, "Could not initialize Cluster Map API instance error %d. Test skipped", err);
  641. return (1);
  642. }
  643. qb_log (LOG_INFO, "test %d", test_n);
  644. if (test_n == 2) {
  645. /*
  646. * Object should not exist
  647. */
  648. qb_log (LOG_INFO, "Testing if object exists (it shouldn't)");
  649. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  650. err = cmap_get_string(cmap_handle, key_name, &str);
  651. if (err == CS_OK) {
  652. qb_log (LOG_INFO, "Could find key \"%s\": %d.", key_name, err);
  653. free(str);
  654. return (2);
  655. }
  656. }
  657. if (test_n == 1 || test_n == 2) {
  658. qb_log (LOG_INFO, " initialize");
  659. err = sam_initialize (2000, SAM_RECOVERY_POLICY_QUIT | SAM_RECOVERY_POLICY_CMAP);
  660. if (err != CS_OK) {
  661. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", err);
  662. return 2;
  663. }
  664. qb_log (LOG_INFO, " register");
  665. err = sam_register (&instance_id);
  666. if (err != CS_OK) {
  667. qb_log (LOG_ERR, "Can't register. Error %d", err);
  668. return 2;
  669. }
  670. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.recovery", pid);
  671. err = cmap_get_string(cmap_handle, key_name, &str);
  672. if (err != CS_OK) {
  673. qb_log (LOG_INFO, "Could not get \"recovery\" key: %d.", err);
  674. return (2);
  675. }
  676. if (strcmp(str, "quit") != 0) {
  677. qb_log (LOG_INFO, "Recovery key \"%s\" is not \"quit\".", key_name);
  678. free(str);
  679. return (2);
  680. }
  681. free(str);
  682. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  683. err = cmap_get_string(cmap_handle, key_name, &str);
  684. if (err != CS_OK) {
  685. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  686. return (2);
  687. }
  688. if (strcmp(str, "stopped") != 0) {
  689. qb_log (LOG_INFO, "State key is not \"stopped\".");
  690. free(str);
  691. return (2);
  692. }
  693. free(str);
  694. qb_log (LOG_INFO, "iid %d: start", instance_id);
  695. err = sam_start ();
  696. if (err != CS_OK) {
  697. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  698. return 2;
  699. }
  700. err = cmap_get_string(cmap_handle, key_name, &str);
  701. if (err != CS_OK) {
  702. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  703. return (2);
  704. }
  705. if (strcmp(str, "running") != 0) {
  706. qb_log (LOG_INFO, "State key is not \"running\".");
  707. free(str);
  708. return (2);
  709. }
  710. free(str);
  711. qb_log (LOG_INFO, "iid %d: stop", instance_id);
  712. err = sam_stop ();
  713. if (err != CS_OK) {
  714. qb_log (LOG_ERR, "Can't stop hc. Error %d", err);
  715. return 2;
  716. }
  717. err = cmap_get_string(cmap_handle, key_name, &str);
  718. if (err != CS_OK) {
  719. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  720. return (2);
  721. }
  722. if (strcmp(str, "stopped") != 0) {
  723. qb_log (LOG_INFO, "State key is not \"stopped\".");
  724. free(str);
  725. return (2);
  726. }
  727. free(str);
  728. qb_log (LOG_INFO, "iid %d: sleeping 5", instance_id);
  729. sleep (5);
  730. err = cmap_get_string(cmap_handle, key_name, &str);
  731. if (err != CS_OK) {
  732. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  733. return (2);
  734. }
  735. if (strcmp(str, "stopped") != 0) {
  736. qb_log (LOG_INFO, "State key is not \"stopped\".");
  737. free(str);
  738. return (2);
  739. }
  740. free(str);
  741. qb_log (LOG_INFO, "iid %d: start 2", instance_id);
  742. err = sam_start ();
  743. if (err != CS_OK) {
  744. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  745. return 2;
  746. }
  747. err = cmap_get_string(cmap_handle, key_name, &str);
  748. if (err != CS_OK) {
  749. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  750. return (2);
  751. }
  752. if (strcmp(str, "running") != 0) {
  753. qb_log (LOG_INFO, "State key is not \"running\".");
  754. free(str);
  755. return (2);
  756. }
  757. free(str);
  758. if (test_n == 2) {
  759. qb_log (LOG_INFO, "iid %d: sleeping 5. Should be killed", instance_id);
  760. sleep (5);
  761. return (2);
  762. } else {
  763. qb_log (LOG_INFO, "iid %d: Test HC", instance_id);
  764. err = sam_hc_send ();
  765. if (err != CS_OK) {
  766. qb_log (LOG_ERR, "Can't send hc. Error %d", err);
  767. return 2;
  768. }
  769. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.last_updated", pid);
  770. err = cmap_get_uint64(cmap_handle, key_name, &tstamp1);
  771. if (err != CS_OK) {
  772. qb_log (LOG_INFO, "Could not get \"last_updated\" key: %d.", err);
  773. return (2);
  774. }
  775. qb_log (LOG_INFO, "iid %d: Sleep 1", instance_id);
  776. sleep (1);
  777. err = sam_hc_send ();
  778. if (err != CS_OK) {
  779. qb_log (LOG_ERR, "Can't send hc. Error %d", err);
  780. return 2;
  781. }
  782. sleep (1);
  783. err = cmap_get_uint64(cmap_handle, key_name, &tstamp2);
  784. if (err != CS_OK) {
  785. qb_log (LOG_INFO, "Could not get \"last_updated\" key: %d.", err);
  786. return (2);
  787. }
  788. msec_diff = (tstamp2 - tstamp1)/CS_TIME_NS_IN_MSEC;
  789. if (msec_diff < 500 || msec_diff > 2000) {
  790. qb_log (LOG_INFO, "Difference %d is not within <500, 2000> interval.", msec_diff);
  791. return (2);
  792. }
  793. qb_log (LOG_INFO, "iid %d: stop 2", instance_id);
  794. err = sam_stop ();
  795. if (err != CS_OK) {
  796. qb_log (LOG_ERR, "Can't stop hc. Error %d", err);
  797. return 2;
  798. }
  799. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  800. err = cmap_get_string(cmap_handle, key_name, &str);
  801. if (err != CS_OK) {
  802. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  803. return (2);
  804. }
  805. if (strcmp(str, "stopped") != 0) {
  806. qb_log (LOG_INFO, "State key is not \"stopped\".");
  807. free(str);
  808. return (2);
  809. }
  810. free(str);
  811. qb_log (LOG_INFO, "iid %d: exiting", instance_id);
  812. return (0);
  813. }
  814. }
  815. if (test_n == 3) {
  816. qb_log (LOG_INFO, "Testing if status is failed");
  817. /*
  818. * Previous should be FAILED
  819. */
  820. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  821. err = cmap_get_string(cmap_handle, key_name, &str);
  822. if (err != CS_OK) {
  823. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  824. return (2);
  825. }
  826. if (strcmp(str, "failed") != 0) {
  827. qb_log (LOG_INFO, "State key is not \"failed\".");
  828. free(str);
  829. return (2);
  830. }
  831. free(str);
  832. return (0);
  833. }
  834. return (2);
  835. }
  836. /*
  837. * Test cmap integration + restart policy
  838. */
  839. static int test9 (pid_t pid, pid_t old_pid, int test_n) {
  840. cs_error_t err;
  841. cmap_handle_t cmap_handle;
  842. unsigned int instance_id;
  843. char *str;
  844. char key_name[CMAP_KEYNAME_MAXLEN];
  845. err = cmap_initialize (&cmap_handle);
  846. if (err != CS_OK) {
  847. qb_log (LOG_INFO, "Could not initialize Cluster Map API instance error %d. Test skipped", err);
  848. return (1);
  849. }
  850. qb_log (LOG_INFO, "test %d", test_n);
  851. if (test_n == 1) {
  852. qb_log (LOG_INFO, " initialize");
  853. err = sam_initialize (2000, SAM_RECOVERY_POLICY_RESTART | SAM_RECOVERY_POLICY_CMAP);
  854. if (err != CS_OK) {
  855. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", err);
  856. return 2;
  857. }
  858. qb_log (LOG_INFO, " register");
  859. err = sam_register (&instance_id);
  860. if (err != CS_OK) {
  861. qb_log (LOG_ERR, "Can't register. Error %d", err);
  862. return 2;
  863. }
  864. qb_log (LOG_INFO, " iid %d", instance_id);
  865. if (instance_id < 3) {
  866. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.recovery", pid);
  867. err = cmap_get_string(cmap_handle, key_name, &str);
  868. if (err != CS_OK) {
  869. qb_log (LOG_INFO, "Could not get \"recovery\" key: %d.", err);
  870. return (2);
  871. }
  872. if (strcmp(str, "restart") != 0) {
  873. qb_log (LOG_INFO, "Recovery key \"%s\" is not \"restart\".", str);
  874. free(str);
  875. return (2);
  876. }
  877. free(str);
  878. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  879. err = cmap_get_string(cmap_handle, key_name, &str);
  880. if (err != CS_OK) {
  881. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  882. return (2);
  883. }
  884. if (strcmp(str, "stopped") != 0) {
  885. qb_log (LOG_INFO, "State key is not \"stopped\".");
  886. free(str);
  887. return (2);
  888. }
  889. free(str);
  890. qb_log (LOG_INFO, "iid %d: start", instance_id);
  891. err = sam_start ();
  892. if (err != CS_OK) {
  893. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  894. return 2;
  895. }
  896. err = cmap_get_string(cmap_handle, key_name, &str);
  897. if (err != CS_OK) {
  898. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  899. return (2);
  900. }
  901. if (strcmp(str, "running") != 0) {
  902. qb_log (LOG_INFO, "State key is not \"running\".");
  903. free(str);
  904. return (2);
  905. }
  906. free(str);
  907. qb_log (LOG_INFO, "iid %d: waiting for kill", instance_id);
  908. sleep (10);
  909. return (2);
  910. }
  911. if (instance_id == 3) {
  912. qb_log (LOG_INFO, "iid %d: mark failed", instance_id);
  913. err = sam_mark_failed ();
  914. if (err != CS_OK) {
  915. qb_log (LOG_ERR, "Can't mark failed. Error %d", err);
  916. return 2;
  917. }
  918. sleep (10);
  919. return (2);
  920. }
  921. return (2);
  922. }
  923. if (test_n == 2) {
  924. qb_log (LOG_INFO, "Testing if status is failed");
  925. /*
  926. * Previous should be FAILED
  927. */
  928. snprintf(key_name, CMAP_KEYNAME_MAXLEN, "resources.process.%d.state", pid);
  929. err = cmap_get_string(cmap_handle, key_name, &str);
  930. if (err != CS_OK) {
  931. qb_log (LOG_INFO, "Could not get \"state\" key: %d.", err);
  932. return (2);
  933. }
  934. if (strcmp(str, "failed") != 0) {
  935. qb_log (LOG_INFO, "State key is not \"failed\".");
  936. free(str);
  937. return (2);
  938. }
  939. free(str);
  940. return (0);
  941. }
  942. return (2);
  943. }
  944. static int hc_allways_respond_cb(void)
  945. {
  946. qb_log (LOG_INFO, "health check OK.");
  947. return 0;
  948. }
  949. static int setup_hc (void)
  950. {
  951. cs_error_t err;
  952. unsigned int instance_id;
  953. err = sam_initialize (1000, SAM_RECOVERY_POLICY_QUIT | SAM_RECOVERY_POLICY_CMAP);
  954. if (err != CS_OK) {
  955. qb_log (LOG_ERR, "Can't initialize SAM API. Error %d", err);
  956. return 2;
  957. }
  958. qb_log (LOG_INFO, " register");
  959. err = sam_register (&instance_id);
  960. if (err != CS_OK) {
  961. qb_log (LOG_ERR, "Can't register. Error %d", err);
  962. return 2;
  963. }
  964. err = sam_hc_callback_register (hc_allways_respond_cb);
  965. qb_log (LOG_INFO, "instance id %d: start", instance_id);
  966. err = sam_start ();
  967. if (err != CS_OK) {
  968. qb_log (LOG_ERR, "Can't start hc. Error %d", err);
  969. return 2;
  970. }
  971. return (0);
  972. }
  973. static int do_test_command(int sock, char* func, char*args[], int num_args)
  974. {
  975. int err = 0;
  976. pid_t pid;
  977. int stat;
  978. pid = fork ();
  979. if (pid == -1) {
  980. qb_log (LOG_ERR, "Can't fork");
  981. return -1;
  982. }
  983. if (pid == 0) {
  984. if (strcmp ("test1", func) == 0) {
  985. err = test1 ();
  986. } else if (strcmp ("test2", func) == 0) {
  987. err = test2 ();
  988. } else if (strcmp ("test3", func) == 0) {
  989. err = test3 ();
  990. } else if (strcmp ("test4", func) == 0) {
  991. err = test4 ();
  992. } else if (strcmp ("test5", func) == 0) {
  993. err = test5 ();
  994. } else if (strcmp ("test6", func) == 0) {
  995. err = test6 ();
  996. } else if (strcmp ("test8", func) == 0) {
  997. err = test8 (getpid(), 0, 1);
  998. } else if (strcmp ("test9", func) == 0) {
  999. err = test9 (getpid(), 0, 1);
  1000. }
  1001. sam_finalize ();
  1002. exit(err);
  1003. }
  1004. if (pid > 0) {
  1005. waitpid (pid, &stat, 0);
  1006. return WEXITSTATUS (stat);
  1007. }
  1008. return -1;
  1009. }
  1010. static void do_command (int sock, char* func, char*args[], int num_args)
  1011. {
  1012. char response[100];
  1013. int err = 0;
  1014. ssize_t rc;
  1015. size_t send_len;
  1016. qb_log (LOG_INFO, "RPC:%s() called.", func);
  1017. if (strncmp ("test", func, 4) == 0) {
  1018. err = do_test_command(sock, func, args, num_args);
  1019. } else if (strcmp ("setup_hc", func) == 0) {
  1020. err = setup_hc ();
  1021. } else if (strcmp ("sam_stop", func) == 0) {
  1022. err = sam_stop ();
  1023. if (err != CS_OK) {
  1024. qb_log (LOG_ERR,"RPC:%s sam_stop failed!", func);
  1025. snprintf (response, 100, "%s", FAIL_STR);
  1026. }
  1027. err = sam_finalize();
  1028. } else {
  1029. err = -1;
  1030. qb_log (LOG_ERR,"RPC:%s not supported!", func);
  1031. snprintf (response, 100, "%s", NOT_SUPPORTED_STR);
  1032. }
  1033. if (err == 0) {
  1034. snprintf (response, 100, "%s", OK_STR);
  1035. } else if (err == 1) {
  1036. snprintf (response, 100, "%s", FAIL_STR);
  1037. qb_log (LOG_ERR, "%s() test skipped?! (%d).", func, err);
  1038. } else {
  1039. snprintf (response, 100, "%s", FAIL_STR);
  1040. qb_log (LOG_ERR, "%s() failed (%d).", func, err);
  1041. }
  1042. send_len = strlen (response);
  1043. rc = send (sock, response, send_len, 0);
  1044. assert(rc == send_len);
  1045. }
  1046. int
  1047. main (int argc, char *argv[])
  1048. {
  1049. return test_agent_run ("sam_test_agent", 9036, do_command, NULL);
  1050. }