vsf_quorum.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484
  1. /*
  2. * Copyright (c) 2008-2015 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Christine Caulfield (ccaulfie@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of Red Hat Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. #include <config.h>
  35. #include <pwd.h>
  36. #include <grp.h>
  37. #include <sys/types.h>
  38. #include <sys/poll.h>
  39. #include <sys/uio.h>
  40. #include <sys/mman.h>
  41. #include <sys/socket.h>
  42. #include <sys/un.h>
  43. #include <sys/time.h>
  44. #include <sys/resource.h>
  45. #include <netinet/in.h>
  46. #include <arpa/inet.h>
  47. #include <unistd.h>
  48. #include <fcntl.h>
  49. #include <stdlib.h>
  50. #include <stdio.h>
  51. #include <errno.h>
  52. #include <sched.h>
  53. #include <time.h>
  54. #include "quorum.h"
  55. #include <corosync/corotypes.h>
  56. #include <qb/qbipc_common.h>
  57. #include <corosync/corodefs.h>
  58. #include <corosync/swab.h>
  59. #include <qb/qblist.h>
  60. #include <corosync/mar_gen.h>
  61. #include <corosync/ipc_quorum.h>
  62. #include <corosync/coroapi.h>
  63. #include <corosync/logsys.h>
  64. #include <corosync/icmap.h>
  65. #include "service.h"
  66. #include "votequorum.h"
  67. #include "vsf_ykd.h"
  68. LOGSYS_DECLARE_SUBSYS ("QUORUM");
  69. struct quorum_pd {
  70. unsigned char track_flags;
  71. int tracking_enabled;
  72. struct qb_list_head list;
  73. void *conn;
  74. };
  75. struct internal_callback_pd {
  76. struct qb_list_head list;
  77. quorum_callback_fn_t callback;
  78. void *context;
  79. };
  /* Service engine entry points. */
  static char *quorum_exec_init_fn (struct corosync_api_v1 *api);
  static int quorum_lib_init_fn (void *conn);
  static int quorum_lib_exit_fn (void *conn);

  /* Handlers for requests arriving from library (IPC) clients. */
  static void message_handler_req_lib_quorum_getquorate (void *conn, const void *msg);
  static void message_handler_req_lib_quorum_trackstart (void *conn, const void *msg);
  static void message_handler_req_lib_quorum_trackstop (void *conn, const void *msg);
  static void message_handler_req_lib_quorum_gettype (void *conn, const void *msg);

  /* Notification fan-out to IPC clients and to in-process listeners. */
  static void send_library_notification(void *conn);
  static void send_internal_notification(void);
  93. static int primary_designated = 0;
  94. static int quorum_type = 0;
  95. static struct corosync_api_v1 *corosync_api;
  96. static struct qb_list_head lib_trackers_list;
  97. static struct qb_list_head internal_trackers_list;
  98. static struct memb_ring_id quorum_ring_id;
  99. static size_t quorum_view_list_entries = 0;
  100. static int quorum_view_list[PROCESSOR_COUNT_MAX];
  101. struct quorum_services_api_ver1 *quorum_iface = NULL;
  102. static char view_buf[64];
  103. static void log_view_list(const unsigned int *view_list, size_t view_list_entries)
  104. {
  105. int total = (int)view_list_entries;
  106. int len, pos, ret;
  107. int i = 0;
  108. while (1) {
  109. len = sizeof(view_buf);
  110. pos = 0;
  111. memset(view_buf, 0, len);
  112. for (; i < total; i++) {
  113. ret = snprintf(view_buf + pos, len - pos, " %u", view_list[i]);
  114. if (ret >= len - pos)
  115. break;
  116. pos += ret;
  117. }
  118. log_printf (LOGSYS_LEVEL_NOTICE, "Members[%d]:%s%s",
  119. total, view_buf, i < total ? "\\" : "");
  120. if (i == total)
  121. break;
  122. }
  123. }
  124. /* Internal quorum API function */
  125. static void quorum_api_set_quorum(const unsigned int *view_list,
  126. size_t view_list_entries,
  127. int quorum, struct memb_ring_id *ring_id)
  128. {
  129. int old_quorum = primary_designated;
  130. primary_designated = quorum;
  131. if (primary_designated && !old_quorum) {
  132. log_printf (LOGSYS_LEVEL_NOTICE, "This node is within the primary component and will provide service.");
  133. } else if (!primary_designated && old_quorum) {
  134. log_printf (LOGSYS_LEVEL_NOTICE, "This node is within the non-primary component and will NOT provide any services.");
  135. }
  136. quorum_view_list_entries = view_list_entries;
  137. memcpy(&quorum_ring_id, ring_id, sizeof (quorum_ring_id));
  138. memcpy(quorum_view_list, view_list, sizeof(unsigned int)*view_list_entries);
  139. log_view_list(view_list, view_list_entries);
  140. /* Tell internal listeners */
  141. send_internal_notification();
  142. /* Tell IPC listeners */
  143. send_library_notification(NULL);
  144. }
  145. static struct corosync_lib_handler quorum_lib_service[] =
  146. {
  147. { /* 0 */
  148. .lib_handler_fn = message_handler_req_lib_quorum_getquorate,
  149. .flow_control = CS_LIB_FLOW_CONTROL_NOT_REQUIRED
  150. },
  151. { /* 1 */
  152. .lib_handler_fn = message_handler_req_lib_quorum_trackstart,
  153. .flow_control = CS_LIB_FLOW_CONTROL_NOT_REQUIRED
  154. },
  155. { /* 2 */
  156. .lib_handler_fn = message_handler_req_lib_quorum_trackstop,
  157. .flow_control = CS_LIB_FLOW_CONTROL_NOT_REQUIRED
  158. },
  159. { /* 3 */
  160. .lib_handler_fn = message_handler_req_lib_quorum_gettype,
  161. .flow_control = CS_LIB_FLOW_CONTROL_NOT_REQUIRED
  162. }
  163. };
  164. static struct corosync_service_engine quorum_service_handler = {
  165. .name = "corosync cluster quorum service v0.1",
  166. .id = QUORUM_SERVICE,
  167. .priority = 1,
  168. .private_data_size = sizeof (struct quorum_pd),
  169. .flow_control = CS_LIB_FLOW_CONTROL_NOT_REQUIRED,
  170. .allow_inquorate = CS_LIB_ALLOW_INQUORATE,
  171. .lib_init_fn = quorum_lib_init_fn,
  172. .lib_exit_fn = quorum_lib_exit_fn,
  173. .lib_engine = quorum_lib_service,
  174. .exec_init_fn = quorum_exec_init_fn,
  175. .lib_engine_count = sizeof (quorum_lib_service) / sizeof (struct corosync_lib_handler)
  176. };
  177. struct corosync_service_engine *vsf_quorum_get_service_engine_ver0 (void)
  178. {
  179. return (&quorum_service_handler);
  180. }
  181. /* -------------------------------------------------- */
  182. /*
  183. * Internal API functions for corosync
  184. */
  185. static int quorum_quorate(void)
  186. {
  187. return primary_designated;
  188. }
  189. static int quorum_register_callback(quorum_callback_fn_t function, void *context)
  190. {
  191. struct internal_callback_pd *pd = malloc(sizeof(struct internal_callback_pd));
  192. if (!pd)
  193. return -1;
  194. pd->context = context;
  195. pd->callback = function;
  196. qb_list_add (&pd->list, &internal_trackers_list);
  197. return 0;
  198. }
  199. static int quorum_unregister_callback(quorum_callback_fn_t function, void *context)
  200. {
  201. struct internal_callback_pd *pd;
  202. struct qb_list_head *tmp, *tmp_iter;
  203. qb_list_for_each_safe(tmp, tmp_iter, &internal_trackers_list) {
  204. pd = qb_list_entry(tmp, struct internal_callback_pd, list);
  205. if (pd->callback == function && pd->context == context) {
  206. qb_list_del(&pd->list);
  207. free(pd);
  208. return 0;
  209. }
  210. }
  211. return -1;
  212. }
  213. static struct quorum_callin_functions callins = {
  214. .quorate = quorum_quorate,
  215. .register_callback = quorum_register_callback,
  216. .unregister_callback = quorum_unregister_callback
  217. };
  218. /* --------------------------------------------------------------------- */
  219. static char *quorum_exec_init_fn (struct corosync_api_v1 *api)
  220. {
  221. char *quorum_module = NULL;
  222. char *error;
  223. corosync_api = api;
  224. qb_list_init (&lib_trackers_list);
  225. qb_list_init (&internal_trackers_list);
  226. /*
  227. * Tell corosync we have a quorum engine.
  228. */
  229. api->quorum_initialize(&callins);
  230. /*
  231. * Look for a quorum provider
  232. */
  233. if (icmap_get_string("quorum.provider", &quorum_module) == CS_OK) {
  234. log_printf (LOGSYS_LEVEL_NOTICE,
  235. "Using quorum provider %s", quorum_module);
  236. error = (char *)"Invalid quorum provider";
  237. if (strcmp (quorum_module, "corosync_votequorum") == 0) {
  238. error = votequorum_init (api, quorum_api_set_quorum);
  239. quorum_type = 1;
  240. }
  241. if (strcmp (quorum_module, "corosync_ykd") == 0) {
  242. error = ykd_init (api, quorum_api_set_quorum);
  243. quorum_type = 1;
  244. }
  245. if (error) {
  246. log_printf (LOGSYS_LEVEL_CRIT,
  247. "Quorum provider: %s failed to initialize.",
  248. quorum_module);
  249. free(quorum_module);
  250. return (error);
  251. }
  252. }
  253. if (quorum_module) {
  254. free(quorum_module);
  255. quorum_module = NULL;
  256. }
  257. /*
  258. * setting quorum_type and primary_designated in the right order is important
  259. * always try to lookup/init a quorum module, then revert back to be quorate
  260. */
  261. if (quorum_type == 0) {
  262. primary_designated = 1;
  263. }
  264. return (NULL);
  265. }
  266. static int quorum_lib_init_fn (void *conn)
  267. {
  268. struct quorum_pd *pd = (struct quorum_pd *)corosync_api->ipc_private_data_get (conn);
  269. log_printf(LOGSYS_LEVEL_DEBUG, "lib_init_fn: conn=%p", conn);
  270. qb_list_init (&pd->list);
  271. pd->conn = conn;
  272. return (0);
  273. }
  274. static int quorum_lib_exit_fn (void *conn)
  275. {
  276. struct quorum_pd *quorum_pd = (struct quorum_pd *)corosync_api->ipc_private_data_get (conn);
  277. log_printf(LOGSYS_LEVEL_DEBUG, "lib_exit_fn: conn=%p", conn);
  278. if (quorum_pd->tracking_enabled) {
  279. qb_list_del (&quorum_pd->list);
  280. qb_list_init (&quorum_pd->list);
  281. }
  282. return (0);
  283. }
  284. static void send_internal_notification(void)
  285. {
  286. struct qb_list_head *tmp;
  287. struct internal_callback_pd *pd;
  288. qb_list_for_each(tmp, &internal_trackers_list) {
  289. pd = qb_list_entry(tmp, struct internal_callback_pd, list);
  290. pd->callback(primary_designated, pd->context);
  291. }
  292. }
  293. static void send_library_notification(void *conn)
  294. {
  295. int size = sizeof(struct res_lib_quorum_notification) + sizeof(unsigned int)*quorum_view_list_entries;
  296. char buf[size];
  297. struct res_lib_quorum_notification *res_lib_quorum_notification = (struct res_lib_quorum_notification *)buf;
  298. struct qb_list_head *tmp;
  299. int i;
  300. log_printf(LOGSYS_LEVEL_DEBUG, "sending quorum notification to %p, length = %d", conn, size);
  301. res_lib_quorum_notification->quorate = primary_designated;
  302. res_lib_quorum_notification->ring_seq = quorum_ring_id.seq;
  303. res_lib_quorum_notification->view_list_entries = quorum_view_list_entries;
  304. for (i=0; i<quorum_view_list_entries; i++) {
  305. res_lib_quorum_notification->view_list[i] = quorum_view_list[i];
  306. }
  307. res_lib_quorum_notification->header.id = MESSAGE_RES_QUORUM_NOTIFICATION;
  308. res_lib_quorum_notification->header.size = size;
  309. res_lib_quorum_notification->header.error = CS_OK;
  310. /* Send it to all interested parties */
  311. if (conn) {
  312. corosync_api->ipc_dispatch_send(conn, res_lib_quorum_notification, size);
  313. }
  314. else {
  315. struct quorum_pd *qpd;
  316. qb_list_for_each(tmp, &lib_trackers_list) {
  317. qpd = qb_list_entry(tmp, struct quorum_pd, list);
  318. corosync_api->ipc_dispatch_send(qpd->conn,
  319. res_lib_quorum_notification, size);
  320. }
  321. }
  322. return;
  323. }
  324. static void message_handler_req_lib_quorum_getquorate (void *conn,
  325. const void *msg)
  326. {
  327. struct res_lib_quorum_getquorate res_lib_quorum_getquorate;
  328. log_printf(LOGSYS_LEVEL_DEBUG, "got quorate request on %p", conn);
  329. /* send status */
  330. res_lib_quorum_getquorate.quorate = primary_designated;
  331. res_lib_quorum_getquorate.header.size = sizeof(res_lib_quorum_getquorate);
  332. res_lib_quorum_getquorate.header.id = MESSAGE_RES_QUORUM_GETQUORATE;
  333. res_lib_quorum_getquorate.header.error = CS_OK;
  334. corosync_api->ipc_response_send(conn, &res_lib_quorum_getquorate, sizeof(res_lib_quorum_getquorate));
  335. }
  336. static void message_handler_req_lib_quorum_trackstart (void *conn,
  337. const void *msg)
  338. {
  339. const struct req_lib_quorum_trackstart *req_lib_quorum_trackstart = msg;
  340. struct qb_ipc_response_header res;
  341. struct quorum_pd *quorum_pd = (struct quorum_pd *)corosync_api->ipc_private_data_get (conn);
  342. cs_error_t error = CS_OK;
  343. log_printf(LOGSYS_LEVEL_DEBUG, "got trackstart request on %p", conn);
  344. /*
  345. * If an immediate listing of the current cluster membership
  346. * is requested, generate membership list
  347. */
  348. if (req_lib_quorum_trackstart->track_flags & CS_TRACK_CURRENT ||
  349. req_lib_quorum_trackstart->track_flags & CS_TRACK_CHANGES) {
  350. log_printf(LOGSYS_LEVEL_DEBUG, "sending initial status to %p", conn);
  351. send_library_notification(conn);
  352. }
  353. if (quorum_pd->tracking_enabled) {
  354. error = CS_ERR_EXIST;
  355. goto response_send;
  356. }
  357. /*
  358. * Record requests for tracking
  359. */
  360. if (req_lib_quorum_trackstart->track_flags & CS_TRACK_CHANGES ||
  361. req_lib_quorum_trackstart->track_flags & CS_TRACK_CHANGES_ONLY) {
  362. quorum_pd->track_flags = req_lib_quorum_trackstart->track_flags;
  363. quorum_pd->tracking_enabled = 1;
  364. qb_list_add (&quorum_pd->list, &lib_trackers_list);
  365. }
  366. response_send:
  367. /* send status */
  368. res.size = sizeof(res);
  369. res.id = MESSAGE_RES_QUORUM_TRACKSTART;
  370. res.error = error;
  371. corosync_api->ipc_response_send(conn, &res, sizeof(struct qb_ipc_response_header));
  372. }
  373. static void message_handler_req_lib_quorum_trackstop (void *conn, const void *msg)
  374. {
  375. struct qb_ipc_response_header res;
  376. struct quorum_pd *quorum_pd = (struct quorum_pd *)corosync_api->ipc_private_data_get (conn);
  377. log_printf(LOGSYS_LEVEL_DEBUG, "got trackstop request on %p", conn);
  378. if (quorum_pd->tracking_enabled) {
  379. res.error = CS_OK;
  380. quorum_pd->tracking_enabled = 0;
  381. qb_list_del (&quorum_pd->list);
  382. qb_list_init (&quorum_pd->list);
  383. } else {
  384. res.error = CS_ERR_NOT_EXIST;
  385. }
  386. /* send status */
  387. res.size = sizeof(res);
  388. res.id = MESSAGE_RES_QUORUM_TRACKSTOP;
  389. res.error = CS_OK;
  390. corosync_api->ipc_response_send(conn, &res, sizeof(struct qb_ipc_response_header));
  391. }
  392. static void message_handler_req_lib_quorum_gettype (void *conn,
  393. const void *msg)
  394. {
  395. struct res_lib_quorum_gettype res_lib_quorum_gettype;
  396. log_printf(LOGSYS_LEVEL_DEBUG, "got quorum_type request on %p", conn);
  397. /* send status */
  398. res_lib_quorum_gettype.quorum_type = quorum_type;
  399. res_lib_quorum_gettype.header.size = sizeof(res_lib_quorum_gettype);
  400. res_lib_quorum_gettype.header.id = MESSAGE_RES_QUORUM_GETTYPE;
  401. res_lib_quorum_gettype.header.error = CS_OK;
  402. corosync_api->ipc_response_send(conn, &res_lib_quorum_gettype, sizeof(res_lib_quorum_gettype));
  403. }