evs.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571
  1. /*
  2. * vi: set autoindent tabstop=4 shiftwidth=4 :
  3. * Copyright (c) 2004-2005 MontaVista Software, Inc.
  4. * Copyright (c) 2006-2007, 2009 Red Hat, Inc.
  5. *
  6. * All rights reserved.
  7. *
  8. * Author: Steven Dake (sdake@redhat.com)
  9. *
  10. * This software licensed under BSD license, the text of which follows:
  11. *
  12. * Redistribution and use in source and binary forms, with or without
  13. * modification, are permitted provided that the following conditions are met:
  14. *
  15. * - Redistributions of source code must retain the above copyright notice,
  16. * this list of conditions and the following disclaimer.
  17. * - Redistributions in binary form must reproduce the above copyright notice,
  18. * this list of conditions and the following disclaimer in the documentation
  19. * and/or other materials provided with the distribution.
  20. * - Neither the name of the MontaVista Software, Inc. nor the names of its
  21. * contributors may be used to endorse or promote products derived from this
  22. * software without specific prior written permission.
  23. *
  24. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  25. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  26. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  27. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  28. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  29. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  30. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  31. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  32. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  33. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  34. * THE POSSIBILITY OF SUCH DAMAGE.
  35. */
  36. /*
  37. * Provides an extended virtual synchrony API using the corosync executive
  38. */
  39. #include <config.h>
  40. #include <stdlib.h>
  41. #include <string.h>
  42. #include <unistd.h>
  43. #include <pthread.h>
  44. #include <sys/types.h>
  45. #include <sys/socket.h>
  46. #include <errno.h>
  47. #include <corosync/totem/totem.h>
  48. #include <corosync/corotypes.h>
  49. #include <corosync/evs.h>
  50. #include <corosync/ipc_evs.h>
  51. #include <corosync/coroipcc.h>
  52. #undef MIN
  53. #define MIN(x,y) ((x) < (y) ? (x) : (y))
  54. struct evs_inst {
  55. void *ipc_ctx;
  56. int finalize;
  57. evs_callbacks_t callbacks;
  58. pthread_mutex_t response_mutex;
  59. pthread_mutex_t dispatch_mutex;
  60. };
  /*
   * Forward declaration: the destructor is handed to the handle database
   * declaration below and defined afterwards.
   */
  static void evs_instance_destructor (void *instance);

  /*
   * Handle database through which evs_handle_t values are resolved to
   * struct evs_inst instances (see saHandleCreate / saHandleInstanceGet use).
   */
  DECLARE_SAHDB_DATABASE (evs_handle_t_db, evs_instance_destructor);
  63. /*
  64. * Clean up function for an evt instance (saEvtInitialize) handle
  65. */
  66. static void evs_instance_destructor (void *instance)
  67. {
  68. struct evs_inst *evs_inst = instance;
  69. pthread_mutex_destroy (&evs_inst->response_mutex);
  70. pthread_mutex_destroy (&evs_inst->dispatch_mutex);
  71. }
  72. /**
  73. * @defgroup evs_coroipcc The extended virtual synchrony passthrough API
  74. * @ingroup coroipcc
  75. *
  76. * @{
  77. */
  78. /**
  79. * test
  80. * @param handle The handle of evs initialize
  81. * @param callbacks The callbacks for evs_initialize
  82. * @returns EVS_OK
  83. */
  84. evs_error_t evs_initialize (
  85. evs_handle_t *handle,
  86. evs_callbacks_t *callbacks)
  87. {
  88. cs_error_t error;
  89. struct evs_inst *evs_inst;
  90. error = saHandleCreate (&evs_handle_t_db, sizeof (struct evs_inst), handle);
  91. if (error != CS_OK) {
  92. goto error_no_destroy;
  93. }
  94. error = saHandleInstanceGet (&evs_handle_t_db, *handle, (void *)&evs_inst);
  95. if (error != CS_OK) {
  96. goto error_destroy;
  97. }
  98. error = coroipcc_service_connect (
  99. IPC_SOCKET_NAME,
  100. EVS_SERVICE,
  101. IPC_REQUEST_SIZE,
  102. IPC_RESPONSE_SIZE,
  103. IPC_DISPATCH_SIZE,
  104. &evs_inst->ipc_ctx);
  105. if (error != EVS_OK) {
  106. goto error_put_destroy;
  107. }
  108. memcpy (&evs_inst->callbacks, callbacks, sizeof (evs_callbacks_t));
  109. pthread_mutex_init (&evs_inst->response_mutex, NULL);
  110. pthread_mutex_init (&evs_inst->dispatch_mutex, NULL);
  111. saHandleInstancePut (&evs_handle_t_db, *handle);
  112. return (CS_OK);
  113. error_put_destroy:
  114. saHandleInstancePut (&evs_handle_t_db, *handle);
  115. error_destroy:
  116. saHandleDestroy (&evs_handle_t_db, *handle);
  117. error_no_destroy:
  118. return (error);
  119. }
  120. evs_error_t evs_finalize (
  121. evs_handle_t handle)
  122. {
  123. struct evs_inst *evs_inst;
  124. cs_error_t error;
  125. error = saHandleInstanceGet (&evs_handle_t_db, handle, (void *)&evs_inst);
  126. if (error != CS_OK) {
  127. return (error);
  128. }
  129. pthread_mutex_lock (&evs_inst->response_mutex);
  130. /*
  131. * Another thread has already started finalizing
  132. */
  133. if (evs_inst->finalize) {
  134. pthread_mutex_unlock (&evs_inst->response_mutex);
  135. saHandleInstancePut (&evs_handle_t_db, handle);
  136. return (EVS_ERR_BAD_HANDLE);
  137. }
  138. evs_inst->finalize = 1;
  139. coroipcc_service_disconnect (evs_inst->ipc_ctx);
  140. pthread_mutex_unlock (&evs_inst->response_mutex);
  141. saHandleDestroy (&evs_handle_t_db, handle);
  142. saHandleInstancePut (&evs_handle_t_db, handle);
  143. return (EVS_OK);
  144. }
  145. evs_error_t evs_fd_get (
  146. evs_handle_t handle,
  147. int *fd)
  148. {
  149. cs_error_t error;
  150. struct evs_inst *evs_inst;
  151. error = saHandleInstanceGet (&evs_handle_t_db, handle, (void *)&evs_inst);
  152. if (error != CS_OK) {
  153. return (error);
  154. }
  155. *fd = coroipcc_fd_get (evs_inst->ipc_ctx);
  156. saHandleInstancePut (&evs_handle_t_db, handle);
  157. return (CS_OK);
  158. }
  159. evs_error_t evs_dispatch (
  160. evs_handle_t handle,
  161. cs_dispatch_flags_t dispatch_types)
  162. {
  163. int timeout = -1;
  164. cs_error_t error;
  165. int cont = 1; /* always continue do loop except when set to 0 */
  166. int dispatch_avail;
  167. struct evs_inst *evs_inst;
  168. struct res_evs_confchg_callback *res_evs_confchg_callback;
  169. struct res_evs_deliver_callback *res_evs_deliver_callback;
  170. evs_callbacks_t callbacks;
  171. mar_res_header_t *dispatch_data;
  172. int ignore_dispatch = 0;
  173. error = saHandleInstanceGet (&evs_handle_t_db, handle, (void *)&evs_inst);
  174. if (error != CS_OK) {
  175. return (error);
  176. }
  177. /*
  178. * Timeout instantly for SA_DISPATCH_ONE or SA_DISPATCH_ALL and
  179. * wait indefinately for SA_DISPATCH_BLOCKING
  180. */
  181. if (dispatch_types == EVS_DISPATCH_ALL) {
  182. timeout = 0;
  183. }
  184. do {
  185. pthread_mutex_lock (&evs_inst->dispatch_mutex);
  186. dispatch_avail = coroipcc_dispatch_get (
  187. evs_inst->ipc_ctx,
  188. (void **)&dispatch_data,
  189. timeout);
  190. pthread_mutex_unlock (&evs_inst->dispatch_mutex);
  191. if (dispatch_avail == 0 && dispatch_types == EVS_DISPATCH_ALL) {
  192. break; /* exit do while cont is 1 loop */
  193. } else
  194. if (dispatch_avail == 0) {
  195. continue; /* next dispatch event */
  196. }
  197. if (dispatch_avail == -1) {
  198. if (evs_inst->finalize == 1) {
  199. error = CS_OK;
  200. } else {
  201. error = CS_ERR_LIBRARY;
  202. }
  203. goto error_put;
  204. }
  205. /*
  206. * Make copy of callbacks, message data, unlock instance, and call callback
  207. * A risk of this dispatch method is that the callback routines may
  208. * operate at the same time that evsFinalize has been called.
  209. */
  210. memcpy (&callbacks, &evs_inst->callbacks, sizeof (evs_callbacks_t));
  211. /*
  212. * Dispatch incoming message
  213. */
  214. switch (dispatch_data->id) {
  215. case MESSAGE_RES_EVS_DELIVER_CALLBACK:
  216. res_evs_deliver_callback = (struct res_evs_deliver_callback *)dispatch_data;
  217. callbacks.evs_deliver_fn (
  218. res_evs_deliver_callback->local_nodeid,
  219. &res_evs_deliver_callback->msg,
  220. res_evs_deliver_callback->msglen);
  221. break;
  222. case MESSAGE_RES_EVS_CONFCHG_CALLBACK:
  223. res_evs_confchg_callback = (struct res_evs_confchg_callback *)dispatch_data;
  224. callbacks.evs_confchg_fn (
  225. res_evs_confchg_callback->member_list,
  226. res_evs_confchg_callback->member_list_entries,
  227. res_evs_confchg_callback->left_list,
  228. res_evs_confchg_callback->left_list_entries,
  229. res_evs_confchg_callback->joined_list,
  230. res_evs_confchg_callback->joined_list_entries);
  231. break;
  232. default:
  233. coroipcc_dispatch_put (evs_inst->ipc_ctx);
  234. error = CS_ERR_LIBRARY;
  235. goto error_put;
  236. break;
  237. }
  238. coroipcc_dispatch_put (evs_inst->ipc_ctx);
  239. /*
  240. * Determine if more messages should be processed
  241. * */
  242. switch (dispatch_types) {
  243. case EVS_DISPATCH_ONE:
  244. if (ignore_dispatch) {
  245. ignore_dispatch = 0;
  246. } else {
  247. cont = 0;
  248. }
  249. break;
  250. case EVS_DISPATCH_ALL:
  251. if (ignore_dispatch) {
  252. ignore_dispatch = 0;
  253. }
  254. break;
  255. case EVS_DISPATCH_BLOCKING:
  256. break;
  257. }
  258. } while (cont);
  259. error_put:
  260. saHandleInstancePut (&evs_handle_t_db, handle);
  261. return (error);
  262. }
  263. evs_error_t evs_join (
  264. evs_handle_t handle,
  265. const struct evs_group *groups,
  266. size_t group_entries)
  267. {
  268. evs_error_t error;
  269. struct evs_inst *evs_inst;
  270. struct iovec iov[2];
  271. struct req_lib_evs_join req_lib_evs_join;
  272. struct res_lib_evs_join res_lib_evs_join;
  273. error = saHandleInstanceGet (&evs_handle_t_db, handle, (void *)&evs_inst);
  274. if (error != EVS_OK) {
  275. return (error);
  276. }
  277. req_lib_evs_join.header.size = sizeof (struct req_lib_evs_join) +
  278. (group_entries * sizeof (struct evs_group));
  279. req_lib_evs_join.header.id = MESSAGE_REQ_EVS_JOIN;
  280. req_lib_evs_join.group_entries = group_entries;
  281. iov[0].iov_base = &req_lib_evs_join;
  282. iov[0].iov_len = sizeof (struct req_lib_evs_join);
  283. iov[1].iov_base = (void*) groups; /* cast away const */
  284. iov[1].iov_len = (group_entries * sizeof (struct evs_group));
  285. pthread_mutex_lock (&evs_inst->response_mutex);
  286. error = coroipcc_msg_send_reply_receive (evs_inst->ipc_ctx, iov, 2,
  287. &res_lib_evs_join, sizeof (struct res_lib_evs_join));
  288. pthread_mutex_unlock (&evs_inst->response_mutex);
  289. if (error != CS_OK) {
  290. goto error_exit;
  291. }
  292. error = res_lib_evs_join.header.error;
  293. error_exit:
  294. saHandleInstancePut (&evs_handle_t_db, handle);
  295. return (error);
  296. }
  297. evs_error_t evs_leave (
  298. evs_handle_t handle,
  299. const struct evs_group *groups,
  300. size_t group_entries)
  301. {
  302. evs_error_t error;
  303. struct evs_inst *evs_inst;
  304. struct iovec iov[2];
  305. struct req_lib_evs_leave req_lib_evs_leave;
  306. struct res_lib_evs_leave res_lib_evs_leave;
  307. error = saHandleInstanceGet (&evs_handle_t_db, handle, (void *)&evs_inst);
  308. if (error != CS_OK) {
  309. return (error);
  310. }
  311. req_lib_evs_leave.header.size = sizeof (struct req_lib_evs_leave) +
  312. (group_entries * sizeof (struct evs_group));
  313. req_lib_evs_leave.header.id = MESSAGE_REQ_EVS_LEAVE;
  314. req_lib_evs_leave.group_entries = group_entries;
  315. iov[0].iov_base = &req_lib_evs_leave;
  316. iov[0].iov_len = sizeof (struct req_lib_evs_leave);
  317. iov[1].iov_base = (void *) groups; /* cast away const */
  318. iov[1].iov_len = (group_entries * sizeof (struct evs_group));
  319. pthread_mutex_lock (&evs_inst->response_mutex);
  320. error = coroipcc_msg_send_reply_receive (evs_inst->ipc_ctx, iov, 2,
  321. &res_lib_evs_leave, sizeof (struct res_lib_evs_leave));
  322. pthread_mutex_unlock (&evs_inst->response_mutex);
  323. if (error != CS_OK) {
  324. goto error_exit;
  325. }
  326. error = res_lib_evs_leave.header.error;
  327. error_exit:
  328. saHandleInstancePut (&evs_handle_t_db, handle);
  329. return (error);
  330. }
  331. evs_error_t evs_mcast_joined (
  332. evs_handle_t handle,
  333. evs_guarantee_t guarantee,
  334. const struct iovec *iovec,
  335. unsigned int iov_len)
  336. {
  337. int i;
  338. evs_error_t error;
  339. struct evs_inst *evs_inst;
  340. struct iovec iov[64];
  341. struct req_lib_evs_mcast_joined req_lib_evs_mcast_joined;
  342. struct res_lib_evs_mcast_joined res_lib_evs_mcast_joined;
  343. size_t msg_len = 0;
  344. error = saHandleInstanceGet (&evs_handle_t_db, handle, (void *)&evs_inst);
  345. if (error != CS_OK) {
  346. return (error);
  347. }
  348. for (i = 0; i < iov_len; i++ ) {
  349. msg_len += iovec[i].iov_len;
  350. }
  351. req_lib_evs_mcast_joined.header.size = sizeof (struct req_lib_evs_mcast_joined) +
  352. msg_len;
  353. req_lib_evs_mcast_joined.header.id = MESSAGE_REQ_EVS_MCAST_JOINED;
  354. req_lib_evs_mcast_joined.guarantee = guarantee;
  355. req_lib_evs_mcast_joined.msg_len = msg_len;
  356. iov[0].iov_base = &req_lib_evs_mcast_joined;
  357. iov[0].iov_len = sizeof (struct req_lib_evs_mcast_joined);
  358. memcpy (&iov[1], iovec, iov_len * sizeof (struct iovec));
  359. pthread_mutex_lock (&evs_inst->response_mutex);
  360. error = coroipcc_msg_send_reply_receive (evs_inst->ipc_ctx, iov,
  361. iov_len + 1,
  362. &res_lib_evs_mcast_joined,
  363. sizeof (struct res_lib_evs_mcast_joined));
  364. pthread_mutex_unlock (&evs_inst->response_mutex);
  365. if (error != CS_OK) {
  366. goto error_exit;
  367. }
  368. error = res_lib_evs_mcast_joined.header.error;
  369. error_exit:
  370. saHandleInstancePut (&evs_handle_t_db, handle);
  371. return (error);
  372. }
  373. evs_error_t evs_mcast_groups (
  374. evs_handle_t handle,
  375. evs_guarantee_t guarantee,
  376. const struct evs_group *groups,
  377. size_t group_entries,
  378. const struct iovec *iovec,
  379. unsigned int iov_len)
  380. {
  381. int i;
  382. evs_error_t error;
  383. struct evs_inst *evs_inst;
  384. struct iovec iov[64]; /* FIXME: what if iov_len > 62 ? use malloc */
  385. struct req_lib_evs_mcast_groups req_lib_evs_mcast_groups;
  386. struct res_lib_evs_mcast_groups res_lib_evs_mcast_groups;
  387. size_t msg_len = 0;
  388. error = saHandleInstanceGet (&evs_handle_t_db, handle, (void *)&evs_inst);
  389. if (error != CS_OK) {
  390. return (error);
  391. }
  392. for (i = 0; i < iov_len; i++) {
  393. msg_len += iovec[i].iov_len;
  394. }
  395. req_lib_evs_mcast_groups.header.size = sizeof (struct req_lib_evs_mcast_groups) +
  396. (group_entries * sizeof (struct evs_group)) + msg_len;
  397. req_lib_evs_mcast_groups.header.id = MESSAGE_REQ_EVS_MCAST_GROUPS;
  398. req_lib_evs_mcast_groups.guarantee = guarantee;
  399. req_lib_evs_mcast_groups.msg_len = msg_len;
  400. req_lib_evs_mcast_groups.group_entries = group_entries;
  401. iov[0].iov_base = &req_lib_evs_mcast_groups;
  402. iov[0].iov_len = sizeof (struct req_lib_evs_mcast_groups);
  403. iov[1].iov_base = (void *) groups; /* cast away const */
  404. iov[1].iov_len = (group_entries * sizeof (struct evs_group));
  405. memcpy (&iov[2], iovec, iov_len * sizeof (struct iovec));
  406. pthread_mutex_lock (&evs_inst->response_mutex);
  407. error = coroipcc_msg_send_reply_receive (evs_inst->ipc_ctx, iov,
  408. iov_len + 2,
  409. &res_lib_evs_mcast_groups,
  410. sizeof (struct res_lib_evs_mcast_groups));
  411. pthread_mutex_unlock (&evs_inst->response_mutex);
  412. if (error != CS_OK) {
  413. goto error_exit;
  414. }
  415. error = res_lib_evs_mcast_groups.header.error;
  416. error_exit:
  417. saHandleInstancePut (&evs_handle_t_db, handle);
  418. return (error);
  419. }
  420. evs_error_t evs_membership_get (
  421. evs_handle_t handle,
  422. unsigned int *local_nodeid,
  423. unsigned int *member_list,
  424. size_t *member_list_entries)
  425. {
  426. evs_error_t error;
  427. struct evs_inst *evs_inst;
  428. struct iovec iov;
  429. struct req_lib_evs_membership_get req_lib_evs_membership_get;
  430. struct res_lib_evs_membership_get res_lib_evs_membership_get;
  431. error = saHandleInstanceGet (&evs_handle_t_db, handle, (void *)&evs_inst);
  432. if (error != CS_OK) {
  433. return (error);
  434. }
  435. req_lib_evs_membership_get.header.size = sizeof (struct req_lib_evs_membership_get);
  436. req_lib_evs_membership_get.header.id = MESSAGE_REQ_EVS_MEMBERSHIP_GET;
  437. iov.iov_base = &req_lib_evs_membership_get;
  438. iov.iov_len = sizeof (struct req_lib_evs_membership_get);
  439. pthread_mutex_lock (&evs_inst->response_mutex);
  440. error = coroipcc_msg_send_reply_receive (evs_inst->ipc_ctx,
  441. &iov,
  442. 1,
  443. &res_lib_evs_membership_get,
  444. sizeof (struct res_lib_evs_membership_get));
  445. pthread_mutex_unlock (&evs_inst->response_mutex);
  446. if (error != CS_OK) {
  447. goto error_exit;
  448. }
  449. error = res_lib_evs_membership_get.header.error;
  450. /*
  451. * Copy results to caller
  452. */
  453. if (local_nodeid) {
  454. *local_nodeid = res_lib_evs_membership_get.local_nodeid;
  455. }
  456. *member_list_entries = MIN (*member_list_entries,
  457. res_lib_evs_membership_get.member_list_entries);
  458. if (member_list) {
  459. memcpy (member_list, &res_lib_evs_membership_get.member_list,
  460. *member_list_entries * sizeof (struct in_addr));
  461. }
  462. error_exit:
  463. saHandleInstancePut (&evs_handle_t_db, handle);
  464. return (error);
  465. }
  466. /** @} */