ipc_glue.c 24 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902
  1. /*
  2. * Copyright (c) 2010-2012 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Angus Salkeld <asalkeld@redhat.com>
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. #include <config.h>
  35. #include <stdlib.h>
  36. #include <stdio.h>
  37. #include <errno.h>
  38. #include <assert.h>
  39. #include <sys/uio.h>
  40. #include <string.h>
  41. #include <qb/qbdefs.h>
  42. #include <qb/qblist.h>
  43. #include <qb/qbutil.h>
  44. #include <qb/qbloop.h>
  45. #include <qb/qbipcs.h>
  46. #include <corosync/swab.h>
  47. #include <corosync/corotypes.h>
  48. #include <corosync/corodefs.h>
  49. #include <corosync/totem/totempg.h>
  50. #include <corosync/logsys.h>
  51. #include <corosync/icmap.h>
  52. #include "sync.h"
  53. #include "timer.h"
  54. #include "main.h"
  55. #include "util.h"
  56. #include "apidef.h"
  57. #include "service.h"
  58. LOGSYS_DECLARE_SUBSYS ("MAIN");
  59. static struct corosync_api_v1 *api = NULL;
  60. static int32_t ipc_not_enough_fds_left = 0;
  61. static int32_t ipc_fc_is_quorate; /* boolean */
  62. static int32_t ipc_fc_totem_queue_level; /* percentage used */
  63. static int32_t ipc_fc_sync_in_process; /* boolean */
  64. static int32_t ipc_allow_connections = 0; /* boolean */
  65. #define CS_IPCS_MAPPER_SERV_NAME 256
  66. struct cs_ipcs_mapper {
  67. int32_t id;
  68. qb_ipcs_service_t *inst;
  69. char name[CS_IPCS_MAPPER_SERV_NAME];
  70. };
  71. struct outq_item {
  72. void *msg;
  73. size_t mlen;
  74. struct qb_list_head list;
  75. };
  76. static struct cs_ipcs_mapper ipcs_mapper[SERVICES_COUNT_MAX];
  77. static int32_t cs_ipcs_job_add(enum qb_loop_priority p, void *data, qb_loop_job_dispatch_fn fn);
  78. static int32_t cs_ipcs_dispatch_add(enum qb_loop_priority p, int32_t fd, int32_t events,
  79. void *data, qb_ipcs_dispatch_fn_t fn);
  80. static int32_t cs_ipcs_dispatch_mod(enum qb_loop_priority p, int32_t fd, int32_t events,
  81. void *data, qb_ipcs_dispatch_fn_t fn);
  82. static int32_t cs_ipcs_dispatch_del(int32_t fd);
  83. static void outq_flush (void *data);
  84. static struct qb_ipcs_poll_handlers corosync_poll_funcs = {
  85. .job_add = cs_ipcs_job_add,
  86. .dispatch_add = cs_ipcs_dispatch_add,
  87. .dispatch_mod = cs_ipcs_dispatch_mod,
  88. .dispatch_del = cs_ipcs_dispatch_del,
  89. };
  90. static int32_t cs_ipcs_connection_accept (qb_ipcs_connection_t *c, uid_t euid, gid_t egid);
  91. static void cs_ipcs_connection_created(qb_ipcs_connection_t *c);
  92. static int32_t cs_ipcs_msg_process(qb_ipcs_connection_t *c,
  93. void *data, size_t size);
  94. static int32_t cs_ipcs_connection_closed (qb_ipcs_connection_t *c);
  95. static void cs_ipcs_connection_destroyed (qb_ipcs_connection_t *c);
  96. static struct qb_ipcs_service_handlers corosync_service_funcs = {
  97. .connection_accept = cs_ipcs_connection_accept,
  98. .connection_created = cs_ipcs_connection_created,
  99. .msg_process = cs_ipcs_msg_process,
  100. .connection_closed = cs_ipcs_connection_closed,
  101. .connection_destroyed = cs_ipcs_connection_destroyed,
  102. };
  103. static const char* cs_ipcs_serv_short_name(int32_t service_id)
  104. {
  105. const char *name;
  106. switch (service_id) {
  107. case CFG_SERVICE:
  108. name = "cfg";
  109. break;
  110. case CPG_SERVICE:
  111. name = "cpg";
  112. break;
  113. case QUORUM_SERVICE:
  114. name = "quorum";
  115. break;
  116. case PLOAD_SERVICE:
  117. name = "pload";
  118. break;
  119. case VOTEQUORUM_SERVICE:
  120. name = "votequorum";
  121. break;
  122. case MON_SERVICE:
  123. name = "mon";
  124. break;
  125. case WD_SERVICE:
  126. name = "wd";
  127. break;
  128. case CMAP_SERVICE:
  129. name = "cmap";
  130. break;
  131. default:
  132. name = NULL;
  133. break;
  134. }
  135. return name;
  136. }
  137. void cs_ipc_allow_connections(int32_t allow)
  138. {
  139. ipc_allow_connections = allow;
  140. }
  141. int32_t cs_ipcs_service_destroy(int32_t service_id)
  142. {
  143. if (ipcs_mapper[service_id].inst) {
  144. qb_ipcs_destroy(ipcs_mapper[service_id].inst);
  145. ipcs_mapper[service_id].inst = NULL;
  146. }
  147. return 0;
  148. }
  149. static int32_t cs_ipcs_connection_accept (qb_ipcs_connection_t *c, uid_t euid, gid_t egid)
  150. {
  151. int32_t service = qb_ipcs_service_id_get(c);
  152. uint8_t u8;
  153. char key_name[ICMAP_KEYNAME_MAXLEN];
  154. if (!ipc_allow_connections) {
  155. log_printf(LOGSYS_LEVEL_DEBUG, "Denied connection, corosync is not ready");
  156. return -EAGAIN;
  157. }
  158. if (corosync_service[service] == NULL ||
  159. ipcs_mapper[service].inst == NULL) {
  160. return -ENOSYS;
  161. }
  162. if (ipc_not_enough_fds_left) {
  163. return -EMFILE;
  164. }
  165. if (euid == 0 || egid == 0) {
  166. return 0;
  167. }
  168. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "uidgid.uid.%u", euid);
  169. if (icmap_get_uint8(key_name, &u8) == CS_OK && u8 == 1)
  170. return 0;
  171. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "uidgid.config.uid.%u", euid);
  172. if (icmap_get_uint8(key_name, &u8) == CS_OK && u8 == 1)
  173. return 0;
  174. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "uidgid.gid.%u", egid);
  175. if (icmap_get_uint8(key_name, &u8) == CS_OK && u8 == 1)
  176. return 0;
  177. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "uidgid.config.gid.%u", egid);
  178. if (icmap_get_uint8(key_name, &u8) == CS_OK && u8 == 1)
  179. return 0;
  180. log_printf(LOGSYS_LEVEL_ERROR, "Denied connection attempt from %d:%d", euid, egid);
  181. return -EACCES;
  182. }
  /*
   * Look up the command name of a process by reading /proc/<pid>/stat.
   *
   * pid       process to look up
   * out_name  caller-supplied buffer that receives the NUL-terminated name
   * name_len  size of out_name in bytes; longer names are truncated
   *
   * Returns out_name on success. Returns NULL when out_name is NULL,
   * name_len is 0, the stat file cannot be opened or read, or no
   * "(name) " field is found in the first line.
   */
  static char * pid_to_name (pid_t pid, char *out_name, size_t name_len)
  {
      char fname[32];
      char buf[256];
      char *name;
      char *rest;
      FILE *fp;

      /* A zero-sized buffer cannot even hold the terminator. */
      if (out_name == NULL || name_len == 0) {
          return NULL;
      }

      snprintf (fname, sizeof (fname), "/proc/%d/stat", (int)pid);
      fp = fopen (fname, "r");
      if (!fp) {
          return NULL;
      }

      if (fgets (buf, sizeof (buf), fp) == NULL) {
          fclose (fp);
          return NULL;
      }
      fclose (fp);

      /*
       * The name is wrapped in parentheses and may itself contain '(' or
       * ')'. The FIRST '(' therefore opens the field and the LAST ')'
       * closes it; searching for the last '(' would cut such names short.
       */
      name = strchr (buf, '(');
      if (!name) {
          return NULL;
      }
      /* move past the bracket */
      name++;

      rest = strrchr (name, ')');
      if (rest == NULL || rest[1] != ' ') {
          return NULL;
      }
      *rest = '\0';

      /* bounded copy, always NUL-terminated */
      snprintf (out_name, name_len, "%s", name);
      return out_name;
  }
  218. struct cs_ipcs_conn_context {
  219. char *icmap_path;
  220. struct qb_list_head outq_head;
  221. int32_t queuing;
  222. uint32_t queued;
  223. uint64_t invalid_request;
  224. uint64_t overload;
  225. uint32_t sent;
  226. char data[1];
  227. };
  228. static void cs_ipcs_connection_created(qb_ipcs_connection_t *c)
  229. {
  230. int32_t service = 0;
  231. struct cs_ipcs_conn_context *context;
  232. char proc_name[32];
  233. struct qb_ipcs_connection_stats stats;
  234. int32_t size = sizeof(struct cs_ipcs_conn_context);
  235. char key_name[ICMAP_KEYNAME_MAXLEN];
  236. int set_client_pid = 0;
  237. int set_proc_name = 0;
  238. log_printf(LOG_DEBUG, "connection created");
  239. service = qb_ipcs_service_id_get(c);
  240. size += corosync_service[service]->private_data_size;
  241. context = calloc(1, size);
  242. if (context == NULL) {
  243. qb_ipcs_disconnect(c);
  244. return;
  245. }
  246. qb_list_init(&context->outq_head);
  247. context->queuing = QB_FALSE;
  248. context->queued = 0;
  249. context->sent = 0;
  250. qb_ipcs_context_set(c, context);
  251. if (corosync_service[service]->lib_init_fn(c) != 0) {
  252. log_printf(LOG_ERR, "lib_init_fn failed, disconnecting");
  253. qb_ipcs_disconnect(c);
  254. return;
  255. }
  256. icmap_inc("runtime.connections.active");
  257. qb_ipcs_connection_stats_get(c, &stats, QB_FALSE);
  258. if (stats.client_pid > 0) {
  259. if (pid_to_name (stats.client_pid, proc_name, sizeof(proc_name))) {
  260. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "runtime.connections.%s:%u:%p",
  261. proc_name, stats.client_pid, c);
  262. set_proc_name = 1;
  263. } else {
  264. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "runtime.connections.%u:%p",
  265. stats.client_pid, c);
  266. }
  267. set_client_pid = 1;
  268. } else {
  269. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "runtime.connections.%p", c);
  270. }
  271. icmap_convert_name_to_valid_name(key_name);
  272. context->icmap_path = strdup(key_name);
  273. if (context->icmap_path == NULL) {
  274. qb_ipcs_disconnect(c);
  275. return;
  276. }
  277. if (set_proc_name) {
  278. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.name", context->icmap_path);
  279. icmap_set_string(key_name, proc_name);
  280. }
  281. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.client_pid", context->icmap_path);
  282. if (set_client_pid) {
  283. icmap_set_uint32(key_name, stats.client_pid);
  284. } else {
  285. icmap_set_uint32(key_name, 0);
  286. }
  287. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.service_id", context->icmap_path);
  288. icmap_set_uint32(key_name, service);
  289. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.responses", context->icmap_path);
  290. icmap_set_uint64(key_name, 0);
  291. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.dispatched", context->icmap_path);
  292. icmap_set_uint64(key_name, 0);
  293. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.requests", context->icmap_path);
  294. icmap_set_uint64(key_name, 0);
  295. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.send_retries", context->icmap_path);
  296. icmap_set_uint64(key_name, 0);
  297. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.recv_retries", context->icmap_path);
  298. icmap_set_uint64(key_name, 0);
  299. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.flow_control", context->icmap_path);
  300. icmap_set_uint32(key_name, 0);
  301. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.flow_control_count", context->icmap_path);
  302. icmap_set_uint64(key_name, 0);
  303. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.queue_size", context->icmap_path);
  304. icmap_set_uint32(key_name, 0);
  305. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.invalid_request", context->icmap_path);
  306. icmap_set_uint64(key_name, 0);
  307. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.overload", context->icmap_path);
  308. icmap_set_uint64(key_name, 0);
  309. }
  /* Take one reference on an IPC connection (forwards to libqb). */
  void cs_ipc_refcnt_inc(void *conn)
  {
      qb_ipcs_connection_ref(conn);
  }
  /* Drop one reference on an IPC connection (forwards to libqb). */
  void cs_ipc_refcnt_dec(void *conn)
  {
      qb_ipcs_connection_unref(conn);
  }
  318. void *cs_ipcs_private_data_get(void *conn)
  319. {
  320. struct cs_ipcs_conn_context *cnx;
  321. cnx = qb_ipcs_context_get(conn);
  322. return &cnx->data[0];
  323. }
  324. static void cs_ipcs_connection_destroyed (qb_ipcs_connection_t *c)
  325. {
  326. struct cs_ipcs_conn_context *context;
  327. struct qb_list_head *list, *tmp_iter;
  328. struct outq_item *outq_item;
  329. log_printf(LOG_DEBUG, "%s() ", __func__);
  330. context = qb_ipcs_context_get(c);
  331. if (context) {
  332. qb_list_for_each_safe(list, tmp_iter, &(context->outq_head)) {
  333. outq_item = qb_list_entry (list, struct outq_item, list);
  334. qb_list_del (list);
  335. free (outq_item->msg);
  336. free (outq_item);
  337. }
  338. free(context);
  339. }
  340. }
  341. static int32_t cs_ipcs_connection_closed (qb_ipcs_connection_t *c)
  342. {
  343. int32_t res = 0;
  344. int32_t service = qb_ipcs_service_id_get(c);
  345. icmap_iter_t iter;
  346. char prefix[ICMAP_KEYNAME_MAXLEN];
  347. const char *key_name;
  348. struct cs_ipcs_conn_context *cnx;
  349. log_printf(LOG_DEBUG, "%s() ", __func__);
  350. res = corosync_service[service]->lib_exit_fn(c);
  351. if (res != 0) {
  352. return res;
  353. }
  354. qb_loop_job_del(cs_poll_handle_get(), QB_LOOP_HIGH, c, outq_flush);
  355. cnx = qb_ipcs_context_get(c);
  356. snprintf(prefix, ICMAP_KEYNAME_MAXLEN, "%s.", cnx->icmap_path);
  357. iter = icmap_iter_init(prefix);
  358. while ((key_name = icmap_iter_next(iter, NULL, NULL)) != NULL) {
  359. icmap_delete(key_name);
  360. }
  361. icmap_iter_finalize(iter);
  362. free(cnx->icmap_path);
  363. icmap_inc("runtime.connections.closed");
  364. icmap_dec("runtime.connections.active");
  365. return 0;
  366. }
  /*
   * Send a scatter/gather response on a connection.
   *
   * Returns 0 when qb_ipcs_response_sendv() reports a non-negative
   * result, otherwise its negative return value.
   */
  int cs_ipcs_response_iov_send (void *conn,
      const struct iovec *iov,
      unsigned int iov_len)
  {
      int32_t sent = qb_ipcs_response_sendv(conn, iov, iov_len);

      return (sent < 0) ? sent : 0;
  }
  /*
   * Send a single-buffer response on a connection.
   *
   * Returns 0 when qb_ipcs_response_send() reports a non-negative result,
   * otherwise its negative return value.
   */
  int cs_ipcs_response_send(void *conn, const void *msg, size_t mlen)
  {
      int32_t sent = qb_ipcs_response_send(conn, msg, mlen);

      return (sent < 0) ? sent : 0;
  }
  385. static void outq_flush (void *data)
  386. {
  387. qb_ipcs_connection_t *conn = data;
  388. struct qb_list_head *list, *tmp_iter;
  389. struct outq_item *outq_item;
  390. int32_t rc;
  391. struct cs_ipcs_conn_context *context = qb_ipcs_context_get(conn);
  392. qb_list_for_each_safe(list, tmp_iter, &(context->outq_head)) {
  393. outq_item = qb_list_entry (list, struct outq_item, list);
  394. rc = qb_ipcs_event_send(conn, outq_item->msg, outq_item->mlen);
  395. if (rc < 0 && rc != -EAGAIN) {
  396. errno = -rc;
  397. qb_perror(LOG_ERR, "qb_ipcs_event_send");
  398. return;
  399. } else if (rc == -EAGAIN) {
  400. break;
  401. }
  402. assert(rc == outq_item->mlen);
  403. context->sent++;
  404. context->queued--;
  405. qb_list_del (list);
  406. free (outq_item->msg);
  407. free (outq_item);
  408. }
  409. if (qb_list_empty (&context->outq_head)) {
  410. context->queuing = QB_FALSE;
  411. log_printf(LOGSYS_LEVEL_INFO, "Q empty, queued:%d sent:%d.",
  412. context->queued, context->sent);
  413. context->queued = 0;
  414. context->sent = 0;
  415. } else {
  416. qb_loop_job_add(cs_poll_handle_get(), QB_LOOP_HIGH, conn, outq_flush);
  417. }
  418. }
  419. static void msg_send_or_queue(qb_ipcs_connection_t *conn, const struct iovec *iov, uint32_t iov_len)
  420. {
  421. int32_t rc = 0;
  422. int32_t i;
  423. int32_t bytes_msg = 0;
  424. struct outq_item *outq_item;
  425. char *write_buf = 0;
  426. struct cs_ipcs_conn_context *context = qb_ipcs_context_get(conn);
  427. for (i = 0; i < iov_len; i++) {
  428. bytes_msg += iov[i].iov_len;
  429. }
  430. if (!context->queuing) {
  431. assert(qb_list_empty (&context->outq_head));
  432. rc = qb_ipcs_event_sendv(conn, iov, iov_len);
  433. if (rc == bytes_msg) {
  434. context->sent++;
  435. return;
  436. }
  437. if (rc == -EAGAIN) {
  438. context->queued = 0;
  439. context->sent = 0;
  440. context->queuing = QB_TRUE;
  441. qb_loop_job_add(cs_poll_handle_get(), QB_LOOP_HIGH, conn, outq_flush);
  442. } else {
  443. log_printf(LOGSYS_LEVEL_ERROR, "event_send retuned %d, expected %d!", rc, bytes_msg);
  444. return;
  445. }
  446. }
  447. outq_item = malloc (sizeof (struct outq_item));
  448. if (outq_item == NULL) {
  449. qb_ipcs_disconnect(conn);
  450. return;
  451. }
  452. outq_item->msg = malloc (bytes_msg);
  453. if (outq_item->msg == NULL) {
  454. free (outq_item);
  455. qb_ipcs_disconnect(conn);
  456. return;
  457. }
  458. write_buf = outq_item->msg;
  459. for (i = 0; i < iov_len; i++) {
  460. memcpy (write_buf, iov[i].iov_base, iov[i].iov_len);
  461. write_buf += iov[i].iov_len;
  462. }
  463. outq_item->mlen = bytes_msg;
  464. qb_list_init (&outq_item->list);
  465. qb_list_add_tail (&outq_item->list, &context->outq_head);
  466. context->queued++;
  467. }
  /*
   * Send (or queue) a single-buffer event to a client.
   * Always returns 0; delivery problems are handled inside
   * msg_send_or_queue().
   */
  int cs_ipcs_dispatch_send(void *conn, const void *msg, size_t mlen)
  {
      struct iovec one = {
          .iov_base = (void *)msg,
          .iov_len = mlen,
      };

      msg_send_or_queue (conn, &one, 1);
      return 0;
  }
  /*
   * Send (or queue) a scatter/gather event to a client.
   * Always returns 0; delivery problems are handled inside
   * msg_send_or_queue().
   */
  int cs_ipcs_dispatch_iov_send (void *conn,
      const struct iovec *iov,
      unsigned int iov_len)
  {
      msg_send_or_queue(conn, iov, iov_len);

      return 0;
  }
  483. static int32_t cs_ipcs_msg_process(qb_ipcs_connection_t *c,
  484. void *data, size_t size)
  485. {
  486. struct qb_ipc_response_header response;
  487. struct qb_ipc_request_header *request_pt = (struct qb_ipc_request_header *)data;
  488. int32_t service = qb_ipcs_service_id_get(c);
  489. int32_t send_ok = 0;
  490. int32_t is_async_call = QB_FALSE;
  491. ssize_t res = -1;
  492. int sending_allowed_private_data;
  493. struct cs_ipcs_conn_context *cnx;
  494. send_ok = corosync_sending_allowed (service,
  495. request_pt->id,
  496. request_pt,
  497. &sending_allowed_private_data);
  498. is_async_call = (service == CPG_SERVICE && request_pt->id == 2);
  499. /*
  500. * This happens when the message contains some kind of invalid
  501. * parameter, such as an invalid size
  502. */
  503. if (send_ok == -EINVAL) {
  504. response.size = sizeof (response);
  505. response.id = 0;
  506. response.error = CS_ERR_INVALID_PARAM;
  507. cnx = qb_ipcs_context_get(c);
  508. if (cnx) {
  509. cnx->invalid_request++;
  510. }
  511. if (is_async_call) {
  512. log_printf(LOGSYS_LEVEL_INFO, "*** %s() invalid message! size:%d error:%d",
  513. __func__, response.size, response.error);
  514. } else {
  515. qb_ipcs_response_send (c,
  516. &response,
  517. sizeof (response));
  518. }
  519. res = -EINVAL;
  520. } else if (send_ok < 0) {
  521. cnx = qb_ipcs_context_get(c);
  522. if (cnx) {
  523. cnx->overload++;
  524. }
  525. if (!is_async_call) {
  526. /*
  527. * Overload, tell library to retry
  528. */
  529. response.size = sizeof (response);
  530. response.id = 0;
  531. response.error = CS_ERR_TRY_AGAIN;
  532. qb_ipcs_response_send (c,
  533. &response,
  534. sizeof (response));
  535. } else {
  536. log_printf(LOGSYS_LEVEL_WARNING,
  537. "*** %s() (%d:%d - %d) %s!",
  538. __func__, service, request_pt->id,
  539. is_async_call, strerror(-send_ok));
  540. }
  541. res = -ENOBUFS;
  542. }
  543. if (send_ok >= 0) {
  544. corosync_service[service]->lib_engine[request_pt->id].lib_handler_fn(c, request_pt);
  545. res = 0;
  546. }
  547. corosync_sending_allowed_release (&sending_allowed_private_data);
  548. return res;
  549. }
  550. static int32_t cs_ipcs_job_add(enum qb_loop_priority p, void *data, qb_loop_job_dispatch_fn fn)
  551. {
  552. return qb_loop_job_add(cs_poll_handle_get(), p, data, fn);
  553. }
  554. static int32_t cs_ipcs_dispatch_add(enum qb_loop_priority p, int32_t fd, int32_t events,
  555. void *data, qb_ipcs_dispatch_fn_t fn)
  556. {
  557. return qb_loop_poll_add(cs_poll_handle_get(), p, fd, events, data, fn);
  558. }
  559. static int32_t cs_ipcs_dispatch_mod(enum qb_loop_priority p, int32_t fd, int32_t events,
  560. void *data, qb_ipcs_dispatch_fn_t fn)
  561. {
  562. return qb_loop_poll_mod(cs_poll_handle_get(), p, fd, events, data, fn);
  563. }
  /* dispatch_del hook: stop polling fd on the corosync main loop. */
  static int32_t cs_ipcs_dispatch_del(int32_t fd)
  {
      int32_t rc = qb_loop_poll_del(cs_poll_handle_get(), fd);

      return rc;
  }
  568. static void cs_ipcs_low_fds_event(int32_t not_enough, int32_t fds_available)
  569. {
  570. ipc_not_enough_fds_left = not_enough;
  571. if (not_enough) {
  572. log_printf(LOGSYS_LEVEL_WARNING, "refusing new connections (fds_available:%d)",
  573. fds_available);
  574. } else {
  575. log_printf(LOGSYS_LEVEL_NOTICE, "allowing new connections (fds_available:%d)",
  576. fds_available);
  577. }
  578. }
  579. int32_t cs_ipcs_q_level_get(void)
  580. {
  581. return ipc_fc_totem_queue_level;
  582. }
  583. static qb_loop_timer_handle ipcs_check_for_flow_control_timer;
  584. static void cs_ipcs_check_for_flow_control(void)
  585. {
  586. int32_t i;
  587. int32_t fc_enabled;
  588. for (i = 0; i < SERVICES_COUNT_MAX; i++) {
  589. if (corosync_service[i] == NULL || ipcs_mapper[i].inst == NULL) {
  590. continue;
  591. }
  592. fc_enabled = QB_IPCS_RATE_OFF;
  593. if (ipc_fc_is_quorate == 1 ||
  594. corosync_service[i]->allow_inquorate == CS_LIB_ALLOW_INQUORATE) {
  595. /*
  596. * we are quorate
  597. * now check flow control
  598. */
  599. if (ipc_fc_totem_queue_level != TOTEM_Q_LEVEL_CRITICAL &&
  600. ipc_fc_sync_in_process == 0) {
  601. fc_enabled = QB_FALSE;
  602. } else if (ipc_fc_totem_queue_level != TOTEM_Q_LEVEL_CRITICAL &&
  603. i == VOTEQUORUM_SERVICE) {
  604. /*
  605. * Allow message processing for votequorum service even
  606. * in sync phase
  607. */
  608. fc_enabled = QB_FALSE;
  609. } else {
  610. fc_enabled = QB_IPCS_RATE_OFF_2;
  611. }
  612. }
  613. if (fc_enabled) {
  614. qb_ipcs_request_rate_limit(ipcs_mapper[i].inst, fc_enabled);
  615. qb_loop_timer_add(cs_poll_handle_get(), QB_LOOP_MED, 1*QB_TIME_NS_IN_MSEC,
  616. NULL, corosync_recheck_the_q_level, &ipcs_check_for_flow_control_timer);
  617. } else if (ipc_fc_totem_queue_level == TOTEM_Q_LEVEL_LOW) {
  618. qb_ipcs_request_rate_limit(ipcs_mapper[i].inst, QB_IPCS_RATE_FAST);
  619. } else if (ipc_fc_totem_queue_level == TOTEM_Q_LEVEL_GOOD) {
  620. qb_ipcs_request_rate_limit(ipcs_mapper[i].inst, QB_IPCS_RATE_NORMAL);
  621. } else if (ipc_fc_totem_queue_level == TOTEM_Q_LEVEL_HIGH) {
  622. qb_ipcs_request_rate_limit(ipcs_mapper[i].inst, QB_IPCS_RATE_SLOW);
  623. }
  624. }
  625. }
  626. static void cs_ipcs_fc_quorum_changed(int quorate, void *context)
  627. {
  628. ipc_fc_is_quorate = quorate;
  629. cs_ipcs_check_for_flow_control();
  630. }
  631. static void cs_ipcs_totem_queue_level_changed(enum totem_q_level level)
  632. {
  633. ipc_fc_totem_queue_level = level;
  634. cs_ipcs_check_for_flow_control();
  635. }
  636. void cs_ipcs_sync_state_changed(int32_t sync_in_process)
  637. {
  638. ipc_fc_sync_in_process = sync_in_process;
  639. cs_ipcs_check_for_flow_control();
  640. }
  641. void cs_ipcs_stats_update(void)
  642. {
  643. int32_t i;
  644. struct qb_ipcs_stats srv_stats;
  645. struct qb_ipcs_connection_stats stats;
  646. qb_ipcs_connection_t *c, *prev;
  647. struct cs_ipcs_conn_context *cnx;
  648. char key_name[ICMAP_KEYNAME_MAXLEN];
  649. for (i = 0; i < SERVICES_COUNT_MAX; i++) {
  650. if (corosync_service[i] == NULL || ipcs_mapper[i].inst == NULL) {
  651. continue;
  652. }
  653. qb_ipcs_stats_get(ipcs_mapper[i].inst, &srv_stats, QB_FALSE);
  654. for (c = qb_ipcs_connection_first_get(ipcs_mapper[i].inst);
  655. c;
  656. prev = c, c = qb_ipcs_connection_next_get(ipcs_mapper[i].inst, prev), qb_ipcs_connection_unref(prev)) {
  657. cnx = qb_ipcs_context_get(c);
  658. if (cnx == NULL) continue;
  659. qb_ipcs_connection_stats_get(c, &stats, QB_FALSE);
  660. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.client_pid", cnx->icmap_path);
  661. icmap_set_uint32(key_name, stats.client_pid);
  662. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.requests", cnx->icmap_path);
  663. icmap_set_uint64(key_name, stats.requests);
  664. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.responses", cnx->icmap_path);
  665. icmap_set_uint64(key_name, stats.responses);
  666. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.dispatched", cnx->icmap_path);
  667. icmap_set_uint64(key_name, stats.events);
  668. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.send_retries", cnx->icmap_path);
  669. icmap_set_uint64(key_name, stats.send_retries);
  670. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.recv_retries", cnx->icmap_path);
  671. icmap_set_uint64(key_name, stats.recv_retries);
  672. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.flow_control", cnx->icmap_path);
  673. icmap_set_uint32(key_name, stats.flow_control_state);
  674. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.flow_control_count", cnx->icmap_path);
  675. icmap_set_uint64(key_name, stats.flow_control_count);
  676. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.queue_size", cnx->icmap_path);
  677. icmap_set_uint32(key_name, cnx->queued);
  678. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.invalid_request", cnx->icmap_path);
  679. icmap_set_uint64(key_name, cnx->invalid_request);
  680. snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "%s.overload", cnx->icmap_path);
  681. icmap_set_uint64(key_name, cnx->overload);
  682. }
  683. }
  684. }
  685. static enum qb_ipc_type cs_get_ipc_type (void)
  686. {
  687. char *str;
  688. int found = 0;
  689. enum qb_ipc_type ret = QB_IPC_NATIVE;
  690. if (icmap_get_string("qb.ipc_type", &str) != CS_OK) {
  691. log_printf(LOGSYS_LEVEL_DEBUG, "No configured qb.ipc_type. Using native ipc");
  692. return QB_IPC_NATIVE;
  693. }
  694. if (strcmp(str, "native") == 0) {
  695. ret = QB_IPC_NATIVE;
  696. found = 1;
  697. }
  698. if (strcmp(str, "shm") == 0) {
  699. ret = QB_IPC_SHM;
  700. found = 1;
  701. }
  702. if (strcmp(str, "socket") == 0) {
  703. ret = QB_IPC_SOCKET;
  704. found = 1;
  705. }
  706. if (found) {
  707. log_printf(LOGSYS_LEVEL_DEBUG, "Using %s ipc", str);
  708. } else {
  709. log_printf(LOGSYS_LEVEL_DEBUG, "Unknown ipc type %s", str);
  710. }
  711. free(str);
  712. return ret;
  713. }
  714. const char *cs_ipcs_service_init(struct corosync_service_engine *service)
  715. {
  716. const char *serv_short_name;
  717. serv_short_name = cs_ipcs_serv_short_name(service->id);
  718. if (service->lib_engine_count == 0) {
  719. log_printf (LOGSYS_LEVEL_DEBUG,
  720. "NOT Initializing IPC on %s [%d]",
  721. serv_short_name,
  722. service->id);
  723. return NULL;
  724. }
  725. if (strlen(serv_short_name) >= CS_IPCS_MAPPER_SERV_NAME) {
  726. log_printf (LOGSYS_LEVEL_ERROR, "service name %s is too long", serv_short_name);
  727. return "qb_ipcs_run error";
  728. }
  729. ipcs_mapper[service->id].id = service->id;
  730. strcpy(ipcs_mapper[service->id].name, serv_short_name);
  731. log_printf (LOGSYS_LEVEL_DEBUG,
  732. "Initializing IPC on %s [%d]",
  733. ipcs_mapper[service->id].name,
  734. ipcs_mapper[service->id].id);
  735. ipcs_mapper[service->id].inst = qb_ipcs_create(ipcs_mapper[service->id].name,
  736. ipcs_mapper[service->id].id,
  737. cs_get_ipc_type(),
  738. &corosync_service_funcs);
  739. assert(ipcs_mapper[service->id].inst);
  740. qb_ipcs_poll_handlers_set(ipcs_mapper[service->id].inst,
  741. &corosync_poll_funcs);
  742. if (qb_ipcs_run(ipcs_mapper[service->id].inst) != 0) {
  743. log_printf (LOGSYS_LEVEL_ERROR, "Can't initialize IPC");
  744. return "qb_ipcs_run error";
  745. }
  746. return NULL;
  747. }
  748. void cs_ipcs_init(void)
  749. {
  750. api = apidef_get ();
  751. qb_loop_poll_low_fds_event_set(cs_poll_handle_get(), cs_ipcs_low_fds_event);
  752. api->quorum_register_callback (cs_ipcs_fc_quorum_changed, NULL);
  753. totempg_queue_level_register_callback (cs_ipcs_totem_queue_level_changed);
  754. icmap_set_uint64("runtime.connections.active", 0);
  755. icmap_set_uint64("runtime.connections.closed", 0);
  756. }