main.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623
  1. /*
  2. * Copyright (c) 2002-2006 MontaVista Software, Inc.
  3. * Copyright (c) 2006 Red Hat, Inc.
  4. * Copyright (c) 2006 Sun Microsystems, Inc.
  5. *
  6. * All rights reserved.
  7. *
  8. * Author: Steven Dake (sdake@mvista.com)
  9. *
  10. * This software licensed under BSD license, the text of which follows:
  11. *
  12. * Redistribution and use in source and binary forms, with or without
  13. * modification, are permitted provided that the following conditions are met:
  14. *
  15. * - Redistributions of source code must retain the above copyright notice,
  16. * this list of conditions and the following disclaimer.
  17. * - Redistributions in binary form must reproduce the above copyright notice,
  18. * this list of conditions and the following disclaimer in the documentation
  19. * and/or other materials provided with the distribution.
  20. * - Neither the name of the MontaVista Software, Inc. nor the names of its
  21. * contributors may be used to endorse or promote products derived from this
  22. * software without specific prior written permission.
  23. *
  24. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  25. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  26. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  27. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  28. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  29. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  30. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  31. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  32. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  33. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  34. * THE POSSIBILITY OF SUCH DAMAGE.
  35. */
  36. #include <pthread.h>
  37. #include <assert.h>
  38. #include <pwd.h>
  39. #include <grp.h>
  40. #include <sys/types.h>
  41. #include <sys/poll.h>
  42. #include <sys/uio.h>
  43. #include <sys/mman.h>
  44. #include <sys/socket.h>
  45. #include <sys/un.h>
  46. #include <sys/time.h>
  47. #include <sys/resource.h>
  48. #include <netinet/in.h>
  49. #include <arpa/inet.h>
  50. #include <unistd.h>
  51. #include <fcntl.h>
  52. #include <stdlib.h>
  53. #include <stdio.h>
  54. #include <errno.h>
  55. #include <signal.h>
  56. #include <sched.h>
  57. #include <time.h>
  58. #include "swab.h"
  59. #include "../include/saAis.h"
  60. #include "../include/list.h"
  61. #include "../include/queue.h"
  62. #include "../lcr/lcr_ifact.h"
  63. #include "poll.h"
  64. #include "totempg.h"
  65. #include "totemsrp.h"
  66. #include "mempool.h"
  67. #include "mainconfig.h"
  68. #include "totemconfig.h"
  69. #include "main.h"
  70. #include "service.h"
  71. #include "sync.h"
  72. #include "swab.h"
  73. #include "objdb.h"
  74. #include "config.h"
  75. #include "ipc.h"
  76. #include "timer.h"
  77. #include "logsys.h"
  78. #include "util.h"
  79. #include "flow.h"
  80. #include "version.h"
  81. LOGSYS_DECLARE_SYSTEM ("openais",
  82. LOG_MODE_OUTPUT_STDERR | LOG_MODE_OUTPUT_SYSLOG_THREADED | LOG_MODE_DISPLAY_DEBUG | LOG_MODE_BUFFER_BEFORE_CONFIG,
  83. NULL,
  84. LOG_DAEMON);
  85. LOGSYS_DECLARE_SUBSYS ("MAIN", LOG_INFO);
  86. #define SERVER_BACKLOG 5
  87. static int ais_uid = 0;
  88. static int gid_valid = 0;
  89. static unsigned int service_count = 32;
  90. static pthread_mutex_t serialize_mutex = PTHREAD_MUTEX_INITIALIZER;
  91. static struct totem_logging_configuration totem_logging_configuration;
  92. static char delivery_data[MESSAGE_SIZE_MAX];
  93. SaClmClusterNodeT *(*main_clm_get_by_nodeid) (unsigned int node_id);
  94. static void sigusr2_handler (int num)
  95. {
  96. int i;
  97. for (i = 0; ais_service[i]; i++) {
  98. if (ais_service[i]->exec_dump_fn) {
  99. ais_service[i]->exec_dump_fn ();
  100. }
  101. }
  102. }
  103. static void sigsegv_handler (int num)
  104. {
  105. signal (SIGSEGV, SIG_DFL);
  106. logsys_flush ();
  107. raise (SIGSEGV);
  108. }
  109. static void sigabrt_handler (int num)
  110. {
  111. signal (SIGABRT, SIG_DFL);
  112. logsys_flush ();
  113. raise (SIGABRT);
  114. }
  115. #define LOCALHOST_IP inet_addr("127.0.0.1")
  116. totempg_groups_handle openais_group_handle;
  117. struct totempg_group openais_group = {
  118. .group = "a",
  119. .group_len = 1
  120. };
  121. void sigintr_handler (int signum)
  122. {
  123. #ifdef DEBUG_MEMPOOL
  124. int stats_inuse[MEMPOOL_GROUP_SIZE];
  125. int stats_avail[MEMPOOL_GROUP_SIZE];
  126. int stats_memoryused[MEMPOOL_GROUP_SIZE];
  127. int i;
  128. mempool_getstats (stats_inuse, stats_avail, stats_memoryused);
  129. log_printf (LOG_LEVEL_DEBUG, "Memory pools:\n");
  130. for (i = 0; i < MEMPOOL_GROUP_SIZE; i++) {
  131. log_printf (LOG_LEVEL_DEBUG, "order %d size %d inuse %d avail %d memory used %d\n",
  132. i, 1<<i, stats_inuse[i], stats_avail[i], stats_memoryused[i]);
  133. }
  134. #endif
  135. totempg_finalize ();
  136. openais_exit_error (AIS_DONE_EXIT);
  137. }
  138. static int pool_sizes[] = { 0, 0, 0, 0, 0, 4096, 0, 1, 0, /* 256 */
  139. 1024, 0, 1, 4096, 0, 0, 0, 0, /* 65536 */
  140. 1, 1, 1, 1, 1, 1, 1, 1, 1 };
  141. void serialize_mutex_lock (void)
  142. {
  143. pthread_mutex_lock (&serialize_mutex);
  144. }
  145. void serialize_mutex_unlock (void)
  146. {
  147. pthread_mutex_unlock (&serialize_mutex);
  148. }
  149. static void openais_sync_completed (void)
  150. {
  151. }
  152. static int openais_sync_callbacks_retrieve (int sync_id,
  153. struct sync_callbacks *callbacks)
  154. {
  155. if (ais_service[sync_id] == NULL) {
  156. memset (callbacks, 0, sizeof (struct sync_callbacks));
  157. return (-1);
  158. }
  159. callbacks->name = ais_service[sync_id]->name;
  160. callbacks->sync_init = ais_service[sync_id]->sync_init;
  161. callbacks->sync_process = ais_service[sync_id]->sync_process;
  162. callbacks->sync_activate = ais_service[sync_id]->sync_activate;
  163. callbacks->sync_abort = ais_service[sync_id]->sync_abort;
  164. return (0);
  165. }
  166. static struct memb_ring_id aisexec_ring_id;
  167. static void confchg_fn (
  168. enum totem_configuration_type configuration_type,
  169. unsigned int *member_list, int member_list_entries,
  170. unsigned int *left_list, int left_list_entries,
  171. unsigned int *joined_list, int joined_list_entries,
  172. struct memb_ring_id *ring_id)
  173. {
  174. int i;
  175. memcpy (&aisexec_ring_id, ring_id, sizeof (struct memb_ring_id));
  176. /*
  177. * Call configuration change for all services
  178. */
  179. for (i = 0; i < service_count; i++) {
  180. if (ais_service[i] && ais_service[i]->confchg_fn) {
  181. ais_service[i]->confchg_fn (configuration_type,
  182. member_list, member_list_entries,
  183. left_list, left_list_entries,
  184. joined_list, joined_list_entries, ring_id);
  185. }
  186. }
  187. }
  188. static void aisexec_uid_determine (struct main_config *main_config)
  189. {
  190. struct passwd *passwd;
  191. passwd = getpwnam(main_config->user);
  192. if (passwd == 0) {
  193. log_printf (LOG_LEVEL_ERROR, "ERROR: The '%s' user is not found in /etc/passwd, please read the documentation.\n", main_config->user);
  194. openais_exit_error (AIS_DONE_UID_DETERMINE);
  195. }
  196. ais_uid = passwd->pw_uid;
  197. endpwent ();
  198. }
  199. static void aisexec_gid_determine (struct main_config *main_config)
  200. {
  201. struct group *group;
  202. group = getgrnam (main_config->group);
  203. if (group == 0) {
  204. log_printf (LOG_LEVEL_ERROR, "ERROR: The '%s' group is not found in /etc/group, please read the documentation.\n", group->gr_name);
  205. openais_exit_error (AIS_DONE_GID_DETERMINE);
  206. }
  207. gid_valid = group->gr_gid;
  208. endgrent ();
  209. }
  210. static void aisexec_priv_drop (void)
  211. {
  212. return;
  213. setuid (ais_uid);
  214. setegid (ais_uid);
  215. }
  216. static void aisexec_mempool_init (void)
  217. {
  218. int res;
  219. res = mempool_init (pool_sizes);
  220. if (res == ENOMEM) {
  221. log_printf (LOG_LEVEL_ERROR, "Couldn't allocate memory pools, not enough memory");
  222. openais_exit_error (AIS_DONE_MEMPOOL_INIT);
  223. }
  224. }
  225. static void aisexec_tty_detach (void)
  226. {
  227. /*
  228. * Disconnect from TTY if this is not a debug run
  229. */
  230. switch (fork ()) {
  231. case -1:
  232. openais_exit_error (AIS_DONE_FORK);
  233. break;
  234. case 0:
  235. /*
  236. * child which is disconnected, run this process
  237. */
  238. break;
  239. default:
  240. exit (0);
  241. break;
  242. }
  243. }
  244. static void aisexec_setscheduler (void)
  245. {
  246. #if ! defined(TS_CLASS) && (defined(OPENAIS_BSD) || defined(OPENAIS_LINUX) || defined(OPENAIS_SOLARIS))
  247. struct sched_param sched_param;
  248. int res;
  249. res = sched_get_priority_max (SCHED_RR);
  250. if (res != -1) {
  251. sched_param.sched_priority = 1;//res;
  252. res = sched_setscheduler (0, SCHED_RR, &sched_param);
  253. if (res == -1) {
  254. log_printf (LOG_LEVEL_WARNING, "Could not set SCHED_RR at priority %d: %s\n",
  255. sched_param.sched_priority, strerror (errno));
  256. }
  257. } else
  258. log_printf (LOG_LEVEL_WARNING, "Could not get maximum scheduler priority: %s\n", strerror (errno));
  259. #else
  260. log_printf(LOG_LEVEL_WARNING, "Scheduler priority left to default value (no OS support)\n");
  261. #endif
  262. }
  263. static void aisexec_mlockall (void)
  264. {
  265. #if !defined(OPENAIS_BSD)
  266. int res;
  267. #endif
  268. struct rlimit rlimit;
  269. rlimit.rlim_cur = RLIM_INFINITY;
  270. rlimit.rlim_max = RLIM_INFINITY;
  271. #ifndef OPENAIS_SOLARIS
  272. setrlimit (RLIMIT_MEMLOCK, &rlimit);
  273. #else
  274. setrlimit (RLIMIT_VMEM, &rlimit);
  275. #endif
  276. #if defined(OPENAIS_BSD)
  277. /* under FreeBSD a process with locked page cannot call dlopen
  278. * code disabled until FreeBSD bug i386/93396 was solved
  279. */
  280. log_printf (LOG_LEVEL_WARNING, "Could not lock memory of service to avoid page faults\n");
  281. #else
  282. res = mlockall (MCL_CURRENT | MCL_FUTURE);
  283. if (res == -1) {
  284. log_printf (LOG_LEVEL_WARNING, "Could not lock memory of service to avoid page faults: %s\n", strerror (errno));
  285. };
  286. #endif
  287. }
  288. static void deliver_fn (
  289. unsigned int nodeid,
  290. struct iovec *iovec,
  291. int iov_len,
  292. int endian_conversion_required)
  293. {
  294. mar_req_header_t *header;
  295. int pos = 0;
  296. int i;
  297. int service;
  298. int fn_id;
  299. /*
  300. * Build buffer without iovecs to make processing easier
  301. * This is only used for messages which are multicast with iovecs
  302. * and self-delivered. All other mechanisms avoid the copy.
  303. */
  304. if (iov_len > 1) {
  305. for (i = 0; i < iov_len; i++) {
  306. memcpy (&delivery_data[pos], iovec[i].iov_base, iovec[i].iov_len);
  307. pos += iovec[i].iov_len;
  308. assert (pos < MESSAGE_SIZE_MAX);
  309. }
  310. header = (mar_req_header_t *)delivery_data;
  311. } else {
  312. header = (mar_req_header_t *)iovec[0].iov_base;
  313. }
  314. if (endian_conversion_required) {
  315. header->id = swab32 (header->id);
  316. header->size = swab32 (header->size);
  317. }
  318. // assert(iovec->iov_len == header->size);
  319. /*
  320. * Call the proper executive handler
  321. */
  322. service = header->id >> 16;
  323. fn_id = header->id & 0xffff;
  324. if (endian_conversion_required) {
  325. assert(ais_service[service]->exec_service[fn_id].exec_endian_convert_fn != NULL);
  326. ais_service[service]->exec_service[fn_id].exec_endian_convert_fn
  327. (header);
  328. }
  329. ais_service[service]->exec_service[fn_id].exec_handler_fn
  330. (header, nodeid);
  331. }
  332. int main (int argc, char **argv)
  333. {
  334. char *error_string;
  335. struct main_config main_config;
  336. struct totem_config totem_config;
  337. unsigned int objdb_handle;
  338. unsigned int config_handle;
  339. unsigned int config_version = 0;
  340. struct objdb_iface_ver0 *objdb;
  341. void *objdb_p;
  342. struct config_iface_ver0 *config;
  343. void *config_p;
  344. char *config_iface;
  345. int res, ch;
  346. int background, setprio;
  347. int totem_log_service;
  348. /* default configuration
  349. */
  350. background = 1;
  351. setprio = 1;
  352. while ((ch = getopt (argc, argv, "fp")) != EOF) {
  353. switch (ch) {
  354. case 'f':
  355. background = 0;
  356. break;
  357. case 'p':
  358. setprio = 0;
  359. break;
  360. default:
  361. fprintf(stderr, \
  362. "usage:\n"\
  363. " -f : Start application in foreground.\n"\
  364. " -p : Do not set process priority. \n");
  365. return EXIT_FAILURE;
  366. }
  367. }
  368. if (background)
  369. aisexec_tty_detach ();
  370. log_printf (LOG_LEVEL_NOTICE, "AIS Executive Service RELEASE '%s'\n", RELEASE_VERSION);
  371. log_printf (LOG_LEVEL_NOTICE, "Copyright (C) 2002-2006 MontaVista Software, Inc and contributors.\n");
  372. log_printf (LOG_LEVEL_NOTICE, "Copyright (C) 2006-2007 Red Hat, Inc.\n");
  373. signal (SIGINT, sigintr_handler);
  374. signal (SIGUSR2, sigusr2_handler);
  375. signal (SIGSEGV, sigsegv_handler);
  376. signal (SIGABRT, sigabrt_handler);
  377. openais_timer_init (
  378. serialize_mutex_lock,
  379. serialize_mutex_unlock);
  380. log_printf (LOG_LEVEL_NOTICE, "AIS Executive Service: started and ready to provide service.\n");
  381. aisexec_poll_handle = poll_create (
  382. serialize_mutex_lock,
  383. serialize_mutex_unlock);
  384. /*
  385. * Load the object database interface
  386. */
  387. res = lcr_ifact_reference (
  388. &objdb_handle,
  389. "objdb",
  390. 0,
  391. &objdb_p,
  392. 0);
  393. if (res == -1) {
  394. log_printf (LOG_LEVEL_ERROR, "AIS Executive couldn't open configuration object database component.\n");
  395. openais_exit_error (AIS_DONE_OBJDB);
  396. }
  397. objdb = (struct objdb_iface_ver0 *)objdb_p;
  398. objdb->objdb_init ();
  399. /* User's bootstrap config service */
  400. config_iface = getenv("OPENAIS_DEFAULT_CONFIG_IFACE");
  401. if (!config_iface) {
  402. config_iface = "aisparser";
  403. }
  404. res = lcr_ifact_reference (
  405. &config_handle,
  406. config_iface,
  407. config_version,
  408. &config_p,
  409. 0);
  410. config = (struct config_iface_ver0 *)config_p;
  411. if (res == -1) {
  412. log_printf (LOG_LEVEL_ERROR, "AIS Executive couldn't open configuration component.\n");
  413. openais_exit_error (AIS_DONE_MAINCONFIGREAD);
  414. }
  415. res = config->config_readconfig(objdb, &error_string);
  416. if (res == -1) {
  417. log_printf (LOG_LEVEL_ERROR, error_string);
  418. openais_exit_error (AIS_DONE_MAINCONFIGREAD);
  419. }
  420. log_printf (LOG_LEVEL_NOTICE, error_string);
  421. openais_service_default_objdb_set (objdb);
  422. res = openais_service_link_all (objdb);
  423. if (res == -1) {
  424. log_printf (LOG_LEVEL_ERROR, "Could not load services\n");
  425. openais_exit_error (AIS_DONE_DYNAMICLOAD);
  426. }
  427. res = openais_main_config_read (objdb, &error_string, &main_config);
  428. if (res == -1) {
  429. log_printf (LOG_LEVEL_ERROR, error_string);
  430. openais_exit_error (AIS_DONE_MAINCONFIGREAD);
  431. }
  432. res = totem_config_read (objdb, &totem_config, &error_string);
  433. if (res == -1) {
  434. log_printf (LOG_LEVEL_ERROR, error_string);
  435. openais_exit_error (AIS_DONE_MAINCONFIGREAD);
  436. }
  437. res = totem_config_keyread (objdb, &totem_config, &error_string);
  438. if (res == -1) {
  439. log_printf (LOG_LEVEL_ERROR, error_string);
  440. openais_exit_error (AIS_DONE_MAINCONFIGREAD);
  441. }
  442. res = totem_config_validate (&totem_config, &error_string);
  443. if (res == -1) {
  444. log_printf (LOG_LEVEL_ERROR, error_string);
  445. openais_exit_error (AIS_DONE_MAINCONFIGREAD);
  446. }
  447. res = logsys_config_file_set (&error_string, main_config.logfile);
  448. if (res == -1) {
  449. log_printf (LOG_LEVEL_ERROR, error_string);
  450. openais_exit_error (AIS_DONE_LOGSETUP);
  451. }
  452. logsys_config_facility_set ("openais", main_config.syslog_facility);
  453. logsys_config_mode_set (main_config.logmode);
  454. aisexec_uid_determine (&main_config);
  455. aisexec_gid_determine (&main_config);
  456. /*
  457. * Set round robin realtime scheduling with priority 99
  458. * Lock all memory to avoid page faults which may interrupt
  459. * application healthchecking
  460. */
  461. if (setprio)
  462. aisexec_setscheduler ();
  463. aisexec_mlockall ();
  464. totem_config.totem_logging_configuration = totem_logging_configuration;
  465. totem_log_service = _logsys_subsys_create ("TOTEM", LOG_INFO);
  466. totem_config.totem_logging_configuration.log_level_security = logsys_mkpri (LOG_LEVEL_SECURITY, totem_log_service);
  467. totem_config.totem_logging_configuration.log_level_error = logsys_mkpri (LOG_LEVEL_ERROR, totem_log_service);
  468. totem_config.totem_logging_configuration.log_level_warning = logsys_mkpri (LOG_LEVEL_WARNING, totem_log_service);
  469. totem_config.totem_logging_configuration.log_level_notice = logsys_mkpri (LOG_LEVEL_NOTICE, totem_log_service);
  470. totem_config.totem_logging_configuration.log_level_debug = logsys_mkpri (LOG_LEVEL_DEBUG, totem_log_service);
  471. totem_config.totem_logging_configuration.log_printf = logsys_log_printf;
  472. /*
  473. * Sleep for a while to let other nodes in the cluster
  474. * understand that this node has been away (if it was
  475. * an aisexec restart).
  476. */
  477. // TODO what is this hack for? usleep(totem_config.token_timeout * 2000);
  478. /*
  479. * if totempg_initialize doesn't have root priveleges, it cannot
  480. * bind to a specific interface. This only matters if
  481. * there is more then one interface in a system, so
  482. * in this case, only a warning is printed
  483. */
  484. /*
  485. * Join multicast group and setup delivery
  486. * and configuration change functions
  487. */
  488. totempg_initialize (
  489. aisexec_poll_handle,
  490. &totem_config);
  491. totempg_groups_initialize (
  492. &openais_group_handle,
  493. deliver_fn,
  494. confchg_fn);
  495. totempg_groups_join (
  496. openais_group_handle,
  497. &openais_group,
  498. 1);
  499. /*
  500. * This must occur after totempg is initialized because "this_ip" must be set
  501. */
  502. res = openais_service_init_all (service_count, objdb);
  503. if (res == -1) {
  504. log_printf (LOG_LEVEL_ERROR, "Could not init services\n");
  505. openais_exit_error (AIS_DONE_INIT_SERVICES);
  506. }
  507. sync_register (openais_sync_callbacks_retrieve, openais_sync_completed,
  508. totem_config.vsf_type);
  509. res = openais_flow_control_initialize ();
  510. /*
  511. * Drop root privleges to user 'ais'
  512. * TODO: Don't really need full root capabilities;
  513. * needed capabilities are:
  514. * CAP_NET_RAW (bindtodevice)
  515. * CAP_SYS_NICE (setscheduler)
  516. * CAP_IPC_LOCK (mlockall)
  517. */
  518. aisexec_priv_drop ();
  519. aisexec_mempool_init ();
  520. openais_ipc_init (
  521. serialize_mutex_lock,
  522. serialize_mutex_unlock,
  523. gid_valid);
  524. /*
  525. * Start main processing loop
  526. */
  527. poll_run (aisexec_poll_handle);
  528. return EXIT_SUCCESS;
  529. }