| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
2771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380 |
- /*
- * Copyright (c) 2005 MontaVista Software, Inc.
- * Copyright (c) 2006-2018 Red Hat, Inc.
- *
- * All rights reserved.
- *
- * Author: Steven Dake (sdake@redhat.com)
- * This software licensed under BSD license, the text of which follows:
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- *
- * - Redistributions of source code must retain the above copyright notice,
- * this list of conditions and the following disclaimer.
- * - Redistributions in binary form must reproduce the above copyright notice,
- * this list of conditions and the following disclaimer in the documentation
- * and/or other materials provided with the distribution.
- * - Neither the name of the MontaVista Software, Inc. nor the names of its
- * contributors may be used to endorse or promote products derived from this
- * software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
- * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
- * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
- * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
- * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
- * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
- * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
- * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
- * THE POSSIBILITY OF SUCH DAMAGE.
- */
- #include <config.h>
- #include <assert.h>
- #include <sys/mman.h>
- #include <sys/types.h>
- #include <sys/stat.h>
- #include <sys/socket.h>
- #include <netdb.h>
- #include <sys/un.h>
- #include <sys/ioctl.h>
- #include <sys/param.h>
- #include <netinet/in.h>
- #include <arpa/inet.h>
- #include <unistd.h>
- #include <fcntl.h>
- #include <stdlib.h>
- #include <stdio.h>
- #include <errno.h>
- #include <sched.h>
- #include <time.h>
- #include <sys/time.h>
- #include <sys/poll.h>
- #include <sys/uio.h>
- #include <limits.h>
- #include <qb/qblist.h>
- #include <qb/qbdefs.h>
- #include <qb/qbloop.h>
- #include <corosync/sq.h>
- #include <corosync/swab.h>
- #define LOGSYS_UTILS_ONLY 1
- #include <corosync/logsys.h>
- #include "totemudpu.h"
- #include "util.h"
/*
 * Headers that do not provide MSG_NOSIGNAL get a zero flag so the name can
 * be passed to sendmsg()/recvmsg() unconditionally.
 */
#ifndef MSG_NOSIGNAL
#define MSG_NOSIGNAL 0
#endif

/*
 * Buffer size requested via SO_RCVBUF / SO_SNDBUF for the sockets
 * created in this file.
 */
#define MCAST_SOCKET_BUFFER_SIZE (TRANSMITS_ALLOWED * UDP_RECEIVE_FRAME_SIZE_MAX)

/*
 * Bit flags stored in totemudpu_instance.netif_state_report
 */
#define NETIF_STATE_REPORT_UP 1
#define NETIF_STATE_REPORT_DOWN 2

/*
 * Values stored in totemudpu_instance.netif_bind_state
 */
#define BIND_STATE_UNBOUND 0
#define BIND_STATE_REGULAR 1
#define BIND_STATE_LOOPBACK 2
- struct totemudpu_member {
- struct qb_list_head list;
- struct totem_ip_address member;
- int fd;
- int active;
- };
- struct totemudpu_instance {
- qb_loop_t *totemudpu_poll_handle;
- struct totem_interface *totem_interface;
- int netif_state_report;
- int netif_bind_state;
- void *context;
- int (*totemudpu_deliver_fn) (
- void *context,
- const void *msg,
- unsigned int msg_len,
- const struct sockaddr_storage *system_from);
- int (*totemudpu_iface_change_fn) (
- void *context,
- const struct totem_ip_address *iface_address,
- unsigned int ring_no);
- void (*totemudpu_target_set_completed) (void *context);
- /*
- * Function and data used to log messages
- */
- int totemudpu_log_level_security;
- int totemudpu_log_level_error;
- int totemudpu_log_level_warning;
- int totemudpu_log_level_notice;
- int totemudpu_log_level_debug;
- int totemudpu_subsys_id;
- void (*totemudpu_log_printf) (
- int level,
- int subsys,
- const char *function,
- const char *file,
- int line,
- const char *format,
- ...)__attribute__((format(printf, 6, 7)));
- void *udpu_context;
- char iov_buffer[UDP_RECEIVE_FRAME_SIZE_MAX + 1];
- struct iovec totemudpu_iov_recv;
- struct qb_list_head member_list;
- int stats_sent;
- int stats_recv;
- int stats_delv;
- int stats_remcasts;
- int stats_orf_token;
- struct timeval stats_tv_start;
- struct totem_ip_address my_id;
- int firstrun;
- qb_loop_timer_handle timer_netif_check_timeout;
- unsigned int my_memb_entries;
- struct totem_config *totem_config;
- totemsrp_stats_t *stats;
- struct totem_ip_address token_target;
- int token_socket;
- int local_loop_sock[2];
- qb_loop_timer_handle timer_merge_detect_timeout;
- int send_merge_detect_message;
- unsigned int merge_detect_messages_sent_before_timeout;
- };
/*
 * A message (pointer plus length) together with the instance it belongs to.
 */
struct work_item {
	const void *msg;			/* message payload */
	unsigned int msg_len;			/* payload length */
	struct totemudpu_instance *instance;	/* owning instance */
};
/*
 * Prototypes of functions that are used before their definition
 */
static int totemudpu_build_sockets (struct totemudpu_instance *instance,
	struct totem_ip_address *bindnet_address,
	struct totem_ip_address *bound_to);

static int totemudpu_create_sending_socket(void *udpu_context,
	const struct totem_ip_address *member);

int totemudpu_member_list_rebind_ip (void *udpu_context);

static void totemudpu_start_merge_detect_timeout(void *udpu_context);

static void totemudpu_stop_merge_detect_timeout(void *udpu_context);
- static void totemudpu_instance_initialize (struct totemudpu_instance *instance)
- {
- memset (instance, 0, sizeof (struct totemudpu_instance));
- instance->netif_state_report = NETIF_STATE_REPORT_UP | NETIF_STATE_REPORT_DOWN;
- instance->totemudpu_iov_recv.iov_base = instance->iov_buffer;
- instance->totemudpu_iov_recv.iov_len = UDP_RECEIVE_FRAME_SIZE_MAX + 1; //sizeof (instance->iov_buffer) + 1;
- /*
- * There is always atleast 1 processor
- */
- instance->my_memb_entries = 1;
- qb_list_init (&instance->member_list);
- }
/*
 * Log a formatted message through the logging callback of the instance.
 *
 * A variable named "instance" that provides totemudpu_log_printf and
 * totemudpu_subsys_id must be in scope at the call site.
 *
 * The expansion is a single statement WITHOUT a trailing semicolon (the
 * caller supplies it), so the macro is safe as the body of an unbraced
 * if/else.
 */
#define log_printf(level, format, args...)				\
do {									\
	instance->totemudpu_log_printf (				\
		level, instance->totemudpu_subsys_id,			\
		__FUNCTION__, __FILE__, __LINE__,			\
		(const char *)format, ##args);				\
} while (0)
/*
 * Log "fmt" followed by ": <error text> (<err_num>)" through the logging
 * callback of the instance. The error text comes from qb_strerror_r().
 *
 * A variable named "instance" must be in scope at the call site and "fmt"
 * has to be a string literal because it is concatenated with the suffix.
 */
#define LOGSYS_PERROR(err_num, level, fmt, args...)				\
do {										\
	char _perror_buf[LOGSYS_MAX_PERROR_MSG_LEN];				\
	const char *_perror_txt =						\
		qb_strerror_r(err_num, _perror_buf, sizeof(_perror_buf));	\
	instance->totemudpu_log_printf (					\
		level, instance->totemudpu_subsys_id,				\
		__FUNCTION__, __FILE__, __LINE__,				\
		fmt ": %s (%d)", ##args, _perror_txt, err_num);			\
} while(0)
/*
 * Crypto configuration hook. This transport ignores both type names
 * and always reports success.
 *
 * Returns 0.
 */
int totemudpu_crypto_set (
	void *udpu_context,
	const char *cipher_type,
	const char *hash_type)
{
	(void)udpu_context;
	(void)cipher_type;
	(void)hash_type;

	return 0;
}
- static inline void ucast_sendmsg (
- struct totemudpu_instance *instance,
- struct totem_ip_address *system_to,
- const void *msg,
- unsigned int msg_len)
- {
- struct msghdr msg_ucast;
- int res = 0;
- struct sockaddr_storage sockaddr;
- struct iovec iovec;
- int addrlen;
- int send_sock;
- iovec.iov_base = (void *)msg;
- iovec.iov_len = msg_len;
- /*
- * Build unicast message
- */
- totemip_totemip_to_sockaddr_convert(system_to,
- instance->totem_interface->ip_port, &sockaddr, &addrlen);
- memset(&msg_ucast, 0, sizeof(msg_ucast));
- msg_ucast.msg_name = &sockaddr;
- msg_ucast.msg_namelen = addrlen;
- msg_ucast.msg_iov = (void *)&iovec;
- msg_ucast.msg_iovlen = 1;
- if (instance->netif_bind_state == BIND_STATE_REGULAR) {
- send_sock = instance->token_socket;
- } else {
- send_sock = instance->local_loop_sock[1];
- msg_ucast.msg_name = NULL;
- msg_ucast.msg_namelen = 0;
- }
- /*
- * Transmit unicast message
- * An error here is recovered by totemsrp
- */
- res = sendmsg (send_sock, &msg_ucast, MSG_NOSIGNAL);
- if (res < 0) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_debug,
- "sendmsg(ucast) failed (non-critical)");
- }
- }
- static inline void mcast_sendmsg (
- struct totemudpu_instance *instance,
- const void *msg,
- unsigned int msg_len,
- int only_active)
- {
- struct msghdr msg_mcast;
- int res = 0;
- struct iovec iovec;
- struct sockaddr_storage sockaddr;
- int addrlen;
- struct qb_list_head *list;
- struct totemudpu_member *member;
- iovec.iov_base = (void *)msg;
- iovec.iov_len = msg_len;
- memset(&msg_mcast, 0, sizeof(msg_mcast));
- /*
- * Build multicast message
- */
- if (instance->netif_bind_state == BIND_STATE_REGULAR) {
- qb_list_for_each(list, &(instance->member_list)) {
- member = qb_list_entry (list, struct totemudpu_member, list);
- /*
- * Do not send multicast message if message is not "flush", member
- * is inactive and timeout for sending merge message didn't expired.
- */
- if (only_active && !member->active && !instance->send_merge_detect_message)
- continue ;
- totemip_totemip_to_sockaddr_convert(&member->member,
- instance->totem_interface->ip_port, &sockaddr, &addrlen);
- memset(&msg_mcast, 0, sizeof(msg_mcast));
- msg_mcast.msg_name = &sockaddr;
- msg_mcast.msg_namelen = addrlen;
- msg_mcast.msg_iov = (void *)&iovec;
- msg_mcast.msg_iovlen = 1;
- /*
- * Transmit multicast message
- * An error here is recovered by totemsrp
- */
- res = sendmsg (member->fd, &msg_mcast, MSG_NOSIGNAL);
- if (res < 0) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_debug,
- "sendmsg(mcast) failed (non-critical)");
- }
- }
- if (!only_active || instance->send_merge_detect_message) {
- /*
- * Current message was sent to all nodes
- */
- instance->merge_detect_messages_sent_before_timeout++;
- instance->send_merge_detect_message = 0;
- }
- } else {
- /*
- * Transmit multicast message to local unix mcast loop
- * An error here is recovered by totemsrp
- */
- msg_mcast.msg_name = NULL;
- msg_mcast.msg_namelen = 0;
- msg_mcast.msg_iov = (void *)&iovec;
- msg_mcast.msg_iovlen = 1;
- res = sendmsg (instance->local_loop_sock[1], &msg_mcast,
- MSG_NOSIGNAL);
- if (res < 0) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_debug,
- "sendmsg(local mcast loop) failed (non-critical)");
- }
- }
- }
- int totemudpu_finalize (
- void *udpu_context)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- int res = 0;
- if (instance->token_socket > 0) {
- qb_loop_poll_del (instance->totemudpu_poll_handle,
- instance->token_socket);
- close (instance->token_socket);
- }
- if (instance->local_loop_sock[0] > 0) {
- qb_loop_poll_del (instance->totemudpu_poll_handle,
- instance->local_loop_sock[0]);
- close (instance->local_loop_sock[0]);
- close (instance->local_loop_sock[1]);
- }
- totemudpu_stop_merge_detect_timeout(instance);
- return (res);
- }
- static struct totemudpu_member *find_member_by_sockaddr(
- const void *udpu_context,
- const struct sockaddr *sa)
- {
- struct qb_list_head *list;
- struct totemudpu_member *member;
- struct totemudpu_member *res_member;
- const struct totemudpu_instance *instance = (const struct totemudpu_instance *)udpu_context;
- res_member = NULL;
- qb_list_for_each(list, &(instance->member_list)) {
- member = qb_list_entry (list,
- struct totemudpu_member,
- list);
- if (totemip_sa_equal(&member->member, sa)) {
- res_member = member;
- break ;
- }
- }
- return (res_member);
- }
- static int net_deliver_fn (
- int fd,
- int revents,
- void *data)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)data;
- struct msghdr msg_recv;
- struct iovec *iovec;
- struct sockaddr_storage system_from;
- int bytes_received;
- iovec = &instance->totemudpu_iov_recv;
- /*
- * Receive datagram
- */
- memset(&msg_recv, 0, sizeof(msg_recv));
- msg_recv.msg_name = &system_from;
- msg_recv.msg_namelen = sizeof (struct sockaddr_storage);
- msg_recv.msg_iov = iovec;
- msg_recv.msg_iovlen = 1;
- bytes_received = recvmsg (fd, &msg_recv, MSG_NOSIGNAL | MSG_DONTWAIT);
- if (bytes_received == -1) {
- return (0);
- } else {
- instance->stats_recv += bytes_received;
- }
- if (bytes_received >= UDP_RECEIVE_FRAME_SIZE_MAX + 1) {
- /*
- * Maximum packet size should be UDP_RECEIVE_FRAME_SIZE_MAX.
- * If received packet is UDP_RECEIVE_FRAME_SIZE_MAX + 1 it means packet was truncated
- * (iov_buffer size and iov_len are intentionally set to UDP_RECEIVE_FRAME_SIZE_MAX + 1).
- */
- log_printf (instance->totemudpu_log_level_error,
- "Received too big message. This may be because something bad is happening "
- "on the network (attack?), or you tried join more nodes than corosync is "
- "compiled with (%u) or bug in the code (bad estimation of "
- "the UDP_RECEIVE_FRAME_SIZE_MAX). Dropping packet.", PROCESSOR_COUNT_MAX);
- return (0);
- }
- if (instance->totem_config->block_unlisted_ips &&
- instance->netif_bind_state == BIND_STATE_REGULAR &&
- find_member_by_sockaddr(instance, (const struct sockaddr *)&system_from) == NULL) {
- log_printf(instance->totemudpu_log_level_debug, "Packet rejected from %s",
- totemip_sa_print((const struct sockaddr *)&system_from));
- return (0);
- }
- iovec->iov_len = bytes_received;
- /*
- * Handle incoming message
- */
- instance->totemudpu_deliver_fn (
- instance->context,
- iovec->iov_base,
- iovec->iov_len,
- &system_from);
- iovec->iov_len = UDP_RECEIVE_FRAME_SIZE_MAX + 1;
- return (0);
- }
- static int netif_determine (
- struct totemudpu_instance *instance,
- struct totem_ip_address *bindnet,
- struct totem_ip_address *bound_to,
- int *interface_up,
- int *interface_num)
- {
- int res;
- res = totemip_iface_check (bindnet, bound_to,
- interface_up, interface_num,
- instance->totem_config->clear_node_high_bit);
- return (res);
- }
- /*
- * If the interface is up, the sockets for totem are built. If the interface is down
- * this function is requeued in the timer list to retry building the sockets later.
- */
- static void timer_function_netif_check_timeout (
- void *data)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)data;
- int interface_up;
- int interface_num;
- /*
- * Build sockets for every interface
- */
- netif_determine (instance,
- &instance->totem_interface->bindnet,
- &instance->totem_interface->boundto,
- &interface_up, &interface_num);
- /*
- * If the network interface isn't back up and we are already
- * in loopback mode, add timer to check again and return
- */
- if ((instance->netif_bind_state == BIND_STATE_LOOPBACK &&
- interface_up == 0) ||
- (instance->my_memb_entries == 1 &&
- instance->netif_bind_state == BIND_STATE_REGULAR &&
- interface_up == 1)) {
- qb_loop_timer_add (instance->totemudpu_poll_handle,
- QB_LOOP_MED,
- instance->totem_config->downcheck_timeout*QB_TIME_NS_IN_MSEC,
- (void *)instance,
- timer_function_netif_check_timeout,
- &instance->timer_netif_check_timeout);
- /*
- * Add a timer to check for a downed regular interface
- */
- return;
- }
- if (instance->token_socket > 0) {
- qb_loop_poll_del (instance->totemudpu_poll_handle,
- instance->token_socket);
- close (instance->token_socket);
- instance->token_socket = -1;
- }
- if (interface_up == 0) {
- if (instance->netif_bind_state == BIND_STATE_UNBOUND) {
- log_printf (instance->totemudpu_log_level_error,
- "One of your ip addresses are now bound to localhost. "
- "Corosync would not work correctly.");
- exit(COROSYNC_DONE_FATAL_ERR);
- }
- /*
- * Interface is not up
- */
- instance->netif_bind_state = BIND_STATE_LOOPBACK;
- /*
- * Add a timer to retry building interfaces and request memb_gather_enter
- */
- qb_loop_timer_add (instance->totemudpu_poll_handle,
- QB_LOOP_MED,
- instance->totem_config->downcheck_timeout*QB_TIME_NS_IN_MSEC,
- (void *)instance,
- timer_function_netif_check_timeout,
- &instance->timer_netif_check_timeout);
- } else {
- /*
- * Interface is up
- */
- instance->netif_bind_state = BIND_STATE_REGULAR;
- }
- /*
- * Create and bind the multicast and unicast sockets
- */
- totemudpu_build_sockets (instance,
- &instance->totem_interface->bindnet,
- &instance->totem_interface->boundto);
- if (instance->netif_bind_state == BIND_STATE_REGULAR) {
- qb_loop_poll_add (instance->totemudpu_poll_handle,
- QB_LOOP_MED,
- instance->token_socket,
- POLLIN, instance, net_deliver_fn);
- }
- totemip_copy (&instance->my_id, &instance->totem_interface->boundto);
- /*
- * This reports changes in the interface to the user and totemsrp
- */
- if (instance->netif_bind_state == BIND_STATE_REGULAR) {
- if (instance->netif_state_report & NETIF_STATE_REPORT_UP) {
- log_printf (instance->totemudpu_log_level_notice,
- "The network interface [%s] is now up.",
- totemip_print (&instance->totem_interface->boundto));
- instance->netif_state_report = NETIF_STATE_REPORT_DOWN;
- instance->totemudpu_iface_change_fn (instance->context, &instance->my_id, 0);
- }
- /*
- * Add a timer to check for interface going down in single membership
- */
- if (instance->my_memb_entries == 1) {
- qb_loop_timer_add (instance->totemudpu_poll_handle,
- QB_LOOP_MED,
- instance->totem_config->downcheck_timeout*QB_TIME_NS_IN_MSEC,
- (void *)instance,
- timer_function_netif_check_timeout,
- &instance->timer_netif_check_timeout);
- }
- } else {
- if (instance->netif_state_report & NETIF_STATE_REPORT_DOWN) {
- log_printf (instance->totemudpu_log_level_notice,
- "The network interface is down.");
- instance->totemudpu_iface_change_fn (instance->context, &instance->my_id, 0);
- }
- instance->netif_state_report = NETIF_STATE_REPORT_UP;
- }
- }
/*
 * Set the socket priority to INTERACTIVE to ensure that our messages
 * don't get queued behind anything else.
 *
 * Compiles to an empty function where SO_PRIORITY is not defined.
 * A failing setsockopt() is logged as a warning and otherwise ignored.
 */
static void totemudpu_traffic_control_set(struct totemudpu_instance *instance, int sock)
{
#ifdef SO_PRIORITY
	int interactive_prio = 6; /* TC_PRIO_INTERACTIVE */
	int rc;

	rc = setsockopt(sock, SOL_SOCKET, SO_PRIORITY,
		&interactive_prio, sizeof(interactive_prio));
	if (rc != 0) {
		LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
			"Could not set traffic priority");
	}
#endif
}
- static int totemudpu_build_sockets_ip (
- struct totemudpu_instance *instance,
- struct totem_ip_address *bindnet_address,
- struct totem_ip_address *bound_to,
- int interface_num)
- {
- struct sockaddr_storage sockaddr;
- int addrlen;
- int res;
- unsigned int recvbuf_size;
- unsigned int optlen = sizeof (recvbuf_size);
- unsigned int retries = 0;
- /*
- * Setup unicast socket
- */
- instance->token_socket = socket (bindnet_address->family, SOCK_DGRAM, 0);
- if (instance->token_socket == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
- "socket() failed");
- return (-1);
- }
- totemip_nosigpipe (instance->token_socket);
- res = fcntl (instance->token_socket, F_SETFL, O_NONBLOCK);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
- "Could not set non-blocking operation on token socket");
- return (-1);
- }
- /*
- * Bind to unicast socket used for token send/receives
- * This has the side effect of binding to the correct interface
- */
- totemip_totemip_to_sockaddr_convert(bound_to, instance->totem_interface->ip_port, &sockaddr, &addrlen);
- while (1) {
- res = bind (instance->token_socket, (struct sockaddr *)&sockaddr, addrlen);
- if (res == 0) {
- break;
- }
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
- "bind token socket failed");
- if (++retries > BIND_MAX_RETRIES) {
- break;
- }
- /*
- * Wait for a while
- */
- (void)poll(NULL, 0, BIND_RETRIES_INTERVAL * retries);
- }
- if (res == -1) {
- return (-1);
- }
- /*
- * the token_socket can receive many messages. Allow a large number
- * of receive messages on this socket
- */
- recvbuf_size = MCAST_SOCKET_BUFFER_SIZE;
- res = setsockopt (instance->token_socket, SOL_SOCKET, SO_RCVBUF,
- &recvbuf_size, optlen);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_notice,
- "Could not set recvbuf size");
- }
- res = set_socket_dscp(instance->token_socket,
- instance->totem_config->ip_dscp);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_notice,
- "Could not set IP_TOS bits");
- }
- return 0;
- }
- int totemudpu_nodestatus_get (void *udpu_context, unsigned int nodeid,
- struct totem_node_status *node_status)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- struct qb_list_head *list;
- struct totemudpu_member *member;
- qb_list_for_each(list, &(instance->member_list)) {
- member = qb_list_entry (list,
- struct totemudpu_member,
- list);
- if (member->member.nodeid == nodeid) {
- node_status->nodeid = nodeid;
- /* reachable is filled in by totemsrp */
- if (instance->netif_bind_state == BIND_STATE_REGULAR) {
- node_status->link_status[0].enabled = 1;
- } else {
- node_status->link_status[0].enabled = 0;
- }
- node_status->link_status[0].connected = node_status->reachable;
- node_status->link_status[0].mtu = instance->totem_config->net_mtu;
- strncpy(node_status->link_status[0].src_ipaddr, totemip_print(&member->member), KNET_MAX_HOST_LEN-1);
- }
- }
- return (0);
- }
- int totemudpu_ifaces_get (
- void *net_context,
- char ***status,
- unsigned int *iface_count)
- {
- static char *statuses[INTERFACE_MAX] = {(char*)"OK"};
- if (status) {
- *status = statuses;
- }
- *iface_count = 1;
- return (0);
- }
- static int totemudpu_build_local_sockets(
- struct totemudpu_instance *instance)
- {
- int i;
- unsigned int sendbuf_size;
- unsigned int recvbuf_size;
- unsigned int optlen = sizeof (sendbuf_size);
- int res;
- /*
- * Create local multicast loop socket
- */
- if (socketpair(AF_UNIX, SOCK_DGRAM, 0, instance->local_loop_sock) == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
- "socket() failed");
- return (-1);
- }
- for (i = 0; i < 2; i++) {
- totemip_nosigpipe (instance->local_loop_sock[i]);
- res = fcntl (instance->local_loop_sock[i], F_SETFL, O_NONBLOCK);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
- "Could not set non-blocking operation on multicast socket");
- return (-1);
- }
- }
- recvbuf_size = MCAST_SOCKET_BUFFER_SIZE;
- sendbuf_size = MCAST_SOCKET_BUFFER_SIZE;
- res = setsockopt (instance->local_loop_sock[0], SOL_SOCKET, SO_RCVBUF, &recvbuf_size, optlen);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_debug,
- "Unable to set SO_RCVBUF size on UDP local mcast loop socket");
- return (-1);
- }
- res = setsockopt (instance->local_loop_sock[1], SOL_SOCKET, SO_SNDBUF, &sendbuf_size, optlen);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_debug,
- "Unable to set SO_SNDBUF size on UDP local mcast loop socket");
- return (-1);
- }
- res = getsockopt (instance->local_loop_sock[0], SOL_SOCKET, SO_RCVBUF, &recvbuf_size, &optlen);
- if (res == 0) {
- log_printf (instance->totemudpu_log_level_debug,
- "Local receive multicast loop socket recv buffer size (%d bytes).", recvbuf_size);
- }
- res = getsockopt (instance->local_loop_sock[1], SOL_SOCKET, SO_SNDBUF, &sendbuf_size, &optlen);
- if (res == 0) {
- log_printf (instance->totemudpu_log_level_debug,
- "Local transmit multicast loop socket send buffer size (%d bytes).", sendbuf_size);
- }
- return (0);
- }
- static int totemudpu_build_sockets (
- struct totemudpu_instance *instance,
- struct totem_ip_address *bindnet_address,
- struct totem_ip_address *bound_to)
- {
- int interface_num;
- int interface_up;
- int res;
- /*
- * Determine the ip address bound to and the interface name
- */
- res = netif_determine (instance,
- bindnet_address,
- bound_to,
- &interface_up,
- &interface_num);
- if (res == -1) {
- return (-1);
- }
- totemip_copy(&instance->my_id, bound_to);
- res = totemudpu_build_sockets_ip (instance,
- bindnet_address, bound_to, interface_num);
- if (res == -1) {
- /* if we get here, corosync won't work anyway, so better leaving than faking to work */
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_error,
- "Unable to create sockets, exiting");
- exit(EXIT_FAILURE);
- }
- /* We only send out of the token socket */
- totemudpu_traffic_control_set(instance, instance->token_socket);
- /*
- * Rebind all members to new ips
- */
- totemudpu_member_list_rebind_ip(instance);
- return res;
- }
- /*
- * Totem Network interface
- * depends on poll abstraction, POSIX, IPV4
- */
- /*
- * Create an instance
- */
- int totemudpu_initialize (
- qb_loop_t *poll_handle,
- void **udpu_context,
- struct totem_config *totem_config,
- totemsrp_stats_t *stats,
- void *context,
- int (*deliver_fn) (
- void *context,
- const void *msg,
- unsigned int msg_len,
- const struct sockaddr_storage *system_from),
- int (*iface_change_fn) (
- void *context,
- const struct totem_ip_address *iface_address,
- unsigned int ring_no),
- void (*mtu_changed) (
- void *context,
- int net_mtu),
- void (*target_set_completed) (
- void *context))
- {
- struct totemudpu_instance *instance;
- instance = malloc (sizeof (struct totemudpu_instance));
- if (instance == NULL) {
- return (-1);
- }
- totemudpu_instance_initialize (instance);
- instance->totem_config = totem_config;
- instance->stats = stats;
- /*
- * Configure logging
- */
- instance->totemudpu_log_level_security = 1; //totem_config->totem_logging_configuration.log_level_security;
- instance->totemudpu_log_level_error = totem_config->totem_logging_configuration.log_level_error;
- instance->totemudpu_log_level_warning = totem_config->totem_logging_configuration.log_level_warning;
- instance->totemudpu_log_level_notice = totem_config->totem_logging_configuration.log_level_notice;
- instance->totemudpu_log_level_debug = totem_config->totem_logging_configuration.log_level_debug;
- instance->totemudpu_subsys_id = totem_config->totem_logging_configuration.log_subsys_id;
- instance->totemudpu_log_printf = totem_config->totem_logging_configuration.log_printf;
- /*
- * Initialize local variables for totemudpu
- */
- instance->totem_interface = &totem_config->interfaces[0];
- memset (instance->iov_buffer, 0, UDP_RECEIVE_FRAME_SIZE_MAX + 1);
- instance->totemudpu_poll_handle = poll_handle;
- instance->totem_interface->bindnet.nodeid = instance->totem_config->node_id;
- instance->context = context;
- instance->totemudpu_deliver_fn = deliver_fn;
- instance->totemudpu_iface_change_fn = iface_change_fn;
- instance->totemudpu_target_set_completed = target_set_completed;
- /*
- * Create static local mcast sockets
- */
- if (totemudpu_build_local_sockets(instance) == -1) {
- free(instance);
- return (-1);
- }
- qb_loop_poll_add (
- instance->totemudpu_poll_handle,
- QB_LOOP_MED,
- instance->local_loop_sock[0],
- POLLIN, instance, net_deliver_fn);
- /*
- * RRP layer isn't ready to receive message because it hasn't
- * initialized yet. Add short timer to check the interfaces.
- */
- qb_loop_timer_add (instance->totemudpu_poll_handle,
- QB_LOOP_MED,
- 100*QB_TIME_NS_IN_MSEC,
- (void *)instance,
- timer_function_netif_check_timeout,
- &instance->timer_netif_check_timeout);
- totemudpu_start_merge_detect_timeout((void*)instance);
- *udpu_context = instance;
- return (0);
- }
- void *totemudpu_buffer_alloc (void)
- {
- return malloc (FRAME_SIZE_MAX);
- }
/*
 * Release a buffer obtained from totemudpu_buffer_alloc().
 * Passing NULL is allowed and does nothing.
 */
void totemudpu_buffer_release (void *ptr)
{
	/*
	 * No "return free (ptr);" here: ISO C does not allow a return
	 * statement with an expression in a function returning void.
	 */
	free (ptr);
}
- int totemudpu_processor_count_set (
- void *udpu_context,
- int processor_count)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- int res = 0;
- instance->my_memb_entries = processor_count;
- qb_loop_timer_del (instance->totemudpu_poll_handle,
- instance->timer_netif_check_timeout);
- if (processor_count == 1) {
- qb_loop_timer_add (instance->totemudpu_poll_handle,
- QB_LOOP_MED,
- instance->totem_config->downcheck_timeout*QB_TIME_NS_IN_MSEC,
- (void *)instance,
- timer_function_netif_check_timeout,
- &instance->timer_netif_check_timeout);
- }
- return (res);
- }
/*
 * Receive flush hook. Nothing to do for this transport.
 *
 * Returns 0.
 */
int totemudpu_recv_flush (void *udpu_context)
{
	(void)udpu_context;

	return (0);
}
/*
 * Send flush hook. Nothing to do for this transport.
 *
 * Returns 0.
 */
int totemudpu_send_flush (void *udpu_context)
{
	(void)udpu_context;

	return (0);
}
- int totemudpu_token_send (
- void *udpu_context,
- const void *msg,
- unsigned int msg_len)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- int res = 0;
- ucast_sendmsg (instance, &instance->token_target, msg, msg_len);
- return (res);
- }
/*
 * Send msg (msg_len bytes) through mcast_sendmsg in "flush" mode.
 *
 * The final mcast_sendmsg argument is 0 here (the noflush variant
 * passes 1). The outcome of the send is not reported to the caller;
 * this function always returns 0.
 */
int totemudpu_mcast_flush_send (
	void *udpu_context,
	const void *msg,
	unsigned int msg_len)
{
	struct totemudpu_instance *instance = udpu_context;

	mcast_sendmsg (instance, msg, msg_len, 0);

	return (0);
}
/*
 * Send msg (msg_len bytes) through mcast_sendmsg in "noflush" mode.
 *
 * The final mcast_sendmsg argument is 1 here (the flush variant
 * passes 0). The outcome of the send is not reported to the caller;
 * this function always returns 0.
 */
int totemudpu_mcast_noflush_send (
	void *udpu_context,
	const void *msg,
	unsigned int msg_len)
{
	struct totemudpu_instance *instance = udpu_context;

	mcast_sendmsg (instance, msg, msg_len, 1);

	return (0);
}
/*
 * Run the network interface check immediately.
 *
 * Invokes timer_function_netif_check_timeout directly with the instance
 * instead of waiting for the timer. Always returns 0.
 */
extern int totemudpu_iface_check (void *udpu_context)
{
	struct totemudpu_instance *instance = udpu_context;

	timer_function_netif_check_timeout (instance);

	return (0);
}
- extern void totemudpu_net_mtu_adjust (void *udpu_context, struct totem_config *totem_config)
- {
- totem_config->net_mtu -= totemip_udpip_header_size(totem_config->interfaces[0].bindnet.family);
- }
- int totemudpu_token_target_set (
- void *udpu_context,
- unsigned int nodeid)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- struct qb_list_head *list;
- struct totemudpu_member *member;
- int res = 0;
- qb_list_for_each(list, &(instance->member_list)) {
- member = qb_list_entry (list,
- struct totemudpu_member,
- list);
- if (member->member.nodeid == nodeid) {
- memcpy (&instance->token_target, &member->member,
- sizeof (struct totem_ip_address));
- instance->totemudpu_target_set_completed (instance->context);
- break;
- }
- }
- return (res);
- }
- extern int totemudpu_recv_mcast_empty (
- void *udpu_context)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- unsigned int res;
- struct sockaddr_storage system_from;
- struct msghdr msg_recv;
- struct pollfd ufd;
- int nfds, i;
- int msg_processed = 0;
- int sock;
- /*
- * Receive datagram
- */
- memset(&msg_recv, 0, sizeof(msg_recv));
- msg_recv.msg_name = &system_from;
- msg_recv.msg_namelen = sizeof (struct sockaddr_storage);
- msg_recv.msg_iov = &instance->totemudpu_iov_recv;
- msg_recv.msg_iovlen = 1;
- for (i = 0; i < 2; i++) {
- sock = -1;
- if (i == 0) {
- if (instance->netif_bind_state == BIND_STATE_REGULAR) {
- sock = instance->token_socket;
- } else {
- continue;
- }
- }
- if (i == 1) {
- sock = instance->local_loop_sock[0];
- }
- assert(sock != -1);
- do {
- ufd.fd = sock;
- ufd.events = POLLIN;
- nfds = poll (&ufd, 1, 0);
- if (nfds == 1 && ufd.revents & POLLIN) {
- res = recvmsg (sock, &msg_recv, MSG_NOSIGNAL | MSG_DONTWAIT);
- if (res != -1) {
- msg_processed = 1;
- } else {
- msg_processed = -1;
- }
- }
- } while (nfds == 1);
- }
- return (msg_processed);
- }
- static int totemudpu_create_sending_socket(
- void *udpu_context,
- const struct totem_ip_address *member)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- int fd;
- int res;
- unsigned int sendbuf_size;
- unsigned int optlen = sizeof (sendbuf_size);
- struct sockaddr_storage sockaddr;
- int addrlen;
- fd = socket (member->family, SOCK_DGRAM, 0);
- if (fd == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
- "Could not create socket for new member");
- return (-1);
- }
- totemip_nosigpipe (fd);
- res = fcntl (fd, F_SETFL, O_NONBLOCK);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
- "Could not set non-blocking operation on token socket");
- goto error_close_fd;
- }
- /*
- * These sockets are used to send multicast messages, so their buffers
- * should be large
- */
- sendbuf_size = MCAST_SOCKET_BUFFER_SIZE;
- res = setsockopt (fd, SOL_SOCKET, SO_SNDBUF,
- &sendbuf_size, optlen);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_notice,
- "Could not set sendbuf size");
- /*
- * Fail in setting sendbuf size is not fatal -> don't exit
- */
- }
- res = set_socket_dscp(fd, instance->totem_config->ip_dscp);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_notice,
- "Could not set IP_TOS bits");
- }
- /*
- * Bind to sending interface
- */
- totemip_totemip_to_sockaddr_convert(&instance->my_id, 0, &sockaddr, &addrlen);
- res = bind (fd, (struct sockaddr *)&sockaddr, addrlen);
- if (res == -1) {
- LOGSYS_PERROR (errno, instance->totemudpu_log_level_warning,
- "bind token socket failed");
- goto error_close_fd;
- }
- return (fd);
- error_close_fd:
- close(fd);
- return (-1);
- }
/*
 * Changing the interface address at runtime is not supported by this
 * transport: all arguments are ignored and -1 is always returned.
 */
int totemudpu_iface_set (void *net_context,
	const struct totem_ip_address *local_addr,
	unsigned short ip_port,
	unsigned int iface_no)
{
	(void)net_context;
	(void)local_addr;
	(void)ip_port;
	(void)iface_no;

	return (-1);
}
- int totemudpu_member_add (
- void *udpu_context,
- const struct totem_ip_address *local,
- const struct totem_ip_address *member,
- int ring_no)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- struct totemudpu_member *new_member;
- new_member = malloc (sizeof (struct totemudpu_member));
- if (new_member == NULL) {
- return (-1);
- }
- memset(new_member, 0, sizeof(*new_member));
- log_printf (LOGSYS_LEVEL_NOTICE, "adding new UDPU member {%s}",
- totemip_print(member));
- qb_list_init (&new_member->list);
- qb_list_add_tail (&new_member->list, &instance->member_list);
- memcpy (&new_member->member, member, sizeof (struct totem_ip_address));
- new_member->fd = totemudpu_create_sending_socket(udpu_context, member);
- new_member->active = 1;
- return (0);
- }
- int totemudpu_member_remove (
- void *udpu_context,
- const struct totem_ip_address *token_target,
- int ring_no)
- {
- int found = 0;
- struct qb_list_head *list;
- struct totemudpu_member *member;
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- /*
- * Find the member to remove and close its socket
- */
- qb_list_for_each(list, &(instance->member_list)) {
- member = qb_list_entry (list,
- struct totemudpu_member,
- list);
- if (totemip_compare (token_target, &member->member)==0) {
- log_printf(LOGSYS_LEVEL_NOTICE,
- "removing UDPU member {%s}",
- totemip_print(&member->member));
- if (member->fd > 0) {
- log_printf(LOGSYS_LEVEL_DEBUG,
- "Closing socket to: {%s}",
- totemip_print(&member->member));
- qb_loop_poll_del (instance->totemudpu_poll_handle,
- member->fd);
- close (member->fd);
- }
- found = 1;
- break;
- }
- }
- /*
- * Delete the member from the list
- */
- if (found) {
- qb_list_del (list);
- }
- instance = NULL;
- return (0);
- }
- int totemudpu_member_list_rebind_ip (
- void *udpu_context)
- {
- struct qb_list_head *list;
- struct totemudpu_member *member;
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- qb_list_for_each(list, &(instance->member_list)) {
- member = qb_list_entry (list,
- struct totemudpu_member,
- list);
- if (member->fd > 0) {
- close (member->fd);
- }
- member->fd = totemudpu_create_sending_socket(udpu_context, &member->member);
- }
- return (0);
- }
- static void timer_function_merge_detect_timeout (
- void *data)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)data;
- if (instance->merge_detect_messages_sent_before_timeout == 0) {
- instance->send_merge_detect_message = 1;
- }
- instance->merge_detect_messages_sent_before_timeout = 0;
- totemudpu_start_merge_detect_timeout(instance);
- }
- static void totemudpu_start_merge_detect_timeout(
- void *udpu_context)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- qb_loop_timer_add(instance->totemudpu_poll_handle,
- QB_LOOP_MED,
- instance->totem_config->merge_timeout * 2 * QB_TIME_NS_IN_MSEC,
- (void *)instance,
- timer_function_merge_detect_timeout,
- &instance->timer_merge_detect_timeout);
- }
- static void totemudpu_stop_merge_detect_timeout(
- void *udpu_context)
- {
- struct totemudpu_instance *instance = (struct totemudpu_instance *)udpu_context;
- qb_loop_timer_del(instance->totemudpu_poll_handle,
- instance->timer_merge_detect_timeout);
- }
/*
 * Runtime reconfiguration is not supported by this transport: both
 * arguments are ignored and -1 is always returned.
 */
int totemudpu_reconfigure (
	void *udpu_context,
	struct totem_config *totem_config)
{
	(void)udpu_context;
	(void)totem_config;

	return (-1);
}
|