mirror of
				https://git.proxmox.com/git/mirror_corosync
				synced 2025-10-25 17:17:43 +00:00 
			
		
		
		
	 45dd9861ff
			
		
	
	
		45dd9861ff
		
	
	
	
	
		
			
			Error message is displayed when it's impossible to create symlink to fdata file. Signed-off-by: Jan Friesse <jfriesse@redhat.com> Reviewed-by: Christine Caulfield <ccaulfie@redhat.com>
		
			
				
	
	
		
			1339 lines
		
	
	
		
			39 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			1339 lines
		
	
	
		
			39 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2002-2006 MontaVista Software, Inc.
 | |
|  * Copyright (c) 2006-2012 Red Hat, Inc.
 | |
|  *
 | |
|  * All rights reserved.
 | |
|  *
 | |
|  * Author: Steven Dake (sdake@redhat.com)
 | |
|  *
 | |
|  * This software licensed under BSD license, the text of which follows:
 | |
|  *
 | |
|  * Redistribution and use in source and binary forms, with or without
 | |
|  * modification, are permitted provided that the following conditions are met:
 | |
|  *
 | |
|  * - Redistributions of source code must retain the above copyright notice,
 | |
|  *   this list of conditions and the following disclaimer.
 | |
|  * - Redistributions in binary form must reproduce the above copyright notice,
 | |
|  *   this list of conditions and the following disclaimer in the documentation
 | |
|  *   and/or other materials provided with the distribution.
 | |
|  * - Neither the name of the MontaVista Software, Inc. nor the names of its
 | |
|  *   contributors may be used to endorse or promote products derived from this
 | |
|  *   software without specific prior written permission.
 | |
|  *
 | |
|  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | |
|  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | |
|  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 | |
|  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 | |
|  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 | |
|  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 | |
|  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 | |
|  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 | |
|  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 | |
|  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
 | |
|  * THE POSSIBILITY OF SUCH DAMAGE.
 | |
|  */
 | |
| 
 | |
| /**
 | |
|  * \mainpage Corosync
 | |
|  *
 | |
|  * This is the doxygen generated developer documentation for the Corosync
 | |
|  * project.  For more information about Corosync, please see the project
 | |
|  * web site, <a href="http://www.corosync.org">corosync.org</a>.
 | |
|  *
 | |
|  * \section license License
 | |
|  *
 | |
|  * This software licensed under BSD license, the text of which follows:
 | |
|  *
 | |
|  * Redistribution and use in source and binary forms, with or without
 | |
|  * modification, are permitted provided that the following conditions are met:
 | |
|  *
 | |
|  * - Redistributions of source code must retain the above copyright notice,
 | |
|  *   this list of conditions and the following disclaimer.
 | |
|  * - Redistributions in binary form must reproduce the above copyright notice,
 | |
|  *   this list of conditions and the following disclaimer in the documentation
 | |
|  *   and/or other materials provided with the distribution.
 | |
|  * - Neither the name of the MontaVista Software, Inc. nor the names of its
 | |
|  *   contributors may be used to endorse or promote products derived from this
 | |
|  *   software without specific prior written permission.
 | |
|  *
 | |
|  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | |
|  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | |
|  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 | |
|  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 | |
|  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 | |
|  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 | |
|  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 | |
|  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 | |
|  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 | |
|  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
 | |
|  * THE POSSIBILITY OF SUCH DAMAGE.
 | |
|  */
 | |
| 
 | |
| #include <config.h>
 | |
| 
 | |
| #include <pthread.h>
 | |
| #include <assert.h>
 | |
| #include <sys/types.h>
 | |
| #include <sys/file.h>
 | |
| #include <sys/poll.h>
 | |
| #include <sys/uio.h>
 | |
| #include <sys/mman.h>
 | |
| #include <sys/socket.h>
 | |
| #include <sys/un.h>
 | |
| #include <sys/time.h>
 | |
| #include <sys/resource.h>
 | |
| #include <sys/stat.h>
 | |
| #include <netinet/in.h>
 | |
| #include <arpa/inet.h>
 | |
| #include <unistd.h>
 | |
| #include <fcntl.h>
 | |
| #include <stdlib.h>
 | |
| #include <stdio.h>
 | |
| #include <errno.h>
 | |
| #include <signal.h>
 | |
| #include <sched.h>
 | |
| #include <time.h>
 | |
| #include <semaphore.h>
 | |
| 
 | |
| #include <qb/qbdefs.h>
 | |
| #include <qb/qblog.h>
 | |
| #include <qb/qbloop.h>
 | |
| #include <qb/qbutil.h>
 | |
| #include <qb/qbipcs.h>
 | |
| 
 | |
| #include <corosync/swab.h>
 | |
| #include <corosync/corotypes.h>
 | |
| #include <corosync/corodefs.h>
 | |
| #include <corosync/list.h>
 | |
| #include <corosync/totem/totempg.h>
 | |
| #include <corosync/logsys.h>
 | |
| #include <corosync/icmap.h>
 | |
| 
 | |
| #include "quorum.h"
 | |
| #include "totemsrp.h"
 | |
| #include "logconfig.h"
 | |
| #include "totemconfig.h"
 | |
| #include "main.h"
 | |
| #include "sync.h"
 | |
| #include "timer.h"
 | |
| #include "util.h"
 | |
| #include "apidef.h"
 | |
| #include "service.h"
 | |
| #include "schedwrk.h"
 | |
| 
 | |
| #ifdef HAVE_SMALL_MEMORY_FOOTPRINT
 | |
| #define IPC_LOGSYS_SIZE			1024*64
 | |
| #else
 | |
| #define IPC_LOGSYS_SIZE			8192*128
 | |
| #endif
 | |
| 
 | |
| LOGSYS_DECLARE_SYSTEM ("corosync",
 | |
| 	LOGSYS_MODE_OUTPUT_STDERR | LOGSYS_MODE_OUTPUT_SYSLOG,
 | |
| 	LOG_DAEMON,
 | |
| 	LOG_INFO);
 | |
| 
 | |
| LOGSYS_DECLARE_SUBSYS ("MAIN");
 | |
| 
 | |
| #define SERVER_BACKLOG 5
 | |
| 
 | |
| static int sched_priority = 0;
 | |
| 
 | |
| static unsigned int service_count = 32;
 | |
| 
 | |
| static struct totem_logging_configuration totem_logging_configuration;
 | |
| 
 | |
| static struct corosync_api_v1 *api = NULL;
 | |
| 
 | |
| static int sync_in_process = 1;
 | |
| 
 | |
| static qb_loop_t *corosync_poll_handle;
 | |
| 
 | |
| struct sched_param global_sched_param;
 | |
| 
 | |
| static corosync_timer_handle_t corosync_stats_timer_handle;
 | |
| 
 | |
| static const char *corosync_lock_file = LOCALSTATEDIR"/run/corosync.pid";
 | |
| 
 | |
| static int ip_version = AF_INET;
 | |
| 
 | |
| qb_loop_t *cs_poll_handle_get (void)
 | |
| {
 | |
| 	return (corosync_poll_handle);
 | |
| }
 | |
| 
 | |
| int cs_poll_dispatch_add (qb_loop_t * handle,
 | |
| 		int fd,
 | |
| 		int events,
 | |
| 		void *data,
 | |
| 
 | |
| 		int (*dispatch_fn) (int fd,
 | |
| 			int revents,
 | |
| 			void *data))
 | |
| {
 | |
| 	return qb_loop_poll_add(handle, QB_LOOP_MED, fd, events, data,
 | |
| 				dispatch_fn);
 | |
| }
 | |
| 
 | |
| int cs_poll_dispatch_delete(qb_loop_t * handle, int fd)
 | |
| {
 | |
| 	return qb_loop_poll_del(handle, fd);
 | |
| }
 | |
| 
 | |
| void corosync_state_dump (void)
 | |
| {
 | |
| 	int i;
 | |
| 
 | |
| 	for (i = 0; i < SERVICES_COUNT_MAX; i++) {
 | |
| 		if (corosync_service[i] && corosync_service[i]->exec_dump_fn) {
 | |
| 			corosync_service[i]->exec_dump_fn ();
 | |
| 		}
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static void corosync_blackbox_write_to_file (void)
 | |
| {
 | |
| 	char fname[PATH_MAX];
 | |
| 	char time_str[PATH_MAX];
 | |
| 	struct tm cur_time_tm;
 | |
| 	time_t cur_time_t;
 | |
| 
 | |
| 	cur_time_t = time(NULL);
 | |
| 	localtime_r(&cur_time_t, &cur_time_tm);
 | |
| 
 | |
| 	strftime(time_str, PATH_MAX, "%Y-%m-%dT%H:%M:%S", &cur_time_tm);
 | |
| 	snprintf(fname, PATH_MAX, "%s/fdata-%s-%lld",
 | |
| 	    LOCALSTATEDIR "/lib/corosync",
 | |
| 	    time_str,
 | |
| 	    (long long int)getpid());
 | |
| 
 | |
| 	qb_log_blackbox_write_to_file(fname);
 | |
| 
 | |
| 	unlink(LOCALSTATEDIR "/lib/corosync/fdata");
 | |
| 	if (symlink(fname, LOCALSTATEDIR "/lib/corosync/fdata") == -1) {
 | |
| 		log_printf(LOGSYS_LEVEL_ERROR, "Can't create symlink to '%s' for corosync blackbox file '%s'",
 | |
| 		    fname, LOCALSTATEDIR "/lib/corosync/fdata");
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static void unlink_all_completed (void)
 | |
| {
 | |
| 	api->timer_delete (corosync_stats_timer_handle);
 | |
| 	qb_loop_stop (corosync_poll_handle);
 | |
| 	icmap_fini();
 | |
| }
 | |
| 
 | |
| void corosync_shutdown_request (void)
 | |
| {
 | |
| 	corosync_service_unlink_all (api, unlink_all_completed);
 | |
| }
 | |
| 
 | |
| static int32_t sig_diag_handler (int num, void *data)
 | |
| {
 | |
| 	corosync_state_dump ();
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int32_t sig_exit_handler (int num, void *data)
 | |
| {
 | |
| 	log_printf(LOGSYS_LEVEL_NOTICE, "Node was shut down by a signal");
 | |
| 	corosync_service_unlink_all (api, unlink_all_completed);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static void sigsegv_handler (int num)
 | |
| {
 | |
| 	(void)signal (SIGSEGV, SIG_DFL);
 | |
| 	corosync_blackbox_write_to_file ();
 | |
| 	qb_log_fini();
 | |
| 	raise (SIGSEGV);
 | |
| }
 | |
| 
 | |
| static void sigabrt_handler (int num)
 | |
| {
 | |
| 	(void)signal (SIGABRT, SIG_DFL);
 | |
| 	corosync_blackbox_write_to_file ();
 | |
| 	qb_log_fini();
 | |
| 	raise (SIGABRT);
 | |
| }
 | |
| 
 | |
| #define LOCALHOST_IP inet_addr("127.0.0.1")
 | |
| 
 | |
| static void *corosync_group_handle;
 | |
| 
 | |
| static struct totempg_group corosync_group = {
 | |
| 	.group		= "a",
 | |
| 	.group_len	= 1
 | |
| };
 | |
| 
 | |
| static void serialize_lock (void)
 | |
| {
 | |
| }
 | |
| 
 | |
| static void serialize_unlock (void)
 | |
| {
 | |
| }
 | |
| 
 | |
| static void corosync_sync_completed (void)
 | |
| {
 | |
| 	log_printf (LOGSYS_LEVEL_NOTICE,
 | |
| 		"Completed service synchronization, ready to provide service.");
 | |
| 	sync_in_process = 0;
 | |
| 
 | |
| 	cs_ipcs_sync_state_changed(sync_in_process);
 | |
| 	cs_ipc_allow_connections(1);
 | |
| 	/*
 | |
| 	 * Inform totem to start using new message queue again
 | |
| 	 */
 | |
| 	totempg_trans_ack();
 | |
| }
 | |
| 
 | |
| static int corosync_sync_callbacks_retrieve (
 | |
| 	int service_id,
 | |
| 	struct sync_callbacks *callbacks)
 | |
| {
 | |
| 	if (corosync_service[service_id] == NULL) {
 | |
| 		return (-1);
 | |
| 	}
 | |
| 
 | |
| 	if (callbacks == NULL) {
 | |
| 		return (0);
 | |
| 	}
 | |
| 
 | |
| 	callbacks->name = corosync_service[service_id]->name;
 | |
| 
 | |
| 	callbacks->sync_init = corosync_service[service_id]->sync_init;
 | |
| 	callbacks->sync_process = corosync_service[service_id]->sync_process;
 | |
| 	callbacks->sync_activate = corosync_service[service_id]->sync_activate;
 | |
| 	callbacks->sync_abort = corosync_service[service_id]->sync_abort;
 | |
| 	return (0);
 | |
| }
 | |
| 
 | |
| static struct memb_ring_id corosync_ring_id;
 | |
| 
 | |
| static void member_object_joined (unsigned int nodeid)
 | |
| {
 | |
| 	char member_ip[ICMAP_KEYNAME_MAXLEN];
 | |
| 	char member_join_count[ICMAP_KEYNAME_MAXLEN];
 | |
| 	char member_status[ICMAP_KEYNAME_MAXLEN];
 | |
| 
 | |
| 	snprintf(member_ip, ICMAP_KEYNAME_MAXLEN,
 | |
| 		"runtime.totem.pg.mrp.srp.members.%u.ip", nodeid);
 | |
| 	snprintf(member_join_count, ICMAP_KEYNAME_MAXLEN,
 | |
| 		"runtime.totem.pg.mrp.srp.members.%u.join_count", nodeid);
 | |
| 	snprintf(member_status, ICMAP_KEYNAME_MAXLEN,
 | |
| 		"runtime.totem.pg.mrp.srp.members.%u.status", nodeid);
 | |
| 
 | |
| 	if (icmap_get(member_ip, NULL, NULL, NULL) == CS_OK) {
 | |
| 		icmap_inc(member_join_count);
 | |
| 		icmap_set_string(member_status, "joined");
 | |
| 	} else {
 | |
| 		icmap_set_string(member_ip, (char*)api->totem_ifaces_print (nodeid));
 | |
| 		icmap_set_uint32(member_join_count, 1);
 | |
| 		icmap_set_string(member_status, "joined");
 | |
| 	}
 | |
| 
 | |
| 	log_printf (LOGSYS_LEVEL_DEBUG,
 | |
| 		"Member joined: %s", api->totem_ifaces_print (nodeid));
 | |
| }
 | |
| 
 | |
| static void member_object_left (unsigned int nodeid)
 | |
| {
 | |
| 	char member_status[ICMAP_KEYNAME_MAXLEN];
 | |
| 
 | |
| 	snprintf(member_status, ICMAP_KEYNAME_MAXLEN,
 | |
| 		"runtime.totem.pg.mrp.srp.members.%u.status", nodeid);
 | |
| 	icmap_set_string(member_status, "left");
 | |
| 
 | |
| 	log_printf (LOGSYS_LEVEL_DEBUG,
 | |
| 		"Member left: %s", api->totem_ifaces_print (nodeid));
 | |
| }
 | |
| 
 | |
| static void confchg_fn (
 | |
| 	enum totem_configuration_type configuration_type,
 | |
| 	const unsigned int *member_list, size_t member_list_entries,
 | |
| 	const unsigned int *left_list, size_t left_list_entries,
 | |
| 	const unsigned int *joined_list, size_t joined_list_entries,
 | |
| 	const struct memb_ring_id *ring_id)
 | |
| {
 | |
| 	int i;
 | |
| 	int abort_activate = 0;
 | |
| 
 | |
| 	if (sync_in_process == 1) {
 | |
| 		abort_activate = 1;
 | |
| 	}
 | |
| 	sync_in_process = 1;
 | |
| 	cs_ipcs_sync_state_changed(sync_in_process);
 | |
| 	memcpy (&corosync_ring_id, ring_id, sizeof (struct memb_ring_id));
 | |
| 
 | |
| 	for (i = 0; i < left_list_entries; i++) {
 | |
| 		member_object_left (left_list[i]);
 | |
| 	}
 | |
| 	for (i = 0; i < joined_list_entries; i++) {
 | |
| 		member_object_joined (joined_list[i]);
 | |
| 	}
 | |
| 	/*
 | |
| 	 * Call configuration change for all services
 | |
| 	 */
 | |
| 	for (i = 0; i < service_count; i++) {
 | |
| 		if (corosync_service[i] && corosync_service[i]->confchg_fn) {
 | |
| 			corosync_service[i]->confchg_fn (configuration_type,
 | |
| 				member_list, member_list_entries,
 | |
| 				left_list, left_list_entries,
 | |
| 				joined_list, joined_list_entries, ring_id);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (abort_activate) {
 | |
| 		sync_abort ();
 | |
| 	}
 | |
| 	if (configuration_type == TOTEM_CONFIGURATION_TRANSITIONAL) {
 | |
| 		sync_save_transitional (member_list, member_list_entries, ring_id);
 | |
| 	}
 | |
| 	if (configuration_type == TOTEM_CONFIGURATION_REGULAR) {
 | |
| 		sync_start (member_list, member_list_entries, ring_id);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static void priv_drop (void)
 | |
| {
 | |
| 	return; /* TODO: we are still not dropping privs */
 | |
| }
 | |
| 
 | |
| static void corosync_tty_detach (void)
 | |
| {
 | |
| 	int devnull;
 | |
| 
 | |
| 	/*
 | |
| 	 * Disconnect from TTY if this is not a debug run
 | |
| 	 */
 | |
| 
 | |
| 	switch (fork ()) {
 | |
| 		case -1:
 | |
| 			corosync_exit_error (COROSYNC_DONE_FORK);
 | |
| 			break;
 | |
| 		case 0:
 | |
| 			/*
 | |
| 			 * child which is disconnected, run this process
 | |
| 			 */
 | |
| 			break;
 | |
| 		default:
 | |
| 			exit (0);
 | |
| 			break;
 | |
| 	}
 | |
| 
 | |
| 	/* Create new session */
 | |
| 	(void)setsid();
 | |
| 
 | |
| 	/*
 | |
| 	 * Map stdin/out/err to /dev/null.
 | |
| 	 */
 | |
| 	devnull = open("/dev/null", O_RDWR);
 | |
| 	if (devnull == -1) {
 | |
| 		corosync_exit_error (COROSYNC_DONE_STD_TO_NULL_REDIR);
 | |
| 	}
 | |
| 
 | |
| 	if (dup2(devnull, 0) < 0 || dup2(devnull, 1) < 0
 | |
| 	    || dup2(devnull, 2) < 0) {
 | |
| 		close(devnull);
 | |
| 		corosync_exit_error (COROSYNC_DONE_STD_TO_NULL_REDIR);
 | |
| 	}
 | |
| 	close(devnull);
 | |
| }
 | |
| 
 | |
| static void corosync_mlockall (void)
 | |
| {
 | |
| 	int res;
 | |
| 	struct rlimit rlimit;
 | |
| 
 | |
| 	rlimit.rlim_cur = RLIM_INFINITY;
 | |
| 	rlimit.rlim_max = RLIM_INFINITY;
 | |
| 
 | |
| #ifndef RLIMIT_MEMLOCK
 | |
| #define RLIMIT_MEMLOCK RLIMIT_VMEM
 | |
| #endif
 | |
| 
 | |
| 	setrlimit (RLIMIT_MEMLOCK, &rlimit);
 | |
| 
 | |
| 	res = mlockall (MCL_CURRENT | MCL_FUTURE);
 | |
| 	if (res == -1) {
 | |
| 		LOGSYS_PERROR (errno, LOGSYS_LEVEL_WARNING,
 | |
| 			"Could not lock memory of service to avoid page faults");
 | |
| 	};
 | |
| }
 | |
| 
 | |
| 
 | |
| static void corosync_totem_stats_updater (void *data)
 | |
| {
 | |
| 	totempg_stats_t * stats;
 | |
| 	uint32_t total_mtt_rx_token;
 | |
| 	uint32_t total_backlog_calc;
 | |
| 	uint32_t total_token_holdtime;
 | |
| 	int t, prev, i;
 | |
| 	int32_t token_count;
 | |
| 	char key_name[ICMAP_KEYNAME_MAXLEN];
 | |
| 
 | |
| 	stats = api->totem_get_stats();
 | |
| 
 | |
| 	icmap_set_uint32("runtime.totem.pg.msg_reserved", stats->msg_reserved);
 | |
| 	icmap_set_uint32("runtime.totem.pg.msg_queue_avail", stats->msg_queue_avail);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.orf_token_tx", stats->mrp->srp->orf_token_tx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.orf_token_rx", stats->mrp->srp->orf_token_rx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.memb_merge_detect_tx", stats->mrp->srp->memb_merge_detect_tx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.memb_merge_detect_rx", stats->mrp->srp->memb_merge_detect_rx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.memb_join_tx", stats->mrp->srp->memb_join_tx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.memb_join_rx", stats->mrp->srp->memb_join_rx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.mcast_tx", stats->mrp->srp->mcast_tx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.mcast_retx", stats->mrp->srp->mcast_retx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.mcast_rx", stats->mrp->srp->mcast_rx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.memb_commit_token_tx", stats->mrp->srp->memb_commit_token_tx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.memb_commit_token_rx", stats->mrp->srp->memb_commit_token_rx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.token_hold_cancel_tx", stats->mrp->srp->token_hold_cancel_tx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.token_hold_cancel_rx", stats->mrp->srp->token_hold_cancel_rx);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.operational_entered", stats->mrp->srp->operational_entered);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.operational_token_lost", stats->mrp->srp->operational_token_lost);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.gather_entered", stats->mrp->srp->gather_entered);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.gather_token_lost", stats->mrp->srp->gather_token_lost);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.commit_entered", stats->mrp->srp->commit_entered);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.commit_token_lost", stats->mrp->srp->commit_token_lost);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.recovery_entered", stats->mrp->srp->recovery_entered);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.recovery_token_lost", stats->mrp->srp->recovery_token_lost);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.consensus_timeouts", stats->mrp->srp->consensus_timeouts);
 | |
| 	icmap_set_uint64("runtime.totem.pg.mrp.srp.rx_msg_dropped", stats->mrp->srp->rx_msg_dropped);
 | |
| 	icmap_set_uint32("runtime.totem.pg.mrp.srp.continuous_gather", stats->mrp->srp->continuous_gather);
 | |
| 	icmap_set_uint32("runtime.totem.pg.mrp.srp.continuous_sendmsg_failures",
 | |
| 	    stats->mrp->srp->continuous_sendmsg_failures);
 | |
| 
 | |
| 	icmap_set_uint8("runtime.totem.pg.mrp.srp.firewall_enabled_or_nic_failure",
 | |
| 		stats->mrp->srp->continuous_gather > MAX_NO_CONT_GATHER ? 1 : 0);
 | |
| 
 | |
| 	if (stats->mrp->srp->continuous_gather > MAX_NO_CONT_GATHER ||
 | |
| 	    stats->mrp->srp->continuous_sendmsg_failures > MAX_NO_CONT_SENDMSG_FAILURES) {
 | |
| 		log_printf (LOGSYS_LEVEL_WARNING,
 | |
| 			"Totem is unable to form a cluster because of an "
 | |
| 			"operating system or network fault. The most common "
 | |
| 			"cause of this message is that the local firewall is "
 | |
| 			"configured improperly.");
 | |
| 		icmap_set_uint8("runtime.totem.pg.mrp.srp.firewall_enabled_or_nic_failure", 1);
 | |
| 	} else {
 | |
| 		icmap_set_uint8("runtime.totem.pg.mrp.srp.firewall_enabled_or_nic_failure", 0);
 | |
| 	}
 | |
| 
 | |
| 	for (i = 0; i < stats->mrp->srp->rrp->interface_count; i++) {
 | |
| 		snprintf(key_name, ICMAP_KEYNAME_MAXLEN, "runtime.totem.pg.mrp.rrp.%u.faulty", i);
 | |
| 		icmap_set_uint8(key_name, stats->mrp->srp->rrp->faulty[i]);
 | |
| 	}
 | |
| 	total_mtt_rx_token = 0;
 | |
| 	total_token_holdtime = 0;
 | |
| 	total_backlog_calc = 0;
 | |
| 	token_count = 0;
 | |
| 	t = stats->mrp->srp->latest_token;
 | |
| 	while (1) {
 | |
| 		if (t == 0)
 | |
| 			prev = TOTEM_TOKEN_STATS_MAX - 1;
 | |
| 		else
 | |
| 			prev = t - 1;
 | |
| 		if (prev == stats->mrp->srp->earliest_token)
 | |
| 			break;
 | |
| 		/* if tx == 0, then dropped token (not ours) */
 | |
| 		if (stats->mrp->srp->token[t].tx != 0 ||
 | |
| 			(stats->mrp->srp->token[t].rx - stats->mrp->srp->token[prev].rx) > 0 ) {
 | |
| 			total_mtt_rx_token += (stats->mrp->srp->token[t].rx - stats->mrp->srp->token[prev].rx);
 | |
| 			total_token_holdtime += (stats->mrp->srp->token[t].tx - stats->mrp->srp->token[t].rx);
 | |
| 			total_backlog_calc += stats->mrp->srp->token[t].backlog_calc;
 | |
| 			token_count++;
 | |
| 		}
 | |
| 		t = prev;
 | |
| 	}
 | |
| 	if (token_count) {
 | |
| 		icmap_set_uint32("runtime.totem.pg.mrp.srp.mtt_rx_token", (total_mtt_rx_token / token_count));
 | |
| 		icmap_set_uint32("runtime.totem.pg.mrp.srp.avg_token_workload", (total_token_holdtime / token_count));
 | |
| 		icmap_set_uint32("runtime.totem.pg.mrp.srp.avg_backlog_calc", (total_backlog_calc / token_count));
 | |
| 	}
 | |
| 
 | |
| 	cs_ipcs_stats_update();
 | |
| 
 | |
| 	api->timer_add_duration (1500 * MILLI_2_NANO_SECONDS, NULL,
 | |
| 		corosync_totem_stats_updater,
 | |
| 		&corosync_stats_timer_handle);
 | |
| }
 | |
| 
 | |
| static void totem_dynamic_notify(
 | |
| 	int32_t event,
 | |
| 	const char *key_name,
 | |
| 	struct icmap_notify_value new_val,
 | |
| 	struct icmap_notify_value old_val,
 | |
| 	void *user_data)
 | |
| {
 | |
| 	int res;
 | |
| 	unsigned int ring_no;
 | |
| 	unsigned int member_no;
 | |
| 	struct totem_ip_address member;
 | |
| 	int add_new_member = 0;
 | |
| 	int remove_old_member = 0;
 | |
| 	char tmp_str[ICMAP_KEYNAME_MAXLEN];
 | |
| 
 | |
| 	res = sscanf(key_name, "nodelist.node.%u.ring%u%s", &member_no, &ring_no, tmp_str);
 | |
| 	if (res != 3)
 | |
| 		return ;
 | |
| 
 | |
| 	if (strcmp(tmp_str, "_addr") != 0) {
 | |
| 		return;
 | |
| 	}
 | |
| 
 | |
| 	if (event == ICMAP_TRACK_ADD && new_val.type == ICMAP_VALUETYPE_STRING) {
 | |
| 		add_new_member = 1;
 | |
| 	}
 | |
| 
 | |
| 	if (event == ICMAP_TRACK_DELETE && old_val.type == ICMAP_VALUETYPE_STRING) {
 | |
| 		remove_old_member = 1;
 | |
| 	}
 | |
| 
 | |
| 	if (event == ICMAP_TRACK_MODIFY && new_val.type == ICMAP_VALUETYPE_STRING &&
 | |
| 			old_val.type == ICMAP_VALUETYPE_STRING) {
 | |
| 		add_new_member = 1;
 | |
| 		remove_old_member = 1;
 | |
| 	}
 | |
| 
 | |
| 	if (remove_old_member) {
 | |
| 		log_printf(LOGSYS_LEVEL_DEBUG,
 | |
| 			"removing dynamic member %s for ring %u", (char *)old_val.data, ring_no);
 | |
| 		if (totemip_parse(&member, (char *)old_val.data, ip_version) == 0) {
 | |
| 			totempg_member_remove (&member, ring_no);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (add_new_member) {
 | |
| 		log_printf(LOGSYS_LEVEL_DEBUG,
 | |
| 			"adding dynamic member %s for ring %u", (char *)new_val.data, ring_no);
 | |
| 		if (totemip_parse(&member, (char *)new_val.data, ip_version) == 0) {
 | |
| 			totempg_member_add (&member, ring_no);
 | |
| 		}
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static void corosync_totem_dynamic_init (void)
 | |
| {
 | |
| 	icmap_track_t icmap_track = NULL;
 | |
| 
 | |
| 	icmap_track_add("nodelist.node.",
 | |
| 		ICMAP_TRACK_ADD | ICMAP_TRACK_DELETE | ICMAP_TRACK_MODIFY | ICMAP_TRACK_PREFIX,
 | |
| 		totem_dynamic_notify,
 | |
| 		NULL,
 | |
| 		&icmap_track);
 | |
| }
 | |
| 
 | |
| static void corosync_totem_stats_init (void)
 | |
| {
 | |
| 	icmap_set_uint32("runtime.totem.pg.mrp.srp.mtt_rx_token", 0);
 | |
| 	icmap_set_uint32("runtime.totem.pg.mrp.srp.avg_token_workload", 0);
 | |
| 	icmap_set_uint32("runtime.totem.pg.mrp.srp.avg_backlog_calc", 0);
 | |
| 
 | |
| 	/* start stats timer */
 | |
| 	api->timer_add_duration (1500 * MILLI_2_NANO_SECONDS, NULL,
 | |
| 		corosync_totem_stats_updater,
 | |
| 		&corosync_stats_timer_handle);
 | |
| }
 | |
| 
 | |
| 
 | |
| static void deliver_fn (
 | |
| 	unsigned int nodeid,
 | |
| 	const void *msg,
 | |
| 	unsigned int msg_len,
 | |
| 	int endian_conversion_required)
 | |
| {
 | |
| 	const struct qb_ipc_request_header *header;
 | |
| 	int32_t service;
 | |
| 	int32_t fn_id;
 | |
| 	uint32_t id;
 | |
| 
 | |
| 	header = msg;
 | |
| 	if (endian_conversion_required) {
 | |
| 		id = swab32 (header->id);
 | |
| 	} else {
 | |
| 		id = header->id;
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Call the proper executive handler
 | |
| 	 */
 | |
| 	service = id >> 16;
 | |
| 	fn_id = id & 0xffff;
 | |
| 
 | |
| 	if (!corosync_service[service]) {
 | |
| 		return;
 | |
| 	}
 | |
| 	if (fn_id >= corosync_service[service]->exec_engine_count) {
 | |
| 		log_printf(LOGSYS_LEVEL_WARNING, "discarded unknown message %d for service %d (max id %d)",
 | |
| 			fn_id, service, corosync_service[service]->exec_engine_count);
 | |
| 		return;
 | |
| 	}
 | |
| 
 | |
| 	icmap_fast_inc(service_stats_rx[service][fn_id]);
 | |
| 
 | |
| 	if (endian_conversion_required) {
 | |
| 		assert(corosync_service[service]->exec_engine[fn_id].exec_endian_convert_fn != NULL);
 | |
| 		corosync_service[service]->exec_engine[fn_id].exec_endian_convert_fn
 | |
| 			((void *)msg);
 | |
| 	}
 | |
| 
 | |
| 	corosync_service[service]->exec_engine[fn_id].exec_handler_fn
 | |
| 		(msg, nodeid);
 | |
| }
 | |
| 
 | |
| int main_mcast (
 | |
|         const struct iovec *iovec,
 | |
|         unsigned int iov_len,
 | |
|         unsigned int guarantee)
 | |
| {
 | |
| 	const struct qb_ipc_request_header *req = iovec->iov_base;
 | |
| 	int32_t service;
 | |
| 	int32_t fn_id;
 | |
| 
 | |
| 	service = req->id >> 16;
 | |
| 	fn_id = req->id & 0xffff;
 | |
| 
 | |
| 	if (corosync_service[service]) {
 | |
| 		icmap_fast_inc(service_stats_tx[service][fn_id]);
 | |
| 	}
 | |
| 
 | |
| 	return (totempg_groups_mcast_joined (corosync_group_handle, iovec, iov_len, guarantee));
 | |
| }
 | |
| 
 | |
| static qb_loop_timer_handle recheck_the_q_level_timer;
 | |
| void corosync_recheck_the_q_level(void *data)
 | |
| {
 | |
| 	totempg_check_q_level(corosync_group_handle);
 | |
| 	if (cs_ipcs_q_level_get() == TOTEM_Q_LEVEL_CRITICAL) {
 | |
| 		qb_loop_timer_add(cs_poll_handle_get(), QB_LOOP_MED, 1*QB_TIME_NS_IN_MSEC,
 | |
| 			NULL, corosync_recheck_the_q_level, &recheck_the_q_level_timer);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| struct sending_allowed_private_data_struct {
 | |
| 	int reserved_msgs;
 | |
| };
 | |
| 
 | |
| 
 | |
| int corosync_sending_allowed (
 | |
| 	unsigned int service,
 | |
| 	unsigned int id,
 | |
| 	const void *msg,
 | |
| 	void *sending_allowed_private_data)
 | |
| {
 | |
| 	struct sending_allowed_private_data_struct *pd =
 | |
| 		(struct sending_allowed_private_data_struct *)sending_allowed_private_data;
 | |
| 	struct iovec reserve_iovec;
 | |
| 	struct qb_ipc_request_header *header = (struct qb_ipc_request_header *)msg;
 | |
| 	int sending_allowed;
 | |
| 
 | |
| 	reserve_iovec.iov_base = (char *)header;
 | |
| 	reserve_iovec.iov_len = header->size;
 | |
| 
 | |
| 	pd->reserved_msgs = totempg_groups_joined_reserve (
 | |
| 		corosync_group_handle,
 | |
| 		&reserve_iovec, 1);
 | |
| 	if (pd->reserved_msgs == -1) {
 | |
| 		return -EINVAL;
 | |
| 	}
 | |
| 
 | |
| 	sending_allowed = QB_FALSE;
 | |
| 	if (corosync_quorum_is_quorate() == 1 ||
 | |
| 	    corosync_service[service]->allow_inquorate == CS_LIB_ALLOW_INQUORATE) {
 | |
| 		// we are quorate
 | |
| 		// now check flow control
 | |
| 		if (corosync_service[service]->lib_engine[id].flow_control == CS_LIB_FLOW_CONTROL_NOT_REQUIRED) {
 | |
| 			sending_allowed = QB_TRUE;
 | |
| 		} else if (pd->reserved_msgs && sync_in_process == 0) {
 | |
| 			sending_allowed = QB_TRUE;
 | |
| 		} else if (pd->reserved_msgs == 0) {
 | |
| 			return -ENOBUFS;
 | |
| 		} else /* (sync_in_process) */ {
 | |
| 			return -EINPROGRESS;
 | |
| 		}
 | |
| 	} else {
 | |
| 		return -EHOSTUNREACH;
 | |
| 	}
 | |
| 
 | |
| 	return (sending_allowed);
 | |
| }
 | |
| 
 | |
| void corosync_sending_allowed_release (void *sending_allowed_private_data)
 | |
| {
 | |
| 	struct sending_allowed_private_data_struct *pd =
 | |
| 		(struct sending_allowed_private_data_struct *)sending_allowed_private_data;
 | |
| 
 | |
| 	if (pd->reserved_msgs == -1) {
 | |
| 		return;
 | |
| 	}
 | |
| 	totempg_groups_joined_release (pd->reserved_msgs);
 | |
| }
 | |
| 
 | |
| int message_source_is_local (const mar_message_source_t *source)
 | |
| {
 | |
| 	int ret = 0;
 | |
| 
 | |
| 	assert (source != NULL);
 | |
| 	if (source->nodeid == totempg_my_nodeid_get ()) {
 | |
| 		ret = 1;
 | |
| 	}
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| void message_source_set (
 | |
| 	mar_message_source_t *source,
 | |
| 	void *conn)
 | |
| {
 | |
| 	assert ((source != NULL) && (conn != NULL));
 | |
| 	memset (source, 0, sizeof (mar_message_source_t));
 | |
| 	source->nodeid = totempg_my_nodeid_get ();
 | |
| 	source->conn = conn;
 | |
| }
 | |
| 
 | |
| struct scheduler_pause_timeout_data {
 | |
| 	struct totem_config *totem_config;
 | |
| 	qb_loop_timer_handle handle;
 | |
| 	unsigned long long tv_prev;
 | |
| 	unsigned long long max_tv_diff;
 | |
| };
 | |
| 
 | |
| static void timer_function_scheduler_timeout (void *data)
 | |
| {
 | |
| 	struct scheduler_pause_timeout_data *timeout_data = (struct scheduler_pause_timeout_data *)data;
 | |
| 	unsigned long long tv_current;
 | |
| 	unsigned long long tv_diff;
 | |
| 
 | |
| 	tv_current = qb_util_nano_current_get ();
 | |
| 
 | |
| 	if (timeout_data->tv_prev == 0) {
 | |
| 		/*
 | |
| 		 * Initial call -> just pretent everything is ok
 | |
| 		 */
 | |
| 		timeout_data->tv_prev = tv_current;
 | |
| 		timeout_data->max_tv_diff = 0;
 | |
| 	}
 | |
| 
 | |
| 	tv_diff = tv_current - timeout_data->tv_prev;
 | |
| 	timeout_data->tv_prev = tv_current;
 | |
| 
 | |
| 	if (tv_diff > timeout_data->max_tv_diff) {
 | |
| 		log_printf (LOGSYS_LEVEL_WARNING, "Corosync main process was not scheduled for %0.4f ms "
 | |
| 		    "(threshold is %0.4f ms). Consider token timeout increase.",
 | |
| 		    (float)tv_diff / QB_TIME_NS_IN_MSEC, (float)timeout_data->max_tv_diff / QB_TIME_NS_IN_MSEC);
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Set next threshold, because token_timeout can change
 | |
| 	 */
 | |
| 	timeout_data->max_tv_diff = timeout_data->totem_config->token_timeout * QB_TIME_NS_IN_MSEC * 0.8;
 | |
| 	qb_loop_timer_add (corosync_poll_handle,
 | |
| 		QB_LOOP_MED,
 | |
| 		timeout_data->totem_config->token_timeout * QB_TIME_NS_IN_MSEC / 3,
 | |
| 		timeout_data,
 | |
| 		timer_function_scheduler_timeout,
 | |
| 		&timeout_data->handle);
 | |
| }
 | |
| 
 | |
| 
 | |
| static void corosync_setscheduler (void)
 | |
| {
 | |
| #if defined(HAVE_PTHREAD_SETSCHEDPARAM) && defined(HAVE_SCHED_GET_PRIORITY_MAX) && defined(HAVE_SCHED_SETSCHEDULER)
 | |
| 	int res;
 | |
| 
 | |
| 	sched_priority = sched_get_priority_max (SCHED_RR);
 | |
| 	if (sched_priority != -1) {
 | |
| 		global_sched_param.sched_priority = sched_priority;
 | |
| 		res = sched_setscheduler (0, SCHED_RR, &global_sched_param);
 | |
| 		if (res == -1) {
 | |
| 			LOGSYS_PERROR(errno, LOGSYS_LEVEL_WARNING,
 | |
| 				"Could not set SCHED_RR at priority %d",
 | |
| 				global_sched_param.sched_priority);
 | |
| 
 | |
| 			global_sched_param.sched_priority = 0;
 | |
| #ifdef HAVE_QB_LOG_THREAD_PRIORITY_SET
 | |
| 			qb_log_thread_priority_set (SCHED_OTHER, 0);
 | |
| #endif
 | |
| 		} else {
 | |
| 
 | |
| 			/*
 | |
| 			 * Turn on SCHED_RR in logsys system
 | |
| 			 */
 | |
| #ifdef HAVE_QB_LOG_THREAD_PRIORITY_SET
 | |
| 			res = qb_log_thread_priority_set (SCHED_RR, sched_priority);
 | |
| #else
 | |
| 			res = -1;
 | |
| #endif
 | |
| 			if (res == -1) {
 | |
| 				log_printf (LOGSYS_LEVEL_ERROR,
 | |
| 					    "Could not set logsys thread priority."
 | |
| 					    " Can't continue because of priority inversions.");
 | |
| 				corosync_exit_error (COROSYNC_DONE_LOGSETUP);
 | |
| 			}
 | |
| 		}
 | |
| 	} else {
 | |
| 		LOGSYS_PERROR (errno, LOGSYS_LEVEL_WARNING,
 | |
| 			"Could not get maximum scheduler priority");
 | |
| 		sched_priority = 0;
 | |
| 	}
 | |
| #else
 | |
| 	log_printf(LOGSYS_LEVEL_WARNING,
 | |
| 		"The Platform is missing process priority setting features.  Leaving at default.");
 | |
| #endif
 | |
| }
 | |
| 
 | |
| static void
 | |
| _logsys_log_printf(int level, int subsys,
 | |
| 		const char *function_name,
 | |
| 		const char *file_name,
 | |
| 		int file_line,
 | |
| 		const char *format,
 | |
| 		...) __attribute__((format(printf, 6, 7)));
 | |
| 
 | |
| static void
 | |
| _logsys_log_printf(int level, int subsys,
 | |
| 		const char *function_name,
 | |
| 		const char *file_name,
 | |
| 		int file_line,
 | |
| 		const char *format, ...)
 | |
| {
 | |
| 	va_list ap;
 | |
| 
 | |
| 	va_start(ap, format);
 | |
| 	qb_log_from_external_source_va(function_name, file_name,
 | |
| 				    format, level, file_line,
 | |
| 				    subsys, ap);
 | |
| 	va_end(ap);
 | |
| }
 | |
| 
 | |
| static void fplay_key_change_notify_fn (
 | |
| 	int32_t event,
 | |
| 	const char *key_name,
 | |
| 	struct icmap_notify_value new_val,
 | |
| 	struct icmap_notify_value old_val,
 | |
| 	void *user_data)
 | |
| {
 | |
| 	if (strcmp(key_name, "runtime.blackbox.dump_flight_data") == 0) {
 | |
| 		fprintf(stderr,"Writetofile\n");
 | |
| 		corosync_blackbox_write_to_file ();
 | |
| 	}
 | |
| 	if (strcmp(key_name, "runtime.blackbox.dump_state") == 0) {
 | |
| 		fprintf(stderr,"statefump\n");
 | |
| 		corosync_state_dump ();
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static void corosync_fplay_control_init (void)
 | |
| {
 | |
| 	icmap_track_t track = NULL;
 | |
| 
 | |
| 	icmap_set_string("runtime.blackbox.dump_flight_data", "no");
 | |
| 	icmap_set_string("runtime.blackbox.dump_state", "no");
 | |
| 
 | |
| 	icmap_track_add("runtime.blackbox.dump_flight_data",
 | |
| 			ICMAP_TRACK_ADD | ICMAP_TRACK_DELETE | ICMAP_TRACK_MODIFY,
 | |
| 			fplay_key_change_notify_fn,
 | |
| 			NULL, &track);
 | |
| 	icmap_track_add("runtime.blackbox.dump_state",
 | |
| 			ICMAP_TRACK_ADD | ICMAP_TRACK_DELETE | ICMAP_TRACK_MODIFY,
 | |
| 			fplay_key_change_notify_fn,
 | |
| 			NULL, &track);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Set RO flag for keys, which ether doesn't make sense to change by user (statistic)
 | |
|  * or which when changed are not reflected by runtime (totem.crypto_cipher, ...).
 | |
|  *
 | |
|  * Also some RO keys cannot be determined in this stage, so they are set later in
 | |
|  * other functions (like nodelist.local_node_pos, ...)
 | |
|  */
 | |
| static void set_icmap_ro_keys_flag (void)
 | |
| {
 | |
| 	/*
 | |
| 	 * Set RO flag for all keys of internal configuration and runtime statistics
 | |
| 	 */
 | |
| 	icmap_set_ro_access("internal_configuration.", CS_TRUE, CS_TRUE);
 | |
| 	icmap_set_ro_access("runtime.connections.", CS_TRUE, CS_TRUE);
 | |
| 	icmap_set_ro_access("runtime.totem.", CS_TRUE, CS_TRUE);
 | |
| 	icmap_set_ro_access("runtime.services.", CS_TRUE, CS_TRUE);
 | |
| 
 | |
| 	/*
 | |
| 	 * Set RO flag for constrete keys of configuration which can't be changed
 | |
| 	 * during runtime
 | |
| 	 */
 | |
| 	icmap_set_ro_access("totem.crypto_cipher", CS_FALSE, CS_TRUE);
 | |
| 	icmap_set_ro_access("totem.crypto_hash", CS_FALSE, CS_TRUE);
 | |
| 	icmap_set_ro_access("totem.secauth", CS_FALSE, CS_TRUE);
 | |
| 	icmap_set_ro_access("totem.ip_version", CS_FALSE, CS_TRUE);
 | |
| 	icmap_set_ro_access("totem.rrp_mode", CS_FALSE, CS_TRUE);
 | |
| 	icmap_set_ro_access("totem.netmtu", CS_FALSE, CS_TRUE);
 | |
| 	icmap_set_ro_access("qb.ipc_type", CS_FALSE, CS_TRUE);
 | |
| }
 | |
| 
 | |
| static void main_service_ready (void)
 | |
| {
 | |
| 	int res;
 | |
| 
 | |
| 	/*
 | |
| 	 * This must occur after totempg is initialized because "this_ip" must be set
 | |
| 	 */
 | |
| 	res = corosync_service_defaults_link_and_init (api);
 | |
| 	if (res == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "Could not initialize default services");
 | |
| 		corosync_exit_error (COROSYNC_DONE_INIT_SERVICES);
 | |
| 	}
 | |
| 	cs_ipcs_init();
 | |
| 	corosync_totem_stats_init ();
 | |
| 	corosync_fplay_control_init ();
 | |
| 	corosync_totem_dynamic_init ();
 | |
| 	sync_init (
 | |
| 		corosync_sync_callbacks_retrieve,
 | |
| 		corosync_sync_completed);
 | |
| }
 | |
| 
 | |
| static enum e_corosync_done corosync_flock (const char *lockfile, pid_t pid)
 | |
| {
 | |
| 	struct flock lock;
 | |
| 	enum e_corosync_done err;
 | |
| 	char pid_s[17];
 | |
| 	int fd_flag;
 | |
| 	int lf;
 | |
| 
 | |
| 	err = COROSYNC_DONE_EXIT;
 | |
| 
 | |
| 	lf = open (lockfile, O_WRONLY | O_CREAT, 0640);
 | |
| 	if (lf == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "Corosync Executive couldn't create lock file.");
 | |
| 		return (COROSYNC_DONE_AQUIRE_LOCK);
 | |
| 	}
 | |
| 
 | |
| retry_fcntl:
 | |
| 	lock.l_type = F_WRLCK;
 | |
| 	lock.l_start = 0;
 | |
| 	lock.l_whence = SEEK_SET;
 | |
| 	lock.l_len = 0;
 | |
| 	if (fcntl (lf, F_SETLK, &lock) == -1) {
 | |
| 		switch (errno) {
 | |
| 		case EINTR:
 | |
| 			goto retry_fcntl;
 | |
| 			break;
 | |
| 		case EAGAIN:
 | |
| 		case EACCES:
 | |
| 			log_printf (LOGSYS_LEVEL_ERROR, "Another Corosync instance is already running.");
 | |
| 			err = COROSYNC_DONE_ALREADY_RUNNING;
 | |
| 			goto error_close;
 | |
| 			break;
 | |
| 		default:
 | |
| 			log_printf (LOGSYS_LEVEL_ERROR, "Corosync Executive couldn't aquire lock. Error was %s",
 | |
| 			    strerror(errno));
 | |
| 			err = COROSYNC_DONE_AQUIRE_LOCK;
 | |
| 			goto error_close;
 | |
| 			break;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (ftruncate (lf, 0) == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "Corosync Executive couldn't truncate lock file. Error was %s",
 | |
| 		    strerror (errno));
 | |
| 		err = COROSYNC_DONE_AQUIRE_LOCK;
 | |
| 		goto error_close_unlink;
 | |
| 	}
 | |
| 
 | |
| 	memset (pid_s, 0, sizeof (pid_s));
 | |
| 	snprintf (pid_s, sizeof (pid_s) - 1, "%u\n", pid);
 | |
| 
 | |
| retry_write:
 | |
| 	if (write (lf, pid_s, strlen (pid_s)) != strlen (pid_s)) {
 | |
| 		if (errno == EINTR) {
 | |
| 			goto retry_write;
 | |
| 		} else {
 | |
| 			log_printf (LOGSYS_LEVEL_ERROR, "Corosync Executive couldn't write pid to lock file. "
 | |
| 				"Error was %s", strerror (errno));
 | |
| 			err = COROSYNC_DONE_AQUIRE_LOCK;
 | |
| 			goto error_close_unlink;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if ((fd_flag = fcntl (lf, F_GETFD, 0)) == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "Corosync Executive couldn't get close-on-exec flag from lock file. "
 | |
| 			"Error was %s", strerror (errno));
 | |
| 		err = COROSYNC_DONE_AQUIRE_LOCK;
 | |
| 		goto error_close_unlink;
 | |
| 	}
 | |
| 	fd_flag |= FD_CLOEXEC;
 | |
| 	if (fcntl (lf, F_SETFD, fd_flag) == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "Corosync Executive couldn't set close-on-exec flag to lock file. "
 | |
| 			"Error was %s", strerror (errno));
 | |
| 		err = COROSYNC_DONE_AQUIRE_LOCK;
 | |
| 		goto error_close_unlink;
 | |
| 	}
 | |
| 
 | |
| 	return (err);
 | |
| 
 | |
| error_close_unlink:
 | |
| 	unlink (lockfile);
 | |
| error_close:
 | |
| 	close (lf);
 | |
| 
 | |
| 	return (err);
 | |
| }
 | |
| 
 | |
| int main (int argc, char **argv, char **envp)
 | |
| {
 | |
| 	const char *error_string;
 | |
| 	struct totem_config totem_config;
 | |
| 	int res, ch;
 | |
| 	int background, setprio;
 | |
| 	struct stat stat_out;
 | |
| 	char corosync_lib_dir[PATH_MAX];
 | |
| 	enum e_corosync_done flock_err;
 | |
| 	uint64_t totem_config_warnings;
 | |
| 	struct scheduler_pause_timeout_data scheduler_pause_timeout_data;
 | |
| 
 | |
| 	/* default configuration
 | |
| 	 */
 | |
| 	background = 1;
 | |
| 	setprio = 0;
 | |
| 
 | |
| 	while ((ch = getopt (argc, argv, "fprv")) != EOF) {
 | |
| 
 | |
| 		switch (ch) {
 | |
| 			case 'f':
 | |
| 				background = 0;
 | |
| 				break;
 | |
| 			case 'p':
 | |
| 				break;
 | |
| 			case 'r':
 | |
| 				setprio = 1;
 | |
| 				break;
 | |
| 			case 'v':
 | |
| 				printf ("Corosync Cluster Engine, version '%s'\n", VERSION);
 | |
| 				printf ("Copyright (c) 2006-2009 Red Hat, Inc.\n");
 | |
| 				return EXIT_SUCCESS;
 | |
| 
 | |
| 				break;
 | |
| 			default:
 | |
| 				fprintf(stderr, \
 | |
| 					"usage:\n"\
 | |
| 					"        -f     : Start application in foreground.\n"\
 | |
| 					"        -p     : Does nothing.    \n"\
 | |
| 					"        -r     : Set round robin realtime scheduling \n"\
 | |
| 					"        -v     : Display version and SVN revision of Corosync and exit.\n");
 | |
| 				return EXIT_FAILURE;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Set round robin realtime scheduling with priority 99
 | |
| 	 * Lock all memory to avoid page faults which may interrupt
 | |
| 	 * application healthchecking
 | |
| 	 */
 | |
| 	if (setprio) {
 | |
| 		corosync_setscheduler ();
 | |
| 	}
 | |
| 
 | |
| 	corosync_mlockall ();
 | |
| 
 | |
| 	/*
 | |
| 	 * Other signals are registered later via qb_loop_signal_add
 | |
| 	 */
 | |
| 	(void)signal (SIGSEGV, sigsegv_handler);
 | |
| 	(void)signal (SIGABRT, sigabrt_handler);
 | |
| #if MSG_NOSIGNAL != 0
 | |
| 	(void)signal (SIGPIPE, SIG_IGN);
 | |
| #endif
 | |
| 
 | |
| 	if (icmap_init() != CS_OK) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "Corosync Executive couldn't initialize configuration component.");
 | |
| 		corosync_exit_error (COROSYNC_DONE_ICMAP);
 | |
| 	}
 | |
| 	set_icmap_ro_keys_flag();
 | |
| 
 | |
| 	/*
 | |
| 	 * Initialize the corosync_api_v1 definition
 | |
| 	 */
 | |
| 	api = apidef_get ();
 | |
| 
 | |
| 	res = coroparse_configparse(icmap_get_global_map(), &error_string);
 | |
| 	if (res == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "%s", error_string);
 | |
| 		corosync_exit_error (COROSYNC_DONE_MAINCONFIGREAD);
 | |
| 	}
 | |
| 
 | |
| 	res = corosync_log_config_read (&error_string);
 | |
| 	if (res == -1) {
 | |
| 		/*
 | |
| 		 * if we are here, we _must_ flush the logsys queue
 | |
| 		 * and try to inform that we couldn't read the config.
 | |
| 		 * this is a desperate attempt before certain death
 | |
| 		 * and there is no guarantee that we can print to stderr
 | |
| 		 * nor that logsys is sending the messages where we expect.
 | |
| 		 */
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "%s", error_string);
 | |
| 		fprintf(stderr, "%s", error_string);
 | |
| 		syslog (LOGSYS_LEVEL_ERROR, "%s", error_string);
 | |
| 		corosync_exit_error (COROSYNC_DONE_LOGCONFIGREAD);
 | |
| 	}
 | |
| 
 | |
| 	log_printf (LOGSYS_LEVEL_NOTICE, "Corosync Cluster Engine ('%s'): started and ready to provide service.", VERSION);
 | |
| 	log_printf (LOGSYS_LEVEL_INFO, "Corosync built-in features:" PACKAGE_FEATURES "");
 | |
| 
 | |
| 	/*
 | |
| 	 * Make sure required directory is present
 | |
| 	 */
 | |
| 	sprintf (corosync_lib_dir, "%s/lib/corosync", LOCALSTATEDIR);
 | |
| 	res = stat (corosync_lib_dir, &stat_out);
 | |
| 	if ((res == -1) || (res == 0 && !S_ISDIR(stat_out.st_mode))) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "Required directory not present %s.  Please create it.", corosync_lib_dir);
 | |
| 		corosync_exit_error (COROSYNC_DONE_DIR_NOT_PRESENT);
 | |
| 	}
 | |
| 
 | |
| 	res = totem_config_read (&totem_config, &error_string, &totem_config_warnings);
 | |
| 	if (res == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "%s", error_string);
 | |
| 		corosync_exit_error (COROSYNC_DONE_MAINCONFIGREAD);
 | |
| 	}
 | |
| 
 | |
| 	if (totem_config_warnings & TOTEM_CONFIG_WARNING_MEMBERS_IGNORED) {
 | |
| 		log_printf (LOGSYS_LEVEL_WARNING, "member section is used together with nodelist. Members ignored.");
 | |
| 	}
 | |
| 
 | |
| 	if (totem_config_warnings & TOTEM_CONFIG_WARNING_MEMBERS_DEPRECATED) {
 | |
| 		log_printf (LOGSYS_LEVEL_WARNING, "member section is deprecated.");
 | |
| 	}
 | |
| 
 | |
| 	if (totem_config_warnings & TOTEM_CONFIG_WARNING_TOTEM_NODEID_IGNORED) {
 | |
| 		log_printf (LOGSYS_LEVEL_WARNING, "nodeid appears both in totem section and nodelist. Nodelist one is used.");
 | |
| 	}
 | |
| 
 | |
| 	if (totem_config_warnings != 0) {
 | |
| 		log_printf (LOGSYS_LEVEL_WARNING, "Please migrate config file to nodelist.");
 | |
| 	}
 | |
| 
 | |
| 	res = totem_config_keyread (&totem_config, &error_string);
 | |
| 	if (res == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "%s", error_string);
 | |
| 		corosync_exit_error (COROSYNC_DONE_MAINCONFIGREAD);
 | |
| 	}
 | |
| 
 | |
| 	res = totem_config_validate (&totem_config, &error_string);
 | |
| 	if (res == -1) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "%s", error_string);
 | |
| 		corosync_exit_error (COROSYNC_DONE_MAINCONFIGREAD);
 | |
| 	}
 | |
| 
 | |
| 	ip_version = totem_config.ip_version;
 | |
| 
 | |
| 	totem_config.totem_logging_configuration = totem_logging_configuration;
 | |
| 	totem_config.totem_logging_configuration.log_subsys_id = _logsys_subsys_create("TOTEM", "totem,"
 | |
| 			"totemmrp.c,totemrrp.c,totemip.c,totemconfig.c,totemcrypto.c,totemsrp.c,"
 | |
| 			"totempg.c,totemiba.c,totemudp.c,totemudpu.c,totemnet.c");
 | |
| 
 | |
| 	totem_config.totem_logging_configuration.log_level_security = LOGSYS_LEVEL_WARNING;
 | |
| 	totem_config.totem_logging_configuration.log_level_error = LOGSYS_LEVEL_ERROR;
 | |
| 	totem_config.totem_logging_configuration.log_level_warning = LOGSYS_LEVEL_WARNING;
 | |
| 	totem_config.totem_logging_configuration.log_level_notice = LOGSYS_LEVEL_NOTICE;
 | |
| 	totem_config.totem_logging_configuration.log_level_debug = LOGSYS_LEVEL_DEBUG;
 | |
| 	totem_config.totem_logging_configuration.log_level_trace = LOGSYS_LEVEL_TRACE;
 | |
| 	totem_config.totem_logging_configuration.log_printf = _logsys_log_printf;
 | |
| 	logsys_config_apply();
 | |
| 
 | |
| 	/*
 | |
| 	 * Now we are fully initialized.
 | |
| 	 */
 | |
| 	if (background) {
 | |
| 		corosync_tty_detach ();
 | |
| 	}
 | |
| 
 | |
| 	corosync_poll_handle = qb_loop_create ();
 | |
| 
 | |
| 	memset(&scheduler_pause_timeout_data, 0, sizeof(scheduler_pause_timeout_data));
 | |
| 	scheduler_pause_timeout_data.totem_config = &totem_config;
 | |
| 	timer_function_scheduler_timeout (&scheduler_pause_timeout_data);
 | |
| 
 | |
| 	qb_loop_signal_add(corosync_poll_handle, QB_LOOP_LOW,
 | |
| 		SIGUSR2, NULL, sig_diag_handler, NULL);
 | |
| 	qb_loop_signal_add(corosync_poll_handle, QB_LOOP_HIGH,
 | |
| 		SIGINT, NULL, sig_exit_handler, NULL);
 | |
| 	qb_loop_signal_add(corosync_poll_handle, QB_LOOP_HIGH,
 | |
| 		SIGQUIT, NULL, sig_exit_handler, NULL);
 | |
| 	qb_loop_signal_add(corosync_poll_handle, QB_LOOP_HIGH,
 | |
| 		SIGTERM, NULL, sig_exit_handler, NULL);
 | |
| 
 | |
| 	if (logsys_thread_start() != 0) {
 | |
| 		log_printf (LOGSYS_LEVEL_ERROR, "Can't initialize log thread");
 | |
| 		corosync_exit_error (COROSYNC_DONE_LOGCONFIGREAD);
 | |
| 	}
 | |
| 
 | |
| 	if ((flock_err = corosync_flock (corosync_lock_file, getpid ())) != COROSYNC_DONE_EXIT) {
 | |
| 		corosync_exit_error (flock_err);
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * if totempg_initialize doesn't have root priveleges, it cannot
 | |
| 	 * bind to a specific interface.  This only matters if
 | |
| 	 * there is more then one interface in a system, so
 | |
| 	 * in this case, only a warning is printed
 | |
| 	 */
 | |
| 	/*
 | |
| 	 * Join multicast group and setup delivery
 | |
| 	 *  and configuration change functions
 | |
| 	 */
 | |
| 	totempg_initialize (
 | |
| 		corosync_poll_handle,
 | |
| 		&totem_config);
 | |
| 
 | |
| 	totempg_service_ready_register (
 | |
| 		main_service_ready);
 | |
| 
 | |
| 	totempg_groups_initialize (
 | |
| 		&corosync_group_handle,
 | |
| 		deliver_fn,
 | |
| 		confchg_fn);
 | |
| 
 | |
| 	totempg_groups_join (
 | |
| 		corosync_group_handle,
 | |
| 		&corosync_group,
 | |
| 		1);
 | |
| 
 | |
| 	/*
 | |
| 	 * Drop root privleges to user 'corosync'
 | |
| 	 * TODO: Don't really need full root capabilities;
 | |
| 	 *       needed capabilities are:
 | |
| 	 * CAP_NET_RAW (bindtodevice)
 | |
| 	 * CAP_SYS_NICE (setscheduler)
 | |
| 	 * CAP_IPC_LOCK (mlockall)
 | |
| 	 */
 | |
| 	priv_drop ();
 | |
| 
 | |
| 	schedwrk_init (
 | |
| 		serialize_lock,
 | |
| 		serialize_unlock);
 | |
| 
 | |
| 	/*
 | |
| 	 * Start main processing loop
 | |
| 	 */
 | |
| 	qb_loop_run (corosync_poll_handle);
 | |
| 
 | |
| 	/*
 | |
| 	 * Exit was requested
 | |
| 	 */
 | |
| 	totempg_finalize ();
 | |
| 
 | |
| 	/*
 | |
| 	 * free the loop resources
 | |
| 	 */
 | |
| 	qb_loop_destroy (corosync_poll_handle);
 | |
| 
 | |
| 	/*
 | |
| 	 * free up the icmap 
 | |
| 	 */
 | |
| 
 | |
| 	/*
 | |
| 	 * Remove pid lock file
 | |
| 	 */
 | |
| 	unlink (corosync_lock_file);
 | |
| 
 | |
| 	corosync_exit_error (COROSYNC_DONE_EXIT);
 | |
| 
 | |
| 	return EXIT_SUCCESS;
 | |
| }
 |