12 #include <arpa/inet.h> 15 #include <netinet/in.h> 17 #include <sys/socket.h> 18 #include <sys/utsname.h> 21 #include <corosync/cfg.h> 22 #include <corosync/cmap.h> 23 #include <corosync/corodefs.h> 24 #include <corosync/corotypes.h> 25 #include <corosync/hdb.h> 26 #include <corosync/quorum.h> 27 #include <qb/qbipcc.h> 28 #include <qb/qbutil.h> 38 static quorum_handle_t pcmk_quorum_handle = 0;
40 static gboolean (*quorum_app_callback)(
unsigned long long seq,
41 gboolean quorate) = NULL;
61 crm_info(
"Node %s is not yet known by Corosync", node->
name);
68 node_name_is_valid(
const char *key,
const char *
name)
76 }
else if (sscanf(
name,
"%d.%d.%d.%d", &octet, &octet, &octet, &octet) == 4) {
77 crm_trace(
"%s contains an IPv4 address (%s), ignoring", key,
name);
80 }
else if (strstr(
name,
":") != NULL) {
81 crm_trace(
"%s contains an IPv6 address (%s), ignoring", key,
name);
106 cs_error_t rc = CS_OK;
109 cmap_handle_t local_handle = 0;
120 if (cmap_handle == 0 && local_handle == 0) {
122 crm_trace(
"Initializing CMAP connection");
124 rc = pcmk__init_cmap(&local_handle);
127 crm_debug(
"API connection setup failed: %s. Retrying in %ds", cs_strerror(rc),
132 }
while (retries < 5 && rc != CS_OK);
135 crm_warn(
"Could not connect to Cluster Configuration Database API, error %s",
141 if (cmap_handle == 0) {
142 cmap_handle = local_handle;
144 rc = cmap_fd_get(cmap_handle, &fd);
146 crm_err(
"Could not obtain the CMAP API connection: %s (%d)",
147 cs_strerror(rc), rc);
153 &found_uid, &found_gid))) {
154 crm_err(
"CMAP provider is not authentic:" 155 " process %lld (uid: %lld, gid: %lld)",
157 (
long long) found_uid, (
long long) found_gid);
160 crm_err(
"Could not verify authenticity of CMAP provider: %s (%d)",
166 while (
name == NULL && cmap_handle != 0) {
171 rc = cmap_get_uint32(cmap_handle, key, &
id);
172 crm_trace(
"Checking %u vs %u from %s", nodeid,
id, key);
180 crm_trace(
"Searching for node name for %u in nodelist.node.%d %s",
181 nodeid, lpc, pcmk__s(
name,
"<null>"));
184 cmap_get_string(cmap_handle, key, &
name);
190 cmap_get_string(cmap_handle, key, &
name);
193 if (!node_name_is_valid(key,
name)) {
207 cmap_finalize(local_handle);
211 crm_info(
"Unable to get node name for nodeid %u", nodeid);
227 if (pcmk_quorum_handle != 0) {
228 quorum_finalize(pcmk_quorum_handle);
229 pcmk_quorum_handle = 0;
243 quorum_dispatch_cb(gpointer user_data)
245 int rc = quorum_dispatch(pcmk_quorum_handle, CS_DISPATCH_ALL);
248 crm_err(
"Connection to the Quorum API failed: %d", rc);
249 quorum_finalize(pcmk_quorum_handle);
250 pcmk_quorum_handle = 0;
267 quorum_notification_cb(quorum_handle_t handle, uint32_t quorate,
268 uint64_t ring_id, uint32_t view_list_entries,
274 static gboolean init_phase = TRUE;
276 bool is_quorate = (quorate != 0);
279 if (is_quorate && !was_quorate) {
280 crm_notice(
"Quorum acquired " QB_XS
" membership=%" PRIu64
282 ring_id, view_list_entries);
285 }
else if (!is_quorate && was_quorate) {
286 crm_warn(
"Quorum lost " QB_XS
" membership=%" PRIu64
" members=" PRIu32,
287 ring_id, view_list_entries);
291 crm_info(
"Quorum %s " QB_XS
" membership=%" PRIu64
" members=%" PRIu32,
292 (is_quorate?
"retained" :
"still lost"), ring_id,
296 if (view_list_entries == 0 && init_phase) {
297 crm_info(
"Corosync membership is still forming, ignoring");
306 while (g_hash_table_iter_next(&iter, NULL, (gpointer *) &node)) {
307 node->membership_id = 0;
311 for (i = 0; i < view_list_entries; i++) {
312 uint32_t
id = view_list[i];
318 if (node->name == NULL) {
321 crm_info(
"Obtaining name for new node %u",
id);
334 if (quorum_app_callback) {
335 quorum_app_callback(ring_id, is_quorate);
349 void (*destroy)(gpointer))
354 uint32_t quorum_type = 0;
361 quorum_fd_callbacks.
dispatch = quorum_dispatch_cb;
364 crm_debug(
"Configuring Pacemaker to obtain quorum from Corosync");
369 quorum_model_v0_data_t quorum_model_data = {
370 .model = QUORUM_MODEL_V0,
371 .quorum_notify_fn = quorum_notification_cb,
374 rc = quorum_model_initialize(&pcmk_quorum_handle, QUORUM_MODEL_V0,
375 (quorum_model_data_t *) &quorum_model_data,
378 quorum_callbacks_t quorum_callbacks = {
379 .quorum_notify_fn = quorum_notification_cb,
382 rc = quorum_initialize(&pcmk_quorum_handle, &quorum_callbacks,
388 crm_err(
"Could not connect to the Quorum API: %s (%d)",
389 cs_strerror(rc), rc);
392 }
else if (quorum_type != QUORUM_SET) {
393 crm_err(
"Corosync quorum is not configured");
397 rc = quorum_fd_get(pcmk_quorum_handle, &fd);
399 crm_err(
"Could not obtain the Quorum API connection: %s (%d)",
406 &found_uid, &found_gid))) {
407 crm_err(
"Quorum provider is not authentic:" 408 " process %lld (uid: %lld, gid: %lld)",
410 (
long long) found_uid, (
long long) found_gid);
414 crm_err(
"Could not verify authenticity of Quorum provider: %s (%d)",
420 rc = quorum_getquorate(pcmk_quorum_handle, &quorate);
422 crm_err(
"Could not obtain the current Quorum API state: %d", rc);
434 rc = quorum_trackstart(pcmk_quorum_handle, CS_TRACK_CHANGES | CS_TRACK_CURRENT);
436 crm_err(
"Could not setup Quorum API notifications: %d", rc);
446 quorum_finalize(pcmk_quorum_handle);
468 crm_err(
"Invalid cluster layer: %s " QB_XS
" cluster_layer=%d",
469 cluster_layer_s, cluster_layer);
478 crm_info(
"Connection to %s established", cluster_layer_s);
482 crm_err(
"Could not determine local node ID");
488 crm_err(
"Could not determine local node name");
508 cmap_handle_t handle;
509 int rc = pcmk__init_cmap(&handle);
512 cmap_finalize(handle);
516 crm_info(
"Failed to initialize the cmap API: %s (%d)",
517 pcmk__cs_err_str(rc), rc);
533 crm_trace(
"Corosync peer inactive: NULL");
537 crm_trace(
"Corosync peer %s inactive: state=%s",
542 crm_trace(
"Corosync peer %s inactive " QB_XS
" processes=%.16" PRIx32,
561 cs_error_t rc = CS_OK;
564 cmap_handle_t cmap_handle;
572 rc = pcmk__init_cmap(&cmap_handle);
575 crm_debug(
"API connection setup failed: %s. Retrying in %ds", cs_strerror(rc),
580 }
while (retries < 5 && rc != CS_OK);
583 crm_warn(
"Could not connect to Cluster Configuration Database API, error %d", rc);
587 rc = cmap_fd_get(cmap_handle, &fd);
589 crm_err(
"Could not obtain the CMAP API connection: %s (%d)",
590 cs_strerror(rc), rc);
596 &found_uid, &found_gid))) {
597 crm_err(
"CMAP provider is not authentic:" 598 " process %lld (uid: %lld, gid: %lld)",
600 (
long long) found_uid, (
long long) found_gid);
603 crm_err(
"Could not verify authenticity of CMAP provider: %s (%d)",
609 crm_trace(
"Initializing Corosync node list");
610 for (lpc = 0; TRUE; lpc++) {
616 rc = cmap_get_uint32(cmap_handle, key, &nodeid);
629 while (g_hash_table_iter_next(&iter, NULL, (gpointer *) &node)) {
631 && (node->cluster_layer_id > 0)
632 && (node->cluster_layer_id != nodeid)
635 crm_crit(
"Nodes %" PRIu32
" and %" PRIu32
" share the " 636 "same name '%s': shutting down",
637 node->cluster_layer_id, nodeid,
name);
643 if (nodeid > 0 ||
name != NULL) {
644 crm_trace(
"Initializing node[%d] %u = %s", lpc, nodeid,
name);
648 if (nodeid > 0 &&
name != NULL) {
662 cmap_finalize(cmap_handle);
675 cmap_handle_t handle;
676 char *cluster_name = NULL;
677 cs_error_t rc = CS_OK;
684 rc = pcmk__init_cmap(&handle);
686 crm_info(
"Failed to initialize the cmap API: %s (%d)",
687 cs_strerror(rc), rc);
691 rc = cmap_fd_get(handle, &fd);
693 crm_err(
"Could not obtain the CMAP API connection: %s (%d)",
694 cs_strerror(rc), rc);
700 &found_uid, &found_gid))) {
701 crm_err(
"CMAP provider is not authentic:" 702 " process %lld (uid: %lld, gid: %lld)",
704 (
long long) found_uid, (
long long) found_gid);
707 crm_err(
"Could not verify authenticity of CMAP provider: %s (%d)",
712 rc = cmap_get_string(handle,
"totem.cluster_name", &cluster_name);
714 crm_info(
"Cannot get totem.cluster_name: %s (%d)", cs_strerror(rc), rc);
717 crm_debug(
"cmap totem.cluster_name = '%s'", cluster_name);
721 cmap_finalize(handle);
734 cs_error_t cs_rc = CS_OK;
736 cmap_handle_t cmap_handle;
737 cmap_iter_handle_t iter_handle;
738 char key_name[CMAP_KEYNAME_MAXLEN + 1];
745 static bool got_result =
false;
746 static bool result =
false;
754 cs_rc = pcmk__init_cmap(&cmap_handle);
755 if (cs_rc != CS_OK) {
757 crm_debug(
"CMAP connection failed: %s (rc=%d, retrying in %ds)",
758 cs_strerror(cs_rc), cs_rc, retries);
761 }
while ((retries < 5) && (cs_rc != CS_OK));
762 if (cs_rc != CS_OK) {
763 crm_warn(
"Assuming Corosync does not have node list: " 764 "CMAP connection failed (%s) " QB_XS
" rc=%d",
765 cs_strerror(cs_rc), cs_rc);
770 cs_rc = cmap_fd_get(cmap_handle, &fd);
771 if (cs_rc != CS_OK) {
772 crm_warn(
"Assuming Corosync does not have node list: " 773 "CMAP unusable (%s) " QB_XS
" rc=%d",
774 cs_strerror(cs_rc), cs_rc);
780 &found_pid, &found_uid, &found_gid);
782 crm_warn(
"Assuming Corosync does not have node list: " 783 "CMAP provider is inauthentic " 784 QB_XS
" pid=%lld uid=%lld gid=%lld",
786 (
long long) found_uid, (
long long) found_gid);
789 crm_warn(
"Assuming Corosync does not have node list: " 790 "Could not verify CMAP authenticity (%s) " QB_XS
" rc=%d",
796 cs_rc = cmap_iter_init(cmap_handle,
"nodelist", &iter_handle);
797 if (cs_rc != CS_OK) {
798 crm_warn(
"Assuming Corosync does not have node list: " 799 "CMAP not readable (%s) " QB_XS
" rc=%d",
800 cs_strerror(cs_rc), cs_rc);
804 cs_rc = cmap_iter_next(cmap_handle, iter_handle, key_name, NULL, NULL);
805 if (cs_rc == CS_OK) {
809 cmap_iter_finalize(cmap_handle, iter_handle);
814 cmap_finalize(cmap_handle);
pcmk__node_status_t * pcmk__get_node(unsigned int id, const char *uname, const char *xml_id, uint32_t flags)
#define crm_notice(fmt, args...)
uint32_t pcmk__cpg_local_nodeid(cpg_handle_t handle)
const char * pcmk_strerror(int rc)
#define crm_crit(fmt, args...)
mainloop_io_t * mainloop_add_fd(const char *name, int priority, int fd, void *userdata, struct mainloop_fd_callbacks *callbacks)
_Noreturn crm_exit_t crm_exit(crm_exit_t rc)
const char * pcmk_cluster_layer_text(enum pcmk_cluster_layer layer)
Get a log-friendly string equivalent of a cluster layer.
void pcmk__reap_unseen_nodes(uint64_t ring_id)
char * pcmk__corosync_name(uint64_t cmap_handle, uint32_t nodeid)
void(* destroy)(gpointer userdata)
Destroy function for mainloop file descriptor client data.
Search for cluster nodes from membership cache.
void pcmk__corosync_quorum_connect(gboolean(*dispatch)(unsigned long long, gboolean), void(*destroy)(gpointer))
#define PCMK__SPECIAL_PID_AS_0(p)
bool pcmk__corosync_add_nodes(xmlNode *xml_parent)
char * node_name
Local node name at cluster layer.
uint32_t cluster_layer_id
Cluster-layer numeric node ID.
char * pcmk__corosync_cluster_name(void)
Wrappers for and extensions to glib mainloop.
xmlNode * pcmk__xe_create(xmlNode *parent, const char *name)
int pcmk__cpg_connect(pcmk_cluster_t *cluster)
Connect to Corosync CPG.
const char * crm_xml_add_ll(xmlNode *node, const char *name, long long value)
Create an XML attribute with specified name and long long int value.
G_GNUC_INTERNAL void pcmk__cluster_set_quorum(bool quorate)
const char * crm_xml_add(xmlNode *node, const char *name, const char *value)
Create an XML attribute with specified name and value.
int(* dispatch)(gpointer userdata)
Dispatch function for mainloop file descriptor with data ready.
#define crm_warn(fmt, args...)
#define crm_debug(fmt, args...)
bool pcmk__cluster_has_quorum(void)
int pcmk__corosync_connect(pcmk_cluster_t *cluster)
#define crm_trace(fmt, args...)
#define PCMK_VALUE_MEMBER
#define pcmk_is_set(g, f)
Convenience alias for pcmk_all_flags_set(), to check single flag.
char * pcmk__corosync_uuid(const pcmk__node_status_t *node)
Wrappers for and extensions to libxml2.
void pcmk__cluster_init_node_caches(void)
uint32_t node_id
Local node ID at cluster layer.
#define pcmk__assert(expr)
bool pcmk__corosync_is_peer_active(const pcmk__node_status_t *node)
pcmk__action_result_t result
void pcmk__cpg_disconnect(pcmk_cluster_t *cluster)
#define crm_err(fmt, args...)
pcmk__node_status_t * pcmk__update_peer_state(const char *source, pcmk__node_status_t *node, const char *state, uint64_t membership)
Update a node's state and membership information.
GHashTable * pcmk__peer_cache
pcmk_cluster_layer
Types of cluster layer.
char * pcmk__cluster_node_name(uint32_t nodeid)
bool pcmk__corosync_has_nodelist(void)
IPC interface to Pacemaker daemons.
bool pcmk__corosync_is_active(void)
#define crm_info(fmt, args...)
pcmk__cluster_private_t * priv
Node status data (may be a cluster node or a Pacemaker Remote node)
enum pcmk_cluster_layer pcmk_get_cluster_layer(void)
Get and validate the local cluster layer.
char * name
Node name as known to cluster layer, or Pacemaker Remote node name.
void pcmk__corosync_disconnect(pcmk_cluster_t *cluster)
char * crm_strdup_printf(char const *format,...) G_GNUC_PRINTF(1
int crm_ipc_is_authentic_process(int sock, uid_t refuid, gid_t refgid, pid_t *gotpid, uid_t *gotuid, gid_t *gotgid)
Check the authenticity of the IPC socket peer process (legacy)