12 #include <arpa/inet.h> 15 #include <netinet/in.h> 17 #include <sys/socket.h> 18 #include <sys/utsname.h> 21 #include <corosync/cfg.h> 22 #include <corosync/cmap.h> 23 #include <corosync/corodefs.h> 24 #include <corosync/corotypes.h> 25 #include <corosync/hdb.h> 26 #include <corosync/quorum.h> 27 #include <qb/qbipcc.h> 28 #include <qb/qbutil.h> 38 static quorum_handle_t pcmk_quorum_handle = 0;
40 static gboolean (*quorum_app_callback)(
unsigned long long seq,
41 gboolean quorate) = NULL;
61 crm_info(
"Node %s is not yet known by Corosync", node->
uname);
68 node_name_is_valid(
const char *key,
const char *
name)
76 }
else if (sscanf(
name,
"%d.%d.%d.%d", &octet, &octet, &octet, &octet) == 4) {
77 crm_trace(
"%s contains an IPv4 address (%s), ignoring", key,
name);
80 }
else if (strstr(
name,
":") != NULL) {
81 crm_trace(
"%s contains an IPv6 address (%s), ignoring", key,
name);
106 cs_error_t rc = CS_OK;
109 cmap_handle_t local_handle = 0;
120 if (cmap_handle == 0 && local_handle == 0) {
122 crm_trace(
"Initializing CMAP connection");
124 rc = pcmk__init_cmap(&local_handle);
127 crm_debug(
"API connection setup failed: %s. Retrying in %ds", cs_strerror(rc),
132 }
while (retries < 5 && rc != CS_OK);
135 crm_warn(
"Could not connect to Cluster Configuration Database API, error %s",
141 if (cmap_handle == 0) {
142 cmap_handle = local_handle;
144 rc = cmap_fd_get(cmap_handle, &fd);
146 crm_err(
"Could not obtain the CMAP API connection: %s (%d)",
147 cs_strerror(rc), rc);
153 &found_uid, &found_gid))) {
154 crm_err(
"CMAP provider is not authentic:" 155 " process %lld (uid: %lld, gid: %lld)",
157 (
long long) found_uid, (
long long) found_gid);
160 crm_err(
"Could not verify authenticity of CMAP provider: %s (%d)",
166 while (
name == NULL && cmap_handle != 0) {
171 rc = cmap_get_uint32(cmap_handle, key, &
id);
172 crm_trace(
"Checking %u vs %u from %s", nodeid,
id, key);
180 crm_trace(
"Searching for node name for %u in nodelist.node.%d %s",
181 nodeid, lpc, pcmk__s(
name,
"<null>"));
184 cmap_get_string(cmap_handle, key, &
name);
190 cmap_get_string(cmap_handle, key, &
name);
193 if (!node_name_is_valid(key,
name)) {
207 cmap_finalize(local_handle);
211 crm_info(
"Unable to get node name for nodeid %u", nodeid);
227 if (pcmk_quorum_handle != 0) {
228 quorum_finalize(pcmk_quorum_handle);
229 pcmk_quorum_handle = 0;
243 quorum_dispatch_cb(gpointer user_data)
245 int rc = quorum_dispatch(pcmk_quorum_handle, CS_DISPATCH_ALL);
248 crm_err(
"Connection to the Quorum API failed: %d", rc);
249 quorum_finalize(pcmk_quorum_handle);
250 pcmk_quorum_handle = 0;
267 quorum_notification_cb(quorum_handle_t handle, uint32_t quorate,
268 uint64_t ring_id, uint32_t view_list_entries,
274 static gboolean init_phase = TRUE;
279 ring_id, (
long unsigned int)view_list_entries);
281 crm_warn(
"Quorum lost " CRM_XS " membership=%" PRIu64
" members=%lu",
282 ring_id, (
long unsigned int)view_list_entries);
287 crm_info(
"Quorum %s " CRM_XS " membership=%" PRIu64
" members=%lu",
288 (quorate?
"retained" :
"still lost"), ring_id,
289 (
long unsigned int)view_list_entries);
292 if (view_list_entries == 0 && init_phase) {
293 crm_info(
"Corosync membership is still forming, ignoring");
302 while (g_hash_table_iter_next(&iter, NULL, (gpointer *) &node)) {
307 for (i = 0; i < view_list_entries; i++) {
308 uint32_t
id = view_list[i];
314 if (node->uname == NULL) {
317 crm_info(
"Obtaining name for new node %u",
id);
330 if (quorum_app_callback) {
331 quorum_app_callback(ring_id, quorate);
345 void (*destroy)(gpointer))
350 uint32_t quorum_type = 0;
357 quorum_fd_callbacks.
dispatch = quorum_dispatch_cb;
360 crm_debug(
"Configuring Pacemaker to obtain quorum from Corosync");
365 quorum_model_v0_data_t quorum_model_data = {
366 .model = QUORUM_MODEL_V0,
367 .quorum_notify_fn = quorum_notification_cb,
370 rc = quorum_model_initialize(&pcmk_quorum_handle, QUORUM_MODEL_V0,
371 (quorum_model_data_t *) &quorum_model_data,
374 quorum_callbacks_t quorum_callbacks = {
375 .quorum_notify_fn = quorum_notification_cb,
378 rc = quorum_initialize(&pcmk_quorum_handle, &quorum_callbacks,
384 crm_err(
"Could not connect to the Quorum API: %s (%d)",
385 cs_strerror(rc), rc);
388 }
else if (quorum_type != QUORUM_SET) {
389 crm_err(
"Corosync quorum is not configured");
393 rc = quorum_fd_get(pcmk_quorum_handle, &fd);
395 crm_err(
"Could not obtain the Quorum API connection: %s (%d)",
402 &found_uid, &found_gid))) {
403 crm_err(
"Quorum provider is not authentic:" 404 " process %lld (uid: %lld, gid: %lld)",
406 (
long long) found_uid, (
long long) found_gid);
410 crm_err(
"Could not verify authenticity of Quorum provider: %s (%d)",
416 rc = quorum_getquorate(pcmk_quorum_handle, &quorate);
418 crm_err(
"Could not obtain the current Quorum API state: %d", rc);
430 rc = quorum_trackstart(pcmk_quorum_handle, CS_TRACK_CHANGES | CS_TRACK_CURRENT);
432 crm_err(
"Could not setup Quorum API notifications: %d", rc);
442 quorum_finalize(pcmk_quorum_handle);
465 crm_err(
"Invalid cluster layer: %s " CRM_XS " cluster_layer=%d",
466 cluster_layer_s, cluster_layer);
475 crm_info(
"Connection to %s established", cluster_layer_s);
478 if (cluster->
nodeid == 0) {
479 crm_err(
"Could not determine local node ID");
484 if (cluster->
uname == NULL) {
485 crm_err(
"Could not determine local node name");
506 cmap_handle_t handle;
507 int rc = pcmk__init_cmap(&handle);
510 cmap_finalize(handle);
514 crm_info(
"Failed to initialize the cmap API: %s (%d)",
515 pcmk__cs_err_str(rc), rc);
531 crm_trace(
"Corosync peer inactive: NULL");
535 crm_trace(
"Corosync peer %s inactive: state=%s",
540 crm_trace(
"Corosync peer %s inactive " CRM_XS " processes=%.16" PRIx32,
559 cs_error_t rc = CS_OK;
562 cmap_handle_t cmap_handle;
570 rc = pcmk__init_cmap(&cmap_handle);
573 crm_debug(
"API connection setup failed: %s. Retrying in %ds", cs_strerror(rc),
578 }
while (retries < 5 && rc != CS_OK);
581 crm_warn(
"Could not connect to Cluster Configuration Database API, error %d", rc);
585 rc = cmap_fd_get(cmap_handle, &fd);
587 crm_err(
"Could not obtain the CMAP API connection: %s (%d)",
588 cs_strerror(rc), rc);
594 &found_uid, &found_gid))) {
595 crm_err(
"CMAP provider is not authentic:" 596 " process %lld (uid: %lld, gid: %lld)",
598 (
long long) found_uid, (
long long) found_gid);
601 crm_err(
"Could not verify authenticity of CMAP provider: %s (%d)",
607 crm_trace(
"Initializing Corosync node list");
608 for (lpc = 0; TRUE; lpc++) {
614 rc = cmap_get_uint32(cmap_handle, key, &nodeid);
627 while (g_hash_table_iter_next(&iter, NULL, (gpointer *) &node)) {
628 if(node && node->uname && strcasecmp(node->uname,
name) == 0) {
629 if (node->id && node->id != nodeid) {
630 crm_crit(
"Nodes %u and %u share the same name '%s': shutting down", node->id,
638 if (nodeid > 0 ||
name != NULL) {
639 crm_trace(
"Initializing node[%d] %u = %s", lpc, nodeid,
name);
643 if (nodeid > 0 &&
name != NULL) {
657 cmap_finalize(cmap_handle);
670 cmap_handle_t handle;
671 char *cluster_name = NULL;
672 cs_error_t rc = CS_OK;
679 rc = pcmk__init_cmap(&handle);
681 crm_info(
"Failed to initialize the cmap API: %s (%d)",
682 cs_strerror(rc), rc);
686 rc = cmap_fd_get(handle, &fd);
688 crm_err(
"Could not obtain the CMAP API connection: %s (%d)",
689 cs_strerror(rc), rc);
695 &found_uid, &found_gid))) {
696 crm_err(
"CMAP provider is not authentic:" 697 " process %lld (uid: %lld, gid: %lld)",
699 (
long long) found_uid, (
long long) found_gid);
702 crm_err(
"Could not verify authenticity of CMAP provider: %s (%d)",
707 rc = cmap_get_string(handle,
"totem.cluster_name", &cluster_name);
709 crm_info(
"Cannot get totem.cluster_name: %s (%d)", cs_strerror(rc), rc);
712 crm_debug(
"cmap totem.cluster_name = '%s'", cluster_name);
716 cmap_finalize(handle);
729 cs_error_t cs_rc = CS_OK;
731 cmap_handle_t cmap_handle;
732 cmap_iter_handle_t iter_handle;
733 char key_name[CMAP_KEYNAME_MAXLEN + 1];
740 static bool got_result =
false;
741 static bool result =
false;
749 cs_rc = pcmk__init_cmap(&cmap_handle);
750 if (cs_rc != CS_OK) {
752 crm_debug(
"CMAP connection failed: %s (rc=%d, retrying in %ds)",
753 cs_strerror(cs_rc), cs_rc, retries);
756 }
while ((retries < 5) && (cs_rc != CS_OK));
757 if (cs_rc != CS_OK) {
758 crm_warn(
"Assuming Corosync does not have node list: " 759 "CMAP connection failed (%s) " CRM_XS " rc=%d",
760 cs_strerror(cs_rc), cs_rc);
765 cs_rc = cmap_fd_get(cmap_handle, &fd);
766 if (cs_rc != CS_OK) {
767 crm_warn(
"Assuming Corosync does not have node list: " 768 "CMAP unusable (%s) " CRM_XS " rc=%d",
769 cs_strerror(cs_rc), cs_rc);
775 &found_pid, &found_uid, &found_gid);
777 crm_warn(
"Assuming Corosync does not have node list: " 778 "CMAP provider is inauthentic " 779 CRM_XS " pid=%lld uid=%lld gid=%lld",
781 (
long long) found_uid, (
long long) found_gid);
784 crm_warn(
"Assuming Corosync does not have node list: " 785 "Could not verify CMAP authenticity (%s) " CRM_XS " rc=%d",
791 cs_rc = cmap_iter_init(cmap_handle,
"nodelist", &iter_handle);
792 if (cs_rc != CS_OK) {
793 crm_warn(
"Assuming Corosync does not have node list: " 794 "CMAP not readable (%s) " CRM_XS " rc=%d",
795 cs_strerror(cs_rc), cs_rc);
799 cs_rc = cmap_iter_next(cmap_handle, iter_handle, key_name, NULL, NULL);
800 if (cs_rc == CS_OK) {
804 cmap_iter_finalize(cmap_handle, iter_handle);
809 cmap_finalize(cmap_handle);
#define crm_notice(fmt, args...)
uint32_t pcmk__cpg_local_nodeid(cpg_handle_t handle)
const char * pcmk_strerror(int rc)
crm_node_t * pcmk__get_node(unsigned int id, const char *uname, const char *uuid, uint32_t flags)
#define crm_crit(fmt, args...)
mainloop_io_t * mainloop_add_fd(const char *name, int priority, int fd, void *userdata, struct mainloop_fd_callbacks *callbacks)
_Noreturn crm_exit_t crm_exit(crm_exit_t rc)
bool pcmk__corosync_is_peer_active(const crm_node_t *node)
const char * pcmk_cluster_layer_text(enum pcmk_cluster_layer layer)
Get a log-friendly string equivalent of a cluster layer.
void pcmk__reap_unseen_nodes(uint64_t ring_id)
char * pcmk__corosync_name(uint64_t cmap_handle, uint32_t nodeid)
void(* destroy)(gpointer userdata)
Destroy function for mainloop file descriptor client data.
Search for cluster nodes from membership cache.
void pcmk__corosync_quorum_connect(gboolean(*dispatch)(unsigned long long, gboolean), void(*destroy)(gpointer))
#define PCMK__SPECIAL_PID_AS_0(p)
const char * crm_xml_add(xmlNode *node, const char *name, const char *value)
Create an XML attribute with specified name and value.
bool pcmk__corosync_add_nodes(xmlNode *xml_parent)
char * pcmk__corosync_cluster_name(void)
Wrappers for and extensions to glib mainloop.
int pcmk__cpg_connect(pcmk_cluster_t *cluster)
Connect to Corosync CPG.
gboolean crm_is_corosync_peer_active(const crm_node_t *node)
int(* dispatch)(gpointer userdata)
Dispatch function for mainloop file descriptor with data ready.
#define crm_warn(fmt, args...)
crm_node_t * pcmk__update_peer_state(const char *source, crm_node_t *node, const char *state, uint64_t membership)
Update a node's state and membership information.
#define crm_debug(fmt, args...)
int pcmk__corosync_connect(pcmk_cluster_t *cluster)
#define crm_trace(fmt, args...)
char * crm_strdup_printf(char const *format,...) G_GNUC_PRINTF(1
#define pcmk_is_set(g, f)
Convenience alias for pcmk_all_flags_set(), to check single flag.
Wrappers for and extensions to libxml2.
void pcmk__cluster_init_node_caches(void)
Deprecated Pacemaker cluster API.
const char * crm_xml_add_ll(xmlNode *node, const char *name, long long value)
Create an XML attribute with specified name and long long int value.
pcmk__action_result_t result
void pcmk__cpg_disconnect(pcmk_cluster_t *cluster)
#define crm_err(fmt, args...)
pcmk_cluster_layer
Types of cluster layer.
char * pcmk__cluster_node_name(uint32_t nodeid)
bool pcmk__corosync_has_nodelist(void)
IPC interface to Pacemaker daemons.
char * pcmk__corosync_uuid(const crm_node_t *node)
bool pcmk__corosync_is_active(void)
xmlNode * pcmk__xe_create(xmlNode *parent, const char *name)
GHashTable * crm_peer_cache
#define crm_info(fmt, args...)
enum pcmk_cluster_layer pcmk_get_cluster_layer(void)
Get and validate the local cluster layer.
void pcmk__corosync_disconnect(pcmk_cluster_t *cluster)
int crm_ipc_is_authentic_process(int sock, uid_t refuid, gid_t refgid, pid_t *gotpid, uid_t *gotuid, gid_t *gotgid)
Check the authenticity of the IPC socket peer process (legacy)