10 #include <sys/types.h> 20 is_matched_failure(
const char *rsc_id,
const xmlNode *conf_op_xml,
21 const xmlNode *lrm_op_xml)
23 gboolean matched = FALSE;
24 const char *conf_op_name = NULL;
25 const char *lrm_op_task = NULL;
26 const char *conf_op_interval_spec = NULL;
27 guint conf_op_interval_ms = 0;
28 guint lrm_op_interval_ms = 0;
29 const char *lrm_op_id = NULL;
30 char *last_failure_key = NULL;
32 if (rsc_id == NULL || conf_op_xml == NULL || lrm_op_xml == NULL) {
45 if ((conf_op_interval_ms != lrm_op_interval_ms)
50 lrm_op_id = pcmk__xe_id(lrm_op_xml);
51 last_failure_key =
pcmk__op_key(rsc_id,
"last_failure", 0);
57 char *expected_op_key =
pcmk__op_key(rsc_id, conf_op_name,
65 if (rc != target_rc) {
69 free(expected_op_key);
72 free(last_failure_key);
78 const xmlNode *xml_op)
100 gboolean should_block = FALSE;
105 int max = numXpathResults(xpathObj);
108 for (lpc = 0; lpc < max; lpc++) {
112 should_block = is_matched_failure(xml_name, pref, xml_op);
118 const char *conf_op_name = NULL;
119 const char *conf_op_interval_spec = NULL;
120 guint conf_op_interval_ms = 0;
121 char *lrm_op_xpath = NULL;
122 xmlXPathObject *lrm_op_xpathObj = NULL;
129 &conf_op_interval_ms);
131 #define XPATH_FMT "//" PCMK__XE_NODE_STATE "[@" PCMK_XA_UNAME "='%s']" \ 132 "//" PCMK__XE_LRM_RESOURCE "[@" PCMK_XA_ID "='%s']" \ 133 "/" PCMK__XE_LRM_RSC_OP "[@" PCMK_XA_OPERATION "='%s']" \ 134 "[@" PCMK_META_INTERVAL "='%u']" 139 conf_op_interval_ms);
145 if (lrm_op_xpathObj) {
146 int max2 = numXpathResults(lrm_op_xpathObj);
149 for (lpc2 = 0; lpc2 < max2; lpc2++) {
153 should_block = is_matched_failure(xml_name, pref,
206 generate_fail_regex(
const char *prefix,
const char *rsc_name,
bool is_unique,
209 char *pattern = NULL;
210 const char *op_pattern =
"#.+_[0-9]+";
216 const char *instance_pattern = (is_unique?
"" :
"(:[0-9]+)?");
219 instance_pattern, op_pattern);
220 if (regcomp(re, pattern, REG_EXTENDED|REG_NOSUB) != 0) {
242 generate_fail_regexes(
const pcmk_resource_t *rsc, regex_t *failcount_re,
243 regex_t *lastfailure_re)
246 char *rsc_name = rsc_fail_name(rsc);
257 regfree(failcount_re);
265 struct failcount_data {
269 const xmlNode *xml_op;
270 regex_t failcount_re;
271 regex_t lastfailure_re;
285 update_failcount_for_attr(gpointer key, gpointer value, gpointer user_data)
287 struct failcount_data *fc_data = user_data;
290 if (regexec(&(fc_data->failcount_re), (
const char *) key, 0, NULL, 0) == 0) {
296 "because '%s' is not a valid fail count: %s",
297 (
const char *) key, pcmk__node_name(fc_data->node),
302 pcmk__rsc_trace(fc_data->rsc,
"Added %s (%s) to %s fail count (now %s)",
303 (
const char *) key, (
const char *) value,
310 if (regexec(&(fc_data->lastfailure_re), (
const char *) key, 0, NULL,
316 crm_info(
"Ignoring invalid value '%s' for %s: %s",
317 (
const char *) value, (
const char *) key,
pcmk_rc_str(rc));
320 fc_data->last_failure = (time_t) QB_MAX(fc_data->last_failure, last_ll);
332 update_launched_failcount(gpointer
data, gpointer user_data)
335 struct failcount_data *fc_data = user_data;
336 time_t launched_last_failure = 0;
339 &launched_last_failure,
340 fc_data->flags, fc_data->xml_op);
341 fc_data->last_failure = QB_MAX(fc_data->last_failure, launched_last_failure);
344 #define readable_expiration(rsc) \ 345 pcmk__readable_interval((rsc)->priv->failure_expiration_ms) 365 time_t *last_failure, uint32_t
flags,
const xmlNode *xml_op)
367 struct failcount_data fc_data = {
373 .last_failure = (time_t) 0,
377 CRM_CHECK(generate_fail_regexes(rsc, &fc_data.failcount_re,
380 g_hash_table_foreach(node->
priv->
attrs, update_failcount_for_attr,
382 regfree(&(fc_data.failcount_re));
383 regfree(&(fc_data.lastfailure_re));
387 && block_failure(node, rsc, xml_op)) {
390 "because it conflicts with " 398 && (fc_data.last_failure > 0)
404 if (now > (fc_data.last_failure + expiration)) {
406 rsc->
id, pcmk__node_name(node),
408 fc_data.failcount = 0;
423 && (rsc->
priv->
launched != NULL) && !pcmk__is_bundled(rsc)) {
425 g_list_foreach(rsc->
priv->
launched, update_launched_failcount,
427 if (fc_data.failcount > 0) {
429 "Container %s and the resources within it " 430 "have failed %s time%s on %s",
433 pcmk__node_name(node));
436 }
else if (fc_data.failcount > 0) {
440 pcmk__node_name(node));
443 if (last_failure != NULL) {
444 if ((fc_data.failcount > 0) && (fc_data.last_failure > 0)) {
445 *last_failure = fc_data.last_failure;
450 return fc_data.failcount;
476 crm_notice(
"Clearing failure of %s on %s because %s " QB_XS
" %s",
477 rsc->
id, pcmk__node_name(node), reason, clear->
uuid);
#define CRM_CHECK(expr, failure_action)
#define crm_notice(fmt, args...)
const char * pcmk_readable_score(int score)
Return a displayable static string for a score value.
#define PCMK_XE_PRIMITIVE
#define pcmk__config_warn(fmt...)
#define pcmk__rsc_trace(rsc, fmt, args...)
int pe__target_rc_from_xml(const xmlNode *xml_op)
#define pcmk__rsc_info(rsc, fmt, args...)
#define pcmk__insert_meta(obj, name, value)
guint failure_expiration_ms
#define PCMK_ACTION_CLEAR_FAILCOUNT
const char * pcmk_rc_str(int rc)
Get a user-friendly description of a return code.
#define PCMK_XA_OPERATION
#define PCMK__LAST_FAILURE_PREFIX
#define pcmk__rsc_debug(rsc, fmt, args...)
int pe_get_failcount(const pcmk_node_t *node, pcmk_resource_t *rsc, time_t *last_failure, uint32_t flags, const xmlNode *xml_op)
pcmk__node_private_t * priv
int pcmk__scan_ll(const char *text, long long *result, long long default_value)
#define crm_warn(fmt, args...)
int crm_element_value_ms(const xmlNode *data, const char *name, guint *dest)
Retrieve the millisecond value of an XML attribute.
pcmk_scheduler_t * scheduler
char * clone_strip(const char *last_rsc_id)
int pcmk_parse_interval_spec(const char *input, guint *result_ms)
Parse milliseconds from a Pacemaker interval specification.
const char * crm_element_value(const xmlNode *data, const char *name)
Retrieve the value of an XML attribute.
#define pcmk_is_set(g, f)
Convenience alias for pcmk_all_flags_set(), to check single flag.
pcmk__resource_private_t * priv
Wrappers for and extensions to libxml2.
#define PCMK__FAIL_COUNT_PREFIX
char * pcmk__op_key(const char *rsc_id, const char *op_type, guint interval_ms)
Generate an operation key (RESOURCE_ACTION_INTERVAL)
int pcmk__add_scores(int score1, int score2)
pcmk_action_t * custom_action(pcmk_resource_t *rsc, char *key, const char *task, const pcmk_node_t *on_node, gboolean optional, pcmk_scheduler_t *scheduler)
Create or update an action object.
xmlXPathObjectPtr xpath_search(const xmlNode *xml_top, const char *path)
#define PCMK_META_INTERVAL
pcmk_scheduler_t * scheduler
#define PCMK__META_OP_NO_WAIT
xmlNode * getXpathResult(xmlXPathObjectPtr xpathObj, int index)
#define PCMK_META_ON_FAIL
int crm_element_value_int(const xmlNode *data, const char *name, int *dest)
Retrieve the integer value of an XML attribute.
guint pcmk__timeout_ms2s(guint timeout_ms)
int pcmk_parse_score(const char *score_s, int *score, int default_score)
Parse an integer score from a string.
#define pcmk__plural_s(i)
pcmk_action_t * pe__clear_failcount(pcmk_resource_t *rsc, const pcmk_node_t *node, const char *reason, pcmk_scheduler_t *scheduler)
Schedule a controller operation to clear a fail count.
#define readable_expiration(rsc)
time_t get_effective_time(pcmk_scheduler_t *scheduler)
void freeXpathObject(xmlXPathObjectPtr xpathObj)
#define crm_info(fmt, args...)
char * crm_strdup_printf(char const *format,...) G_GNUC_PRINTF(1