diff --git a/crmd/lrm.c b/crmd/lrm.c
index e12df4b5da..07e8e702ab 100644
--- a/crmd/lrm.c
+++ b/crmd/lrm.c
@@ -1,2520 +1,2520 @@
 /*
  * Copyright (C) 2004 Andrew Beekhof <andrew@beekhof.net>
  *
  * This program is free software; you can redistribute it and/or
  * modify it under the terms of the GNU General Public
  * License as published by the Free Software Foundation; either
  * version 2 of the License, or (at your option) any later version.
  *
  * This software is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * General Public License for more details.
  *
  * You should have received a copy of the GNU General Public
  * License along with this library; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
  */
 
 #include <crm_internal.h>
 
 #include <sys/param.h>
 #include <sys/types.h>
 #include <sys/wait.h>
 
 #include <crm/crm.h>
 #include <crm/services.h>
 
 #include <crm/msg_xml.h>
 #include <crm/common/xml.h>
 
 #include <crmd.h>
 #include <crmd_fsa.h>
 #include <crmd_messages.h>
 #include <crmd_callbacks.h>
 #include <crmd_lrm.h>
 
 /* 5 * 60 * 1000 (presumably five minutes in milliseconds -- confirm at the
  * use site); parenthesized so the expansion stays a single operand when the
  * macro is used inside a larger expression */
 #define START_DELAY_THRESHOLD (5 * 60 * 1000)
 /* Number of failed LRM sign-on attempts do_lrm_control() tolerates before
  * raising an error instead of retrying */
 #define MAX_LRM_REG_FAILS 30
 
 /* Context passed as user data to lrm_remove_deleted_rsc() while it scans
  * pending deletion operations */
 struct delete_event_s {
     /* Result code forwarded to notify_deleted() for each matching entry */
     int rc;
     /* Resource ID compared against each pending deletion's resource */
     const char *rsc;
     /* LRM state forwarded to notify_deleted() */
     lrm_state_t *lrm_state;
 };
 
 /* Forward declarations for functions that are used before their definition
  * in this file (NOTE(review): some definitions lie outside the portion
  * reviewed here) */
 static gboolean is_rsc_active(lrm_state_t * lrm_state, const char *rsc_id);
 static gboolean build_active_RAs(lrm_state_t * lrm_state, xmlNode * rsc_list);
 static gboolean stop_recurring_actions(gpointer key, gpointer value, gpointer user_data);
 static int delete_rsc_status(lrm_state_t * lrm_state, const char *rsc_id, int call_options,
                              const char *user_name);
 
 static lrmd_event_data_t *construct_op(lrm_state_t * lrm_state, xmlNode * rsc_op,
                                        const char *rsc_id, const char *operation);
 static void do_lrm_rsc_op(lrm_state_t * lrm_state, lrmd_rsc_info_t * rsc, const char *operation,
                           xmlNode * msg, xmlNode * request);
 
 /* Not static: this one has external linkage */
 void send_direct_ack(const char *to_host, const char *to_sys,
                      lrmd_rsc_info_t * rsc, lrmd_event_data_t * op, const char *rsc_id);
 
 static gboolean lrm_state_verify_stopped(lrm_state_t * lrm_state, enum crmd_fsa_state cur_state,
                                          int log_level);
 static int do_update_resource(const char *node_name, lrmd_rsc_info_t * rsc, lrmd_event_data_t * op);
 
 /*!
  * \internal
  * \brief React to the local LRM connection going away
  *
  * When the connection was still flagged as established, this logs the
  * failure, registers an I_ERROR input with the FSA and clears the flag.
  * Otherwise it only logs that the connection was disconnected.
  */
 static void
 lrm_connection_destroy(void)
 {
     if (!is_set(fsa_input_register, R_LRM_CONNECTED)) {
         /* The flag was already cleared, so nothing needs escalating */
         crm_info("LRM Connection disconnected");
         return;
     }
 
     crm_crit("LRM Connection failed");
     register_fsa_input(C_FSA_INTERNAL, I_ERROR, NULL);
     clear_bit(fsa_input_register, R_LRM_CONNECTED);
 }
 
 /*!
  * \internal
  * \brief Build an "<rsc>:<call_id>" identifier string
  *
  * \param[in] rsc      Resource name (must not be NULL)
  * \param[in] call_id  Call ID appended after the colon
  *
  * \return Newly allocated string that the caller must free, or NULL if the
  *         allocation failed
  */
 static char *
 make_stop_id(const char *rsc, int call_id)
 {
     /* Resource name plus 34 bytes for the colon, the number and the NUL */
     size_t size = strlen(rsc) + 34;
     char *op_id = calloc(1, size);
 
     if (op_id == NULL) {
         return NULL;
     }
 
     snprintf(op_id, size, "%s:%d", rsc, call_id);
     return op_id;
 }
 
 /*!
  * \internal
  * \brief Hash table iterator: copy an entry unless its key contains CRM_META "_"
  *
  * \param[in]     key        Entry name (string)
  * \param[in]     value      Entry value (string)
  * \param[in,out] user_data  Destination hash table receiving duplicated strings
  */
 static void
 copy_instance_keys(gpointer key, gpointer value, gpointer user_data)
 {
     const char *name = key;
 
     if (strstr(name, CRM_META "_") != NULL) {
         /* Meta attributes are not copied by this iterator */
         return;
     }
 
     g_hash_table_replace(user_data, strdup(name), strdup((const char *)value));
 }
 
 /*!
  * \internal
  * \brief Hash table iterator: copy an entry only if its key contains CRM_META "_"
  *
  * \param[in]     key        Entry name (string)
  * \param[in]     value      Entry value (string)
  * \param[in,out] user_data  Destination hash table receiving duplicated strings
  */
 static void
 copy_meta_keys(gpointer key, gpointer value, gpointer user_data)
 {
     const char *name = key;
 
     if (strstr(name, CRM_META "_") == NULL) {
         /* Not a meta attribute, so nothing to copy */
         return;
     }
 
     g_hash_table_replace(user_data, strdup(name), strdup((const char *)value));
 }
 
 /*!
  * \internal
  * \brief Drop one recurring operation from a resource's cached history
  *
  * An entry matches when its interval, resource ID and operation type all
  * equal those of \p op. Only the first match is removed and freed.
  *
  * \param[in,out] history  Resource history to modify
  * \param[in]     op       Operation to remove
  *
  * \return TRUE if the operation was found and removed, FALSE otherwise
  */
 static gboolean
 history_remove_recurring_op(rsc_history_t *history, const lrmd_event_data_t *op)
 {
     GList *node = history->recurring_op_list;
 
     while (node != NULL) {
         lrmd_event_data_t *candidate = node->data;
 
         if ((op->interval != candidate->interval)
             || (crm_str_eq(op->rsc_id, candidate->rsc_id, TRUE) == FALSE)
             || (safe_str_eq(op->op_type, candidate->op_type) == FALSE)) {
             node = node->next;
             continue;
         }
 
         /* Unlink first, then release the event the link pointed at */
         history->recurring_op_list = g_list_delete_link(history->recurring_op_list, node);
         lrmd_free_event(candidate);
         return TRUE;
     }
 
     return FALSE;
 }
 
 /*!
  * \internal
  * \brief Release every recurring operation cached for a resource
  *
  * Frees each stored event, then the list itself, and leaves the list
  * pointer set to NULL.
  *
  * \param[in,out] history  Resource history to modify
  */
 static void
 history_free_recurring_ops(rsc_history_t *history)
 {
     GList *node = history->recurring_op_list;
 
     while (node != NULL) {
         lrmd_free_event(node->data);
         node = node->next;
     }
 
     g_list_free(history->recurring_op_list);
     history->recurring_op_list = NULL;
 }
 
 /*!
  * \internal
  * \brief Free resource history
  *
  * \param[in,out] data  Resource history entry (rsc_history_t *) to free;
  *                      a NULL pointer is ignored, as with free()
  *
  * \note The argument is an untyped gpointer, presumably so the function can
  *       be installed as a GLib destroy callback (confirm against the table
  *       creation code).
  */
 void
 history_free(gpointer data)
 {
     rsc_history_t *history = (rsc_history_t*)data;
 
     if (history == NULL) {
         return;
     }
 
     if (history->stop_params) {
         g_hash_table_destroy(history->stop_params);
     }
 
     /* Don't need to free history->rsc.id because it's set to history->id */
     free(history->rsc.type);
     free(history->rsc.class);
     free(history->rsc.provider);
 
     lrmd_free_event(history->failed);
     lrmd_free_event(history->last);
     free(history->id);
     history_free_recurring_ops(history);
     free(history);
 }
 
 /*!
  * \internal
  * \brief Record the result of an operation in the per-resource history cache
  *
  * Depending on the operation, this purges the resource's status from the
  * CIB, creates a cache entry, stores the operation as the last failure or
  * last non-recurring result, and maintains the list of recurring operations.
  *
  * \param[in,out] lrm_state  LRM state whose resource_history table is updated
  * \param[in]     rsc        Resource details used when a new entry must be
  *                           created (may be NULL, in which case no entry is
  *                           created)
  * \param[in]     op         Operation result to record
  */
 static void
 update_history_cache(lrm_state_t * lrm_state, lrmd_rsc_info_t * rsc, lrmd_event_data_t * op)
 {
     int target_rc = 0;
     rsc_history_t *entry = NULL;
 
     /* A deleted resource has no history to keep: remove its status instead */
     if (op->rsc_deleted) {
         crm_debug("Purged history for '%s' after %s", op->rsc_id, op->op_type);
         delete_rsc_status(lrm_state, op->rsc_id, cib_quorum_override, NULL);
         return;
     }
 
     /* Notifications are never cached */
     if (safe_str_eq(op->op_type, RSC_NOTIFY)) {
         return;
     }
 
     crm_debug("Updating history for '%s' with %s op", op->rsc_id, op->op_type);
 
     entry = g_hash_table_lookup(lrm_state->resource_history, op->rsc_id);
     if (entry == NULL && rsc) {
         /* First result seen for this resource: create its cache entry.
          * entry->id doubles as the hash table key and as entry->rsc.id */
         entry = calloc(1, sizeof(rsc_history_t));
         entry->id = strdup(op->rsc_id);
         g_hash_table_insert(lrm_state->resource_history, entry->id, entry);
 
         entry->rsc.id = entry->id;
         entry->rsc.type = strdup(rsc->type);
         entry->rsc.class = strdup(rsc->class);
         if (rsc->provider) {
             entry->rsc.provider = strdup(rsc->provider);
         } else {
             entry->rsc.provider = NULL;
         }
 
     } else if (entry == NULL) {
         crm_info("Resource %s no longer exists, not updating cache", op->rsc_id);
         return;
     }
 
     entry->last_callid = op->call_id;
     target_rc = rsc_op_expected_rc(op);
     if (op->op_status == PCMK_LRM_OP_CANCELLED) {
         if (op->interval > 0) {
             /* A cancelled recurring op is simply forgotten; nothing else in
              * the entry changes */
             crm_trace("Removing cancelled recurring op: %s_%s_%d", op->rsc_id, op->op_type,
                       op->interval);
             history_remove_recurring_op(entry, op);
             return;
         } else {
             crm_trace("Skipping %s_%s_%d rc=%d, status=%d", op->rsc_id, op->op_type, op->interval,
                       op->rc, op->op_status);
         }
 
     } else if (did_rsc_op_fail(op, target_rc)) {
         /* We must store failed monitors here
          * - otherwise the block below will cause them to be forgotten when a stop happens
          */
         if (entry->failed) {
             lrmd_free_event(entry->failed);
         }
         entry->failed = lrmd_copy_event(op);
 
     } else if (op->interval == 0) {
         /* Successful non-recurring op: it becomes the resource's last result */
         if (entry->last) {
             lrmd_free_event(entry->last);
         }
         entry->last = lrmd_copy_event(op);
 
         /* Start, reload and status ops refresh the saved stop parameters,
          * which hold only the entries accepted by copy_instance_keys() */
         if (op->params &&
             (safe_str_eq(CRMD_ACTION_START, op->op_type) ||
              safe_str_eq("reload", op->op_type) ||
              safe_str_eq(CRMD_ACTION_STATUS, op->op_type))) {
 
             if (entry->stop_params) {
                 g_hash_table_destroy(entry->stop_params);
             }
             entry->stop_params = g_hash_table_new_full(crm_str_hash,
                                                        g_str_equal, g_hash_destroy_str,
                                                        g_hash_destroy_str);
 
             g_hash_table_foreach(op->params, copy_instance_keys, entry->stop_params);
         }
     }
 
     if (op->interval > 0) {
         /* Ensure there are no duplicates */
         history_remove_recurring_op(entry, op);
 
         crm_trace("Adding recurring op: %s_%s_%d", op->rsc_id, op->op_type, op->interval);
         entry->recurring_op_list = g_list_prepend(entry->recurring_op_list, lrmd_copy_event(op));
 
     } else if (entry->recurring_op_list && safe_str_eq(op->op_type, RSC_STATUS) == FALSE) {
         /* Any non-recurring op other than RSC_STATUS discards the cached
          * recurring operations */
         crm_trace("Dropping %d recurring ops because of: %s_%s_%d",
                   g_list_length(entry->recurring_op_list), op->rsc_id,
                   op->op_type, op->interval);
         history_free_recurring_ops(entry);
     }
 }
 
 /*!
  * \internal
  * \brief Acknowledge a resource task directly with a successful result
  *
  * Constructs an operation for the task, marks it as completed with
  * PCMK_OCF_OK, sends it as a direct ack and frees it again.
  *
  * \param[in] lrm_state  LRM connection
  * \param[in] input      Input message being ack'ed
  * \param[in] rsc_id     ID of affected resource
  * \param[in] rsc        Affected resource (if available)
  * \param[in] task       Operation task being ack'ed
  * \param[in] ack_host   Name of host to send ack to
  * \param[in] ack_sys    IPC system name to ack
  */
 static void
 send_task_ok_ack(lrm_state_t *lrm_state, ha_msg_input_t *input,
                  const char *rsc_id, lrmd_rsc_info_t *rsc, const char *task,
                  const char *ack_host, const char *ack_sys)
 {
     lrmd_event_data_t *ack = NULL;
 
     ack = construct_op(lrm_state, input->xml, rsc_id, task);
     CRM_ASSERT(ack != NULL);
 
     /* Report the task as done and successful */
     ack->rc = PCMK_OCF_OK;
     ack->op_status = PCMK_LRM_OP_DONE;
 
     send_direct_ack(ack_host, ack_sys, rsc, ack, rsc_id);
     lrmd_free_event(ack);
 }
 
 /*!
  * \brief Handle an event delivered by an lrmd connection
  *
  * A disconnect event for the local node is passed to
  * lrm_connection_destroy(). Execution results are handed to
  * process_lrm_event(). Every other event is ignored.
  *
  * \param[in] op  Event received (ignored if NULL)
  */
 void
 lrm_op_callback(lrmd_event_data_t * op)
 {
     const char *nodename = NULL;
     lrm_state_t *lrm_state = NULL;
 
     CRM_CHECK(op != NULL, return);
 
     /* Events without a remote node name belong to the local connection */
     if (op->remote_nodename) {
         nodename = op->remote_nodename;
     } else {
         nodename = fsa_our_uname;
     }
 
     if ((op->type == lrmd_event_disconnect) && safe_str_eq(nodename, fsa_our_uname)) {
         /* The local lrmd ipc connection went down: update the crmd's
          * connection bits accordingly */
         lrm_connection_destroy();
         return;
     }
 
     if (op->type != lrmd_event_exec_complete) {
         /* Only execution results need further processing */
         return;
     }
 
     lrm_state = lrm_state_find(nodename);
     CRM_ASSERT(lrm_state != NULL);
 
     process_lrm_event(lrm_state, op, NULL);
 }
 
 /*	 A_LRM_CONNECT	*/
 /*!
  * \brief FSA action handler that connects to or disconnects from the local LRM
  *
  * Only the local lrmd connection is handled here. Remote connections are
  * treated as resources within the pengine and are connected and
  * disconnected differently.
  *
  * \param[in] action         Action bits; A_LRM_DISCONNECT and/or A_LRM_CONNECT
  *                           are honoured, anything else is reported as an error
  * \param[in] cause          FSA cause (not read directly here)
  * \param[in] cur_state      Current FSA state, passed to the stop verification
  * \param[in] current_input  FSA input (not read directly here)
  * \param[in] msg_data       FSA data (not read directly here; NOTE(review):
  *                           the FSA helper macros may reference it -- confirm)
  */
 void
 do_lrm_control(long long action,
                enum crmd_fsa_cause cause,
                enum crmd_fsa_state cur_state,
                enum crmd_fsa_input current_input, fsa_data_t * msg_data)
 {
     lrm_state_t *lrm_state = NULL;
 
     if (fsa_our_uname == NULL) {
         /* Nothing to do */
         return;
     }
 
     lrm_state = lrm_state_find_or_create(fsa_our_uname);
     if (lrm_state == NULL) {
         register_fsa_error(C_FSA_INTERNAL, I_ERROR, NULL);
         return;
     }
 
     if (action & A_LRM_DISCONNECT) {
         /* When disconnecting is the only requested action, stall until
          * the stop verification succeeds */
         if ((lrm_state_verify_stopped(lrm_state, cur_state, LOG_INFO) == FALSE)
             && (action == A_LRM_DISCONNECT)) {
             crmd_fsa_stall(FALSE);
             return;
         }
 
         clear_bit(fsa_input_register, R_LRM_CONNECTED);
         crm_info("Disconnecting from the LRM");
         lrm_state_disconnect(lrm_state);
         lrm_state_reset_tables(lrm_state);
         crm_notice("Disconnected from the LRM");
     }
 
     if (action & A_LRM_CONNECT) {
         int ret = pcmk_ok;
 
         crm_debug("Connecting to the LRM");
         ret = lrm_state_ipc_connect(lrm_state);
 
         if (ret != pcmk_ok) {
             if (lrm_state->num_lrm_register_fails < MAX_LRM_REG_FAILS) {
                 /* Still below the limit: start the wait timer and stall */
                 crm_warn("Failed to sign on to the LRM %d"
                          " (%d max) times", lrm_state->num_lrm_register_fails, MAX_LRM_REG_FAILS);
 
                 crm_timer_start(wait_timer);
                 crmd_fsa_stall(FALSE);
                 return;
             }
 
             /* Limit reached: give up and raise an error */
             crm_err("Failed to sign on to the LRM %d" " (max) times",
                     lrm_state->num_lrm_register_fails);
             register_fsa_error(C_FSA_INTERNAL, I_ERROR, NULL);
             return;
         }
 
         set_bit(fsa_input_register, R_LRM_CONNECTED);
         crm_info("LRM connection established");
     }
 
     if (action & ~(A_LRM_CONNECT | A_LRM_DISCONNECT)) {
         crm_err("Unexpected action %s in %s", fsa_action2string(action), __FUNCTION__);
     }
 }
 
 /*!
  * \internal
  * \brief Check for pending operations and active resources before disconnecting
  *
  * Recurring operations are removed from the pending table via
  * stop_recurring_actions() (only while the LRM is connected), remaining
  * non-recurring operations are counted, and any resources that still look
  * active are logged.
  *
  * \param[in,out] lrm_state  LRM state to inspect
  * \param[in]     cur_state  Current FSA state
  * \param[in]     log_level  Level for pending-operation messages (overridden
  *                           with LOG_ERR when \p cur_state is S_TERMINATE)
  *
  * \return FALSE only when non-recurring operations are still pending, the
  *         state is not S_TERMINATE and R_SENT_RSC_STOP is set; TRUE otherwise
  */
 static gboolean
 lrm_state_verify_stopped(lrm_state_t * lrm_state, enum crmd_fsa_state cur_state, int log_level)
 {
     int counter = 0;
     gboolean rc = TRUE;
     const char *when = "lrm disconnect";
 
     GHashTableIter gIter;
     const char *key = NULL;
     rsc_history_t *entry = NULL;
     struct recurring_op_s *pending = NULL;
 
     crm_debug("Checking for active resources before exit");
 
     if (cur_state == S_TERMINATE) {
         log_level = LOG_ERR;
         when = "shutdown";
 
     } else if (is_set(fsa_input_register, R_SHUTDOWN)) {
         when = "shutdown... waiting";
     }
 
     /* Recurring operations can only be stopped while still connected */
     if (lrm_state->pending_ops && lrm_state_is_connected(lrm_state) == TRUE) {
         guint removed = g_hash_table_foreach_remove(
             lrm_state->pending_ops, stop_recurring_actions, lrm_state);
         guint nremaining = g_hash_table_size(lrm_state->pending_ops);
 
         if (removed || nremaining) {
             crm_notice("Stopped %u recurring operations at %s (%u operations remaining)",
                        removed, when, nremaining);
         }
     }
 
     if (lrm_state->pending_ops) {
         g_hash_table_iter_init(&gIter, lrm_state->pending_ops);
         while (g_hash_table_iter_next(&gIter, NULL, (void **)&pending)) {
             /* Ignore recurring actions in the shutdown calculations */
             if (pending->interval == 0) {
                 counter++;
             }
         }
     }
 
     if (counter > 0) {
         do_crm_log(log_level, "%d pending LRM operations at %s", counter, when);
 
         /* Either list the pending actions and report success, or report
          * failure so the caller can wait */
         if (cur_state == S_TERMINATE || !is_set(fsa_input_register, R_SENT_RSC_STOP)) {
             g_hash_table_iter_init(&gIter, lrm_state->pending_ops);
             while (g_hash_table_iter_next(&gIter, (gpointer*)&key, (gpointer*)&pending)) {
                 do_crm_log(log_level, "Pending action: %s (%s)", key, pending->op_key);
             }
 
         } else {
             rc = FALSE;
         }
         return rc;
     }
 
     if (lrm_state->resource_history == NULL) {
         return rc;
     }
 
     if (cur_state == S_TERMINATE || is_set(fsa_input_register, R_SHUTDOWN)) {
         /* At this point we're not waiting, we're just shutting down */
         when = "shutdown";
     }
 
     /* Reuse the counter, this time for resources that still look active */
     counter = 0;
     g_hash_table_iter_init(&gIter, lrm_state->resource_history);
     while (g_hash_table_iter_next(&gIter, NULL, (gpointer*)&entry)) {
         if (is_rsc_active(lrm_state, entry->id) == FALSE) {
             continue;
         }
 
         counter++;
         crm_trace("Found %s active", entry->id);
         if (lrm_state->pending_ops) {
             GHashTableIter hIter;
 
             /* Report every pending operation that belongs to this resource */
             g_hash_table_iter_init(&hIter, lrm_state->pending_ops);
             while (g_hash_table_iter_next(&hIter, (gpointer*)&key, (gpointer*)&pending)) {
                 if (crm_str_eq(entry->id, pending->rsc_id, TRUE)) {
                     crm_notice("%sction %s (%s) incomplete at %s",
                                pending->interval == 0 ? "A" : "Recurring a",
                                key, pending->op_key, when);
                 }
             }
         }
     }
 
     if (counter) {
         crm_err("%d resources were active at %s.", counter, when);
     }
 
     return rc;
 }
 
 /* Cache of agent metadata keyed by "<class>::<provider>:<type>"; created
  * lazily by get_rsc_metadata() */
 GHashTable *metadata_hash = NULL;
 
 /*!
  * \internal
  * \brief Get the metadata of a resource agent, using the cache when allowed
  *
  * \param[in] type      Agent type (must not be NULL)
  * \param[in] rclass    Agent class (must not be NULL)
  * \param[in] provider  Agent provider; "heartbeat" is used when NULL
  * \param[in] force     If true, skip the cache lookup and query the LRM
  *
  * \return Metadata string, or NULL if it could not be obtained.
  *         NOTE(review): the returned pointer is the one stored in
  *         metadata_hash, whose value destructor is g_hash_destroy_str, so
  *         callers presumably must not free it -- confirm.
  */
 static char *
 get_rsc_metadata(const char *type, const char *rclass, const char *provider, bool force)
 {
     int rc = pcmk_ok;
     int len = 0;
     char *key = NULL;
     char *metadata = NULL;
 
     /* Always use a local connection for this operation */
     lrm_state_t *lrm_state = lrm_state_find(fsa_our_uname);
 
     CRM_CHECK(type != NULL, return NULL);
     CRM_CHECK(rclass != NULL, return NULL);
     CRM_CHECK(lrm_state != NULL, return NULL);
 
     if (provider == NULL) {
         provider = "heartbeat";
     }
 
     if (metadata_hash == NULL) {
         metadata_hash = g_hash_table_new_full(crm_str_hash, g_str_equal, g_hash_destroy_str, g_hash_destroy_str);
     }
 
     /* Three separator characters ("::" and ":") plus the terminating NUL */
     len = strlen(type) + strlen(rclass) + strlen(provider) + 4;
     key = malloc(len);
     if(key == NULL) {
         return NULL;
     }
 
     snprintf(key, len, "%s::%s:%s", rclass, provider, type);
     if(force == FALSE) {
         metadata = g_hash_table_lookup(metadata_hash, key);
         if (metadata) {
             crm_trace("Retrieved cached metadata for %s", key);
         }
     }
 
     if(metadata == NULL) {
         rc = lrm_state_get_metadata(lrm_state, rclass, provider, type, &metadata, 0);
         if(rc == pcmk_ok) {
             crm_trace("Retrieved live metadata for %s", key);
             CRM_LOG_ASSERT(metadata != NULL);
             /* The table takes over the key, so forget it here to keep the
              * free() below from releasing it */
             g_hash_table_insert(metadata_hash, key, metadata);
             key = NULL;
         } else {
             crm_trace("No metadata found for %s: %s" CRM_XS " rc=%d",
                      key, pcmk_strerror(rc), rc);
             CRM_CHECK(metadata == NULL, metadata = NULL);
         }
     }
 
     /* No-op when the key was handed to the table above */
     free(key);
     return metadata;
 }
 
 /*!
  * \internal
  * \brief List the agent parameters whose metadata attribute matches a criteria
  *
  * Walks the <parameter> children of the metadata's "parameters" element.
  * A parameter is accepted when the truth value of its \p criteria attribute
  * equals \p target. For the "private" criteria, as long as no parameter
  * declares that attribute, a few well-known names (password, passwd, user)
  * are treated as if they were marked.
  *
  * \param[in]     op              Operation whose parameters supply the values
  * \param[in]     metadata        Parsed agent metadata
  * \param[in,out] result          If not NULL, receives name=value attributes
  * \param[in]     criteria        Metadata attribute to test (e.g. "unique")
  * \param[in]     target          Truth value the attribute must have
  * \param[in]     invert_for_xml  If true, \p result receives the parameters
  *                                that were NOT accepted into the list
  *
  * \return Newly allocated string holding each accepted name surrounded by
  *         spaces (caller frees), or NULL if nothing was accepted
  */
 static char *
 build_parameter_list(lrmd_event_data_t *op, xmlNode *metadata, xmlNode *result,
                      const char *criteria, bool target, bool invert_for_xml)
 {
     int len = 0;
     int max = 0;
     char *list = NULL;
 
     xmlNode *param = NULL;
     xmlNode *params = NULL;
 
     const char *secure_terms[] = {
         "password",
         "passwd",
         "user",
     };
 
     if(safe_str_eq("private", criteria)) {
         /* It will take time for the agents to be updated
          * Check for some common terms
          */
         max = DIMOF(secure_terms);
     }
 
     params = find_xml_node(metadata, "parameters", TRUE);
     for (param = __xml_first_child(params); param != NULL; param = __xml_next(param)) {
         if (crm_str_eq((const char *)param->name, "parameter", TRUE)) {
             bool accept = FALSE;
             const char *name = crm_element_value(param, "name");
             const char *value = crm_element_value(param, criteria);
 
             if(max && value) {
                 /* Turn off the compatibility logic once an agent has been updated to know about 'private' */
                 max = 0;
             }
 
             if (name == NULL) {
                 /* A nameless parameter can be neither listed nor looked up;
                  * skip it so NULL never reaches the log format strings or
                  * the hash table lookup below */
                 crm_err("Invalid parameter in %s metadata", op->rsc_id);
                 continue;
 
             } else if(target == crm_is_true(value)) {
                 accept = TRUE;
 
             } else if(max) {
                 int lpc = 0;
                 bool found = FALSE;
 
                 for(lpc = 0; found == FALSE && lpc < max; lpc++) {
                     if(safe_str_eq(secure_terms[lpc], name)) {
                         found = TRUE;
                     }
                 }
 
                 if(found == target) {
                     accept = TRUE;
                 }
             }
 
             if(accept) {
                 int start = len;
 
                 crm_trace("Attr %s is %s%s", name, target?"":"not ", criteria);
 
                 /* Each entry is " name ": the name plus two spaces, with one
                  * extra byte reserved for the terminating NUL */
                 len += strlen(name) + 2;
                 list = realloc_safe(list, len + 1);
                 sprintf(list + start, " %s ", name);
 
             } else {
                 crm_trace("Rejecting %s for %s", name, criteria);
             }
 
             if(invert_for_xml) {
                 crm_trace("Inverting %s match for %s xml", name, criteria);
                 accept = !accept;
             }
 
             if(result && accept) {
                 value = g_hash_table_lookup(op->params, name);
 
                 if(value != NULL) {
                     char *summary = crm_versioned_param_summary(op->versioned_params, name);
 
                     /* Prefer the versioned summary when one is available */
                     if (summary) {
                         crm_trace("Adding attr %s=%s to the xml result", name, summary);
                         crm_xml_add(result, name, summary);
                         free(summary);
                     } else {
                         crm_trace("Adding attr %s=%s to the xml result", name, value);
                         crm_xml_add(result, name, value);
                     }
                 }
             }
         }
     }
 
     return list;
 }
 
 /*!
  * \internal
  * \brief Check whether agent metadata advertises a given action
  *
  * \param[in] metadata  Parsed agent metadata
  * \param[in] name      Action name to look for
  *
  * \return TRUE if an <action> child of the "actions" element has a matching
  *         "name" attribute, FALSE otherwise
  */
 static bool
 resource_supports_action(xmlNode *metadata, const char *name) 
 {
     xmlNode *actions = find_xml_node(metadata, "actions", TRUE);
     xmlNode *child = __xml_first_child(actions);
 
     while (child != NULL) {
         if (crm_str_eq((const char *)child->name, "action", TRUE)) {
             const char *action_name = crm_element_value(child, "name");
 
             if (safe_str_eq(name, action_name)) {
                 return TRUE;
             }
         }
         child = __xml_next(child);
     }
 
     return FALSE;
 }
 
 /*!
  * \internal
  * \brief Add the force-restart parameter list and its digest to an update
  *
  * Nothing is added for recurring operations or for agents whose metadata
  * does not advertise a "reload" action.
  *
  * \param[in]     op        Operation being recorded
  * \param[in]     metadata  Parsed agent metadata
  * \param[in,out] update    XML element receiving the two attributes
  * \param[in]     version   Version passed to the digest calculation
  */
 static void
 append_restart_list(lrmd_event_data_t *op, xmlNode *metadata, xmlNode * update, const char *version)
 {
     char *list = NULL;
     char *digest = NULL;
     xmlNode *restart = NULL;
     const char *restart_names = NULL;
 
     CRM_LOG_ASSERT(op->params != NULL);
 
     if (op->interval > 0) {
         /* monitors are not reloadable */
         return;
     }
 
     if (!resource_supports_action(metadata, "reload")) {
         /* Resource does not support reloads */
         return;
     }
 
     restart = create_xml_node(NULL, XML_TAG_PARAMS);
     /* Any parameters with unique="1" should be added into the "op-force-restart" list. */
     list = build_parameter_list(op, metadata, restart, "unique", TRUE, FALSE);
 
     /* The list is NULL when no parameter matched; use an empty string for
      * both the attribute and the trace message so NULL is never passed to %s */
     restart_names = list ? list : "";
 
     digest = calculate_operation_digest(restart, version);
     /* Add "op-force-restart" and "op-restart-digest" to indicate the resource supports reload,
      * no matter if it actually supports any parameters with unique="1"). */
     crm_xml_add(update, XML_LRM_ATTR_OP_RESTART, restart_names);
     crm_xml_add(update, XML_LRM_ATTR_RESTART_DIGEST, digest);
 
     crm_trace("%s: %s, %s", op->rsc_id, digest, restart_names);
     crm_log_xml_trace(restart, "restart digest source");
 
     free_xml(restart);
     free(digest);
     free(list);
 }
 
 /*!
  * \internal
  * \brief Add the list of private parameters and a matching digest to an update
  *
  * Nothing is added when no parameter qualifies as private.
  *
  * \param[in]     op        Operation being recorded
  * \param[in]     metadata  Parsed agent metadata
  * \param[in,out] update    XML element receiving the two attributes
  * \param[in]     version   Version passed to the digest calculation
  */
 static void
 append_secure_list(lrmd_event_data_t *op, xmlNode *metadata, xmlNode * update, const char *version)
 {
     char *digest = NULL;
     char *list = NULL;
     xmlNode *secure = NULL;
 
     CRM_LOG_ASSERT(op->params != NULL);
 
     /*
      * XML_LRM_ATTR_OP_SECURE should stay short, so it names the secure
      * parameters, whereas XML_LRM_ATTR_SECURE_DIGEST is computed from the
      * insecure ones (hence the inverted XML collection below)
      */
     secure = create_xml_node(NULL, XML_TAG_PARAMS);
     list = build_parameter_list(op, metadata, secure, "private", TRUE, TRUE);
 
     if (list == NULL) {
         crm_trace("%s: no secure parameters", op->rsc_id);
 
     } else {
         digest = calculate_operation_digest(secure, version);
         crm_xml_add(update, XML_LRM_ATTR_OP_SECURE, list);
         crm_xml_add(update, XML_LRM_ATTR_SECURE_DIGEST, digest);
 
         crm_trace("%s: %s, %s", op->rsc_id, digest, list);
         crm_log_xml_trace(secure, "secure digest source");
     }
 
     /* digest is still NULL here when nothing was listed */
     free_xml(secure);
     free(digest);
     free(list);
 }
 
 /*!
  * \internal
  * \brief Add the XML describing an operation result beneath a parent element
  *
  * Besides the basic operation update, restart and secure digests are
  * appended when the resource and operation parameters are known, the
  * operation is not a stop, and agent metadata can be obtained.
  *
  * \param[in,out] parent  XML element to add the operation to
  * \param[in]     rsc     Resource the operation belongs to (may be NULL)
  * \param[in]     op      Operation result (may be NULL)
  * \param[in]     src     Origin label passed to create_operation_update()
  *
  * \return FALSE if \p op is NULL, TRUE otherwise (even when no digests or no
  *         operation XML could be added)
  */
 static gboolean
 build_operation_update(xmlNode * parent, lrmd_rsc_info_t * rsc, lrmd_event_data_t * op,
                        const char *src)
 {
     int target_rc = 0;
     xmlNode *xml_op = NULL;
     xmlNode *metadata = NULL;
     const char *m_string = NULL;
     const char *caller_version = NULL;
 
     if (op == NULL) {
         return FALSE;
     }
 
     target_rc = rsc_op_expected_rc(op);
 
     /* there is a small risk in formerly mixed clusters that it will
      * be sub-optimal.
      *
      * however with our upgrade policy, the update we send should
      * still be completely supported anyway
      */
     if (op->params != NULL) {
         /* The parameter table may be absent (see the check further down),
          * so only consult it when it exists */
         caller_version = g_hash_table_lookup(op->params, XML_ATTR_CRM_VERSION);
     }
     CRM_LOG_ASSERT(caller_version != NULL);
 
     if(caller_version == NULL) {
         caller_version = CRM_FEATURE_SET;
     }
 
     crm_trace("Building %s operation update with originator version: %s", op->rsc_id, caller_version);
     xml_op = create_operation_update(parent, op, caller_version, target_rc, fsa_our_uname, src, LOG_DEBUG);
     if (xml_op == NULL) {
         return TRUE;
     }
 
     if (rsc == NULL || op->params == NULL || crm_str_eq(CRMD_ACTION_STOP, op->op_type, TRUE)) {
         /* Stopped resources don't need the digest logic */
         crm_trace("No digests needed for %s %p %p %s", op->rsc_id, op->params, rsc, op->op_type);
         return TRUE;
     }
 
     /* A start operation forces a fresh metadata query instead of the cache */
     m_string = get_rsc_metadata(rsc->type, rsc->class, rsc->provider, safe_str_eq(op->op_type, RSC_START));
     if(m_string == NULL) {
         crm_err("No metadata for %s::%s:%s", rsc->class, rsc->provider, rsc->type);
         return TRUE;
     }
 
     metadata = string2xml(m_string);
     if(metadata == NULL) {
         crm_err("Metadata for %s::%s:%s is not valid XML", rsc->class, rsc->provider, rsc->type);
         return TRUE;
     }
 
     crm_trace("Including additional digests for %s::%s:%s", rsc->class, rsc->provider, rsc->type);
     append_restart_list(op, metadata, xml_op, caller_version);
     append_secure_list(op, metadata, xml_op, caller_version);
 
     free_xml(metadata);
     return TRUE;
 }
 
 /*!
  * \internal
  * \brief Judge from cached history whether a resource should be treated as active
  *
  * \param[in] lrm_state  LRM state holding the resource history
  * \param[in] rsc_id     ID of the resource to check
  *
  * \return FALSE if the resource has no cached last operation, or if that
  *         operation indicates it is not running; TRUE otherwise
  */
 static gboolean
 is_rsc_active(lrm_state_t * lrm_state, const char *rsc_id)
 {
     rsc_history_t *history = g_hash_table_lookup(lrm_state->resource_history, rsc_id);
 
     if ((history == NULL) || (history->last == NULL)) {
         return FALSE;
     }
 
     crm_trace("Processing %s: %s.%d=%d",
               rsc_id, history->last->op_type, history->last->interval, history->last->rc);
 
     /* A successful stop means the resource is down */
     if ((history->last->rc == PCMK_OCF_OK)
         && safe_str_eq(history->last->op_type, CRMD_ACTION_STOP)) {
         return FALSE;
     }
 
     /* A successful migrate is treated the same way; a stricter check is
      * too complex and is left to the PE */
     if ((history->last->rc == PCMK_OCF_OK)
         && safe_str_eq(history->last->op_type, CRMD_ACTION_MIGRATE)) {
         return FALSE;
     }
 
     if (history->last->rc == PCMK_OCF_NOT_RUNNING) {
         return FALSE;
     }
 
     /* Badly configured resources can't be reliably stopped */
     if ((history->last->interval == 0) && (history->last->rc == PCMK_OCF_NOT_CONFIGURED)) {
         return FALSE;
     }
 
     return TRUE;
 }
 
 /*!
  * \internal
  * \brief Describe every cached resource and its recorded operations in XML
  *
  * For each entry in the resource history a resource element is created
  * under \p rsc_list, followed by its failed, last and recurring operations.
  *
  * \param[in]     lrm_state  LRM state holding the resource history
  * \param[in,out] rsc_list   XML element receiving one child per resource
  *
  * \return Always FALSE
  */
 static gboolean
 build_active_RAs(lrm_state_t * lrm_state, xmlNode * rsc_list)
 {
     GHashTableIter history_iter;
     rsc_history_t *history = NULL;
 
     g_hash_table_iter_init(&history_iter, lrm_state->resource_history);
     while (g_hash_table_iter_next(&history_iter, NULL, (void **)&history)) {
         GList *recurring = NULL;
         const char *container = NULL;
         xmlNode *xml_rsc = create_xml_node(rsc_list, XML_LRM_TAG_RESOURCE);
 
         crm_xml_add(xml_rsc, XML_ATTR_ID, history->id);
         crm_xml_add(xml_rsc, XML_ATTR_TYPE, history->rsc.type);
         crm_xml_add(xml_rsc, XML_AGENT_ATTR_CLASS, history->rsc.class);
         crm_xml_add(xml_rsc, XML_AGENT_ATTR_PROVIDER, history->rsc.provider);
 
         /* The container, if any, is recorded in the last operation's parameters */
         if ((history->last != NULL) && (history->last->params != NULL)) {
             container = g_hash_table_lookup(history->last->params, CRM_META"_"XML_RSC_ATTR_CONTAINER);
         }
         if (container != NULL) {
             crm_trace("Resource %s is a part of container resource %s", history->id, container);
             crm_xml_add(xml_rsc, XML_RSC_ATTR_CONTAINER, container);
         }
 
         build_operation_update(xml_rsc, &(history->rsc), history->failed, __FUNCTION__);
         build_operation_update(xml_rsc, &(history->rsc), history->last, __FUNCTION__);
 
         recurring = history->recurring_op_list;
         while (recurring != NULL) {
             build_operation_update(xml_rsc, &(history->rsc), recurring->data, __FUNCTION__);
             recurring = recurring->next;
         }
     }
 
     return FALSE;
 }
 
 /*!
  * \internal
  * \brief Build a node state update containing the LRM's cached resource history
  *
  * \param[in] lrm_state     LRM state to describe
  * \param[in] update_flags  Flags passed to create_node_state_update()
  *
  * \return Newly created node state XML, or NULL if the peer for the LRM
  *         state's node name could not be found
  */
 static xmlNode *
 do_lrm_query_internal(lrm_state_t *lrm_state, int update_flags)
 {
     crm_node_t *peer = crm_get_peer_full(0, lrm_state->node_name, CRM_GET_PEER_ANY);
     xmlNode *xml_state = NULL;
     xmlNode *lrm_xml = NULL;
     xmlNode *resources_xml = NULL;
 
     CRM_CHECK(peer != NULL, return NULL);
 
     xml_state = create_node_state_update(peer, update_flags, NULL,
                                          __FUNCTION__);
 
     lrm_xml = create_xml_node(xml_state, XML_CIB_TAG_LRM);
     crm_xml_add(lrm_xml, XML_ATTR_ID, peer->uuid);
 
     /* Build a list of active (not always running) resources */
     resources_xml = create_xml_node(lrm_xml, XML_LRM_TAG_RESOURCES);
     build_active_RAs(lrm_state, resources_xml);
 
     crm_log_xml_trace(xml_state, "Current state of the LRM");
 
     return xml_state;
 }
 
 /*!
  * \brief Build the node state XML describing a node's LRM history
  *
  * \param[in] is_replace  Not used by this function
  * \param[in] node_name   Name of the node whose LRM state should be queried
  *
  * \return Newly created node state XML with the join state and expected
  *         state forced to member, or NULL if the LRM state is unknown or the
  *         state XML could not be built
  */
 xmlNode *
 do_lrm_query(gboolean is_replace, const char *node_name)
 {
     lrm_state_t *lrm_state = lrm_state_find(node_name);
     xmlNode *xml_state;
 
     if (!lrm_state) {
         crm_err("Could not query lrm state for lrmd node %s", node_name);
         return NULL;
     }
     xml_state = do_lrm_query_internal(lrm_state,
                                       node_update_cluster|node_update_peer);
     if (xml_state == NULL) {
         /* do_lrm_query_internal() returns NULL when the peer lookup fails;
          * there is nothing to annotate in that case */
         return NULL;
     }
 
     /* In case this function is called to generate a join confirmation to
      * send to the DC, force the current and expected join state to member.
      * This isn't necessary for newer DCs but is backward compatible.
      */
     crm_xml_add(xml_state, XML_NODE_JOIN_STATE, CRMD_JOINSTATE_MEMBER);
     crm_xml_add(xml_state, XML_NODE_EXPECTED, CRMD_JOINSTATE_MEMBER);
 
     return xml_state;
 }
 
 /*!
  * \internal
  * \brief Tell the requester whether a resource deletion succeeded
  *
  * Sends a direct ack for a delete operation to the system and host named in
  * the request. If the request did not come from CRM_SYSTEM_TENGINE, the
  * "last-lrm-refresh" attribute is also updated with the current time.
  *
  * \param[in] lrm_state  LRM state the resource belonged to
  * \param[in] input      Original deletion request
  * \param[in] rsc_id     ID of the resource
  * \param[in] rc         Deletion result (pcmk_ok on success)
  */
 static void
 notify_deleted(lrm_state_t * lrm_state, ha_msg_input_t * input, const char *rsc_id, int rc)
 {
     const char *from_sys = crm_element_value(input->msg, F_CRM_SYS_FROM);
     const char *from_host = crm_element_value(input->msg, F_CRM_HOST_FROM);
     lrmd_event_data_t *ack = NULL;
 
     crm_info("Notifying %s on %s that %s was%s deleted",
              from_sys, from_host, rsc_id, rc == pcmk_ok ? "" : " not");
 
     ack = construct_op(lrm_state, input->xml, rsc_id, CRMD_ACTION_DELETE);
     CRM_ASSERT(ack != NULL);
 
     if (rc != pcmk_ok) {
         ack->op_status = PCMK_LRM_OP_ERROR;
         ack->rc = PCMK_OCF_UNKNOWN_ERROR;
     } else {
         ack->op_status = PCMK_LRM_OP_DONE;
         ack->rc = PCMK_OCF_OK;
     }
 
     send_direct_ack(from_host, from_sys, NULL, ack, rsc_id);
     lrmd_free_event(ack);
 
     if (safe_str_neq(from_sys, CRM_SYSTEM_TENGINE)) {
         /* this isn't expected - trigger a new transition */
         time_t now = time(NULL);
         char *timestamp = crm_itoa(now);
 
         crm_debug("Triggering a refresh after %s deleted %s from the LRM", from_sys, rsc_id);
 
         update_attr_delegate(fsa_cib_conn, cib_none, XML_CIB_TAG_CRMCONFIG, NULL, NULL, NULL, NULL,
                              "last-lrm-refresh", timestamp, FALSE, NULL, NULL);
 
         free(timestamp);
     }
 }
 
 /*
  * g_hash_table_foreach_remove() worker for the pending-deletion table.
  *
  * user_data is a struct delete_event_s describing a finished deletion.  For
  * every pending deletion of the same resource the requester is notified and
  * TRUE is returned so the entry gets dropped; other entries are kept.
  */
 static gboolean
 lrm_remove_deleted_rsc(gpointer key, gpointer value, gpointer user_data)
 {
     struct pending_deletion_op_s *op = value;
     struct delete_event_s *event = user_data;
 
     if (!crm_str_eq(event->rsc, op->rsc, TRUE)) {
         return FALSE;
     }
 
     notify_deleted(event->lrm_state, op->input, event->rsc, event->rc);
     return TRUE;
 }
 
 /*
  * g_hash_table_foreach_remove() worker for the pending-operations table.
  *
  * user_data is the id of a deleted resource; every pending operation that
  * belongs to it is logged and reported for removal (TRUE).
  */
 static gboolean
 lrm_remove_deleted_op(gpointer key, gpointer value, gpointer user_data)
 {
     struct recurring_op_s *pending = value;
     const char *rsc = user_data;
     gboolean same_rsc = crm_str_eq(rsc, pending->rsc_id, TRUE);
 
     if (same_rsc) {
         crm_info("Removing op %s:%d for deleted resource %s",
                  pending->op_key, pending->call_id, rsc);
     }
     return same_rsc ? TRUE : FALSE;
 }
 
 /*
  * Remove the rsc from the CIB
  *
  * Avoids refreshing the entire LRM section of this host
  */
 #define rsc_template "//"XML_CIB_TAG_STATE"[@uname='%s']//"XML_LRM_TAG_RESOURCE"[@id='%s']"
 
 /*
  * Delete one resource's status section from the CIB using an XPath query.
  *
  * lrm_state    - supplies the node name used in the query
  * rsc_id       - resource whose status is removed; must not be NULL
  * call_options - CIB call options; cib_xpath is always added
  * user_name    - passed through to cib_internal_op()
  *
  * Returns -ENXIO when rsc_id is NULL, otherwise the cib_internal_op() result.
  */
 static int
 delete_rsc_status(lrm_state_t * lrm_state, const char *rsc_id, int call_options,
                   const char *user_name)
 {
     char *rsc_xpath = NULL;
     size_t max = 0;
     int rc = pcmk_ok;
 
     CRM_CHECK(rsc_id != NULL, return -ENXIO);
 
     /* The template's two "%s" sequences leave spare room beyond the NUL */
     max = strlen(rsc_template) + strlen(rsc_id) + strlen(lrm_state->node_name) + 1;
     rsc_xpath = calloc(1, max);
 
     /* Do not hand a failed allocation to snprintf() */
     CRM_ASSERT(rsc_xpath != NULL);
     snprintf(rsc_xpath, max, rsc_template, lrm_state->node_name, rsc_id);
 
     rc = cib_internal_op(fsa_cib_conn, CIB_OP_DELETE, NULL, rsc_xpath,
                          NULL, NULL, call_options | cib_xpath, user_name);
 
     free(rsc_xpath);
     return rc;
 }
 
 /*
  * Forget a resource after a deletion attempt and notify interested parties.
  *
  * lrm_state - state of the node the resource lives on
  * input     - original request, or NULL when there is nobody to ack
  * rsc_id    - id of the resource; must not be NULL
  * rsc_gIter - when non-NULL, an iterator positioned on the resource's
  *             history entry, which is removed through the iterator
  * rc        - result of the deletion; the local caches and the CIB status
  *             are only cleaned up when it is pcmk_ok
  * user_name - passed through to the CIB delete
  *
  * Requesters waiting in lrm_state->deletion_ops for this resource are
  * notified and removed regardless of rc.
  */
 static void
 delete_rsc_entry(lrm_state_t * lrm_state, ha_msg_input_t * input, const char *rsc_id,
                  GHashTableIter * rsc_gIter, int rc, const char *user_name)
 {
     struct delete_event_s event;
     char *rsc_id_copy = NULL;
 
     CRM_CHECK(rsc_id != NULL, return);
 
     /* Removing the history entry below may release the storage rsc_id
      * points to (callers pass the entry's own id when iterating), so work on
      * a private copy for the whole function, not just for the cleanup. */
     rsc_id_copy = strdup(rsc_id);
     CRM_ASSERT(rsc_id_copy != NULL);
 
     if (rc == pcmk_ok) {
         if (rsc_gIter) {
             g_hash_table_iter_remove(rsc_gIter);
         } else {
             g_hash_table_remove(lrm_state->resource_history, rsc_id_copy);
         }
         /* rsc_id must not be dereferenced past this point */
 
         crm_debug("sync: Sending delete op for %s", rsc_id_copy);
         delete_rsc_status(lrm_state, rsc_id_copy, cib_quorum_override, user_name);
 
         g_hash_table_foreach_remove(lrm_state->pending_ops, lrm_remove_deleted_op, rsc_id_copy);
     }
 
     if (input) {
         notify_deleted(lrm_state, input, rsc_id_copy, rc);
     }
 
     event.rc = rc;
     event.rsc = rsc_id_copy;
     event.lrm_state = lrm_state;
     g_hash_table_foreach_remove(lrm_state->deletion_ops, lrm_remove_deleted_rsc, &event);
 
     free(rsc_id_copy);
 }
 
 /*
  * Remove the op from the CIB
  *
  * Avoids refreshing the entire LRM section of this host
  */
 
 #define op_template "//"XML_CIB_TAG_STATE"[@uname='%s']//"XML_LRM_TAG_RESOURCE"[@id='%s']/"XML_LRM_TAG_RSC_OP"[@id='%s']"
 #define op_call_template "//"XML_CIB_TAG_STATE"[@uname='%s']//"XML_LRM_TAG_RESOURCE"[@id='%s']/"XML_LRM_TAG_RSC_OP"[@id='%s' and @"XML_LRM_ATTR_CALLID"='%d']"
 
 /*
  * Ask the CIB to delete the recorded result of one operation.
  *
  * Two ways of identifying the entry are supported:
  *  - op != NULL: an XML description (call id, transition key and, for
  *    recurring operations, the operation key as id) is sent as the object to
  *    delete from the status section;
  *  - op == NULL: rsc_id and key (plus call_id when it is positive) are
  *    turned into an XPath expression under this node's state.
  *
  * With neither form available an error is logged and nothing is sent.
  */
 static void
 delete_op_entry(lrm_state_t * lrm_state, lrmd_event_data_t * op, const char *rsc_id,
                 const char *key, int call_id)
 {
     xmlNode *xml_top = NULL;
 
     if (op == NULL && (rsc_id == NULL || key == NULL)) {
         crm_err("Not enough information to delete op entry: rsc=%p key=%p", rsc_id, key);
         return;
     }
 
     if (op != NULL) {
         xml_top = create_xml_node(NULL, XML_LRM_TAG_RSC_OP);
         crm_xml_add_int(xml_top, XML_LRM_ATTR_CALLID, op->call_id);
         crm_xml_add(xml_top, XML_ATTR_TRANSITION_KEY, op->user_data);
 
         if (op->interval > 0) {
             /* Avoid deleting last_failure too (if it was a result of this recurring op failing) */
             char *recurring_id = generate_op_key(op->rsc_id, op->op_type, op->interval);
 
             crm_xml_add(xml_top, XML_ATTR_ID, recurring_id);
             free(recurring_id);
         }
 
         crm_debug("async: Sending delete op for %s_%s_%d (call=%d)",
                   op->rsc_id, op->op_type, op->interval, op->call_id);
 
         fsa_cib_conn->cmds->delete(fsa_cib_conn, XML_CIB_TAG_STATUS, xml_top, cib_quorum_override);
 
     } else {
         char *op_xpath = NULL;
         /* Space needed by the substituted values, whichever template is used */
         int max = strlen(rsc_id) + strlen(lrm_state->node_name) + strlen(key);
 
         if (call_id > 0) {
             /* extra room for the decimal call id */
             max += strlen(op_call_template) + 10;
             op_xpath = calloc(1, max);
             snprintf(op_xpath, max, op_call_template, lrm_state->node_name, rsc_id, key, call_id);
 
         } else {
             max += strlen(op_template) + 1;
             op_xpath = calloc(1, max);
             snprintf(op_xpath, max, op_template, lrm_state->node_name, rsc_id, key);
         }
 
         crm_debug("sync: Sending delete op for %s (call=%d)", rsc_id, call_id);
         fsa_cib_conn->cmds->delete(fsa_cib_conn, op_xpath, NULL, cib_quorum_override | cib_xpath);
 
         free(op_xpath);
     }
 
     crm_log_xml_trace(xml_top, "op:cancel");
     free_xml(xml_top);
 }
 
 /*
  * Forget the last recorded failure of a resource.
  *
  * For every known lrm state (or only the one whose node name equals
  * node_name, when node_name is not NULL) the resource's "last_failure"
  * entry is deleted from the CIB and the cached failed event of matching
  * history entries is freed.
  */
 void
 lrm_clear_last_failure(const char *rsc_id, const char *node_name)
 {
     GList *all_states = lrm_state_get_list();
     char *failure_key = generate_op_key(rsc_id, "last_failure", 0);
     GList *item = NULL;
 
     /* This clears last failure for every lrm state that has this rsc.*/
     for (item = all_states; item != NULL; item = item->next) {
         lrm_state_t *lrm_state = item->data;
         rsc_history_t *entry = NULL;
         GHashTableIter history_iter;
 
         /* filter by node_name if node_name is present */
         if (node_name != NULL && strcmp(node_name, lrm_state->node_name) != 0) {
             continue;
         }
 
         delete_op_entry(lrm_state, NULL, rsc_id, failure_key, 0);
 
         if (lrm_state->resource_history == NULL) {
             continue;
         }
 
         g_hash_table_iter_init(&history_iter, lrm_state->resource_history);
         while (g_hash_table_iter_next(&history_iter, NULL, (void **)&entry)) {
             if (!crm_str_eq(rsc_id, entry->id, TRUE)) {
                 continue;
             }
             lrmd_free_event(entry->failed);
             entry->failed = NULL;
         }
     }
 
     free(failure_key);
     g_list_free(all_states);
 }
 
 /* Returns: gboolean - cancellation is in progress */
 /*
  * Cancel one pending operation of a resource.
  *
  * lrm_state - state holding the pending_ops table
  * rsc_id    - resource the operation belongs to; must not be NULL
  * key       - key of the operation in pending_ops, or NULL to derive it
  *             from rsc_id and op with make_stop_id()
  * op        - call id of the operation; must not be 0
  * remove    - when TRUE, flag the pending entry for removal
  *
  * Returns TRUE only when the cancellation request was accepted
  * (lrm_state_cancel() returned pcmk_ok).  FALSE covers: nothing pending
  * under that key, already cancelled, or nothing to cancel.
  */
 static gboolean
 cancel_op(lrm_state_t * lrm_state, const char *rsc_id, const char *key, int op, gboolean remove)
 {
     gboolean in_progress = FALSE;
     char *local_key = NULL;
     struct recurring_op_s *pending = NULL;
 
     CRM_CHECK(op != 0, return FALSE);
     CRM_CHECK(rsc_id != NULL, return FALSE);
 
     if (key == NULL) {
         local_key = make_stop_id(rsc_id, op);
         key = local_key;
     }
 
     pending = g_hash_table_lookup(lrm_state->pending_ops, key);
     if (pending == NULL) {
         crm_info("No pending op found for %s", key);
         goto done;
     }
 
     if (remove && pending->remove == FALSE) {
         pending->remove = TRUE;
         crm_debug("Scheduling %s for removal", key);
     }
 
     if (pending->cancelled) {
         crm_debug("Operation %s already cancelled", key);
         goto done;
     }
     pending->cancelled = TRUE;
 
     crm_debug("Cancelling op %d for %s (%s)", op, rsc_id, key);
     if (lrm_state_cancel(lrm_state, pending->rsc_id, pending->op_type,
                          pending->interval) == pcmk_ok) {
         crm_debug("Op %d for %s (%s): cancelled", op, rsc_id, key);
         in_progress = TRUE;
 
     } else {
         crm_debug("Op %d for %s (%s): Nothing to cancel", op, rsc_id, key);
         /* The caller needs to make sure the entry is
          * removed from the pending_ops list
          *
          * Usually by returning TRUE inside the worker function
          * supplied to g_hash_table_foreach_remove()
          *
          * Not removing the entry from pending_ops will block
          * the node from shutting down
          */
     }
 
   done:
     /* key may alias local_key, so it is released only after the last use */
     free(local_key);
     return in_progress;
 }
 
 /* Context handed to cancel_action_by_key() while cancel_op_key() walks the
  * pending operations table. */
 struct cancel_data {
     gboolean done;              /* set to TRUE once an op with a matching key was seen */
     gboolean remove;            /* forwarded to cancel_op() as its "remove" argument */
     const char *key;            /* operation key compared against each entry's op_key */
     lrmd_rsc_info_t *rsc;       /* resource whose id is passed to cancel_op() */
     lrm_state_t *lrm_state;     /* lrm state passed to cancel_op() */
 };
 
 /*
  * g_hash_table_foreach_remove() worker used by cancel_op_key().
  *
  * Entries whose op_key differs from the requested key are left alone.  For
  * a match, the search is marked as done and the operation is cancelled; the
  * entry is reported for removal exactly when cancel_op() says that no
  * cancellation is in progress.
  */
 static gboolean
 cancel_action_by_key(gpointer key, gpointer value, gpointer user_data)
 {
     struct recurring_op_s *op = (struct recurring_op_s *)value;
     struct cancel_data *data = user_data;
 
     if (!crm_str_eq(op->op_key, data->key, TRUE)) {
         return FALSE;
     }
 
     data->done = TRUE;
     return !cancel_op(data->lrm_state, data->rsc->id, key, op->call_id, data->remove);
 }
 
 /*
  * Cancel every pending operation whose op_key equals key.
  *
  * rsc and key must not be NULL (FALSE is returned otherwise).  Entries for
  * which no cancellation is in progress are dropped from pending_ops.
  *
  * Returns TRUE when at least one matching pending operation was found.
  */
 static gboolean
 cancel_op_key(lrm_state_t * lrm_state, lrmd_rsc_info_t * rsc, const char *key, gboolean remove)
 {
     struct cancel_data data;
     guint removed = 0;
 
     CRM_CHECK(rsc != NULL, return FALSE);
     CRM_CHECK(key != NULL, return FALSE);
 
     data.lrm_state = lrm_state;
     data.rsc = rsc;
     data.key = key;
     data.remove = remove;
     data.done = FALSE;
 
     removed = g_hash_table_foreach_remove(lrm_state->pending_ops, cancel_action_by_key, &data);
     crm_trace("Removed %u op cache entries, new size: %u",
               removed, g_hash_table_size(lrm_state->pending_ops));
 
     return data.done;
 }
 
 /*
  * Look up a resource in the LRM, optionally registering it first.
  *
  * resource  - XML describing the resource (id, long id, class, provider,
  *             type)
  * op_msg    - not used by this function
  * do_create - when TRUE and the resource is unknown under both its id and
  *             its long id, register it and look it up again
  *
  * Returns the resource information, or NULL when the resource has no id,
  * is unknown and not to be created, lacks class/type, or could not be
  * found after registration.
  */
 static lrmd_rsc_info_t *
 get_lrm_resource(lrm_state_t * lrm_state, xmlNode * resource, xmlNode * op_msg, gboolean do_create)
 {
     const char *id = ID(resource);
     const char *long_id = crm_element_value(resource, XML_ATTR_ID_LONG);
     const char *class = crm_element_value(resource, XML_AGENT_ATTR_CLASS);
     const char *provider = crm_element_value(resource, XML_AGENT_ATTR_PROVIDER);
     const char *type = crm_element_value(resource, XML_ATTR_TYPE);
     lrmd_rsc_info_t *rsc = NULL;
 
     crm_trace("Retrieving %s from the LRM.", id);
     CRM_CHECK(id != NULL, return NULL);
 
     rsc = lrm_state_get_rsc_info(lrm_state, id, 0);
     if (rsc == NULL && long_id != NULL) {
         rsc = lrm_state_get_rsc_info(lrm_state, long_id, 0);
     }
 
     if (rsc != NULL || !do_create) {
         return rsc;
     }
 
     CRM_CHECK(class != NULL, return NULL);
     CRM_CHECK(type != NULL, return NULL);
 
     crm_trace("Adding rsc %s before operation", id);
 
     lrm_state_register_rsc(lrm_state, id, class, provider, type, lrmd_opt_drop_recurring);
 
     rsc = lrm_state_get_rsc_info(lrm_state, id, 0);
     if (rsc == NULL) {
         /* NOTE(review): looks unused, but register_fsa_error() is presumably
          * a macro that refers to a variable of this name - confirm before
          * removing */
         fsa_data_t *msg_data = NULL;
 
         crm_err("Could not add resource %s to LRM %s", id, lrm_state->node_name);
         /* only register this as a internal error if this involves the local
          * lrmd. Otherwise we're likely dealing with an unresponsive remote-node
          * which is not a FSA failure. */
         if (lrm_state_is_local(lrm_state) == TRUE) {
             register_fsa_error(C_FSA_INTERNAL, I_FAIL, NULL);
         }
     }
 
     return rsc;
 }
 
 /*
  * Remove a resource from the LRM and clean up everything recorded for it.
  *
  * id         - resource id used for logging, unregistering and cleanup
  * rsc        - resource information; unregistering only happens when this
  *              is non-NULL and unregister is TRUE
  * gIter      - optional history iterator, forwarded to delete_rsc_entry()
  * sys, host, user - origin of the request, used for logging (user is also
  *              forwarded to delete_rsc_entry())
  * request    - original request or NULL; when the unregistration is still
  *              in progress a copy is parked in lrm_state->deletion_ops
  * unregister - whether the resource should be unregistered from the LRM
  */
 static void
 delete_resource(lrm_state_t * lrm_state,
                 const char *id,
                 lrmd_rsc_info_t * rsc,
                 GHashTableIter * gIter,
                 const char *sys,
                 const char *host,
                 const char *user,
                 ha_msg_input_t * request,
                 gboolean unregister)
 {
     int rc = pcmk_ok;
 
     crm_info("Removing resource %s for %s (%s) on %s", id, sys, user ? user : "internal", host);
 
     if (rsc && unregister) {
         rc = lrm_state_unregister_rsc(lrm_state, id, 0);
     }
 
     if (rc == -EINPROGRESS) {
         /* The outcome is not known yet: remember who asked and stop here */
         crm_info("Deletion of resource '%s' pending", id);
         if (request) {
             char *ref = crm_element_value_copy(request->msg, XML_ATTR_REFERENCE);
             struct pending_deletion_op_s *op = calloc(1, sizeof(struct pending_deletion_op_s));
 
             op->rsc = strdup(rsc->id);
             op->input = copy_ha_msg_input(request);
             g_hash_table_insert(lrm_state->deletion_ops, ref, op);
         }
         return;
     }
 
     if (rc == pcmk_ok) {
         crm_trace("Resource '%s' deleted", id);
     } else {
         crm_warn("Deletion of resource '%s' for %s (%s) on %s failed: %d",
                  id, sys, user ? user : "internal", host, rc);
     }
 
     delete_rsc_entry(lrm_state, request, id, gIter, rc, user);
 }
 
 /*
  * Pick a call id for a synthesized (fake) operation result.
  *
  * Without an lrm state, or without a history entry for rsc_id, a large
  * fixed value is returned.  Otherwise the id following the entry's
  * last_callid is used, falling back to 1 when that would be negative.
  */
 static int
 get_fake_call_id(lrm_state_t *lrm_state, const char *rsc_id)
 {
     int call_id = 999999999;
     rsc_history_t *entry = NULL;
 
     if(lrm_state) {
         entry = g_hash_table_lookup(lrm_state->resource_history, rsc_id);
     }
 
     /* Make sure the call id is greater than the last successful operation,
      * otherwise the failure will not result in a possible recovery of the resource
      * as it could appear the failure occurred before the successful start */
     if (entry) {
         /* Increment in unsigned arithmetic: a signed "+ 1" on the largest
          * int is undefined behavior, whereas the unsigned sum is well defined
          * and converts back to a negative value that the check below
          * catches (assumes last_callid is an int - TODO confirm) */
         call_id = (int) ((unsigned int) entry->last_callid + 1U);
     }
 
     if (call_id < 0) {
         call_id = 1;
     }
     return call_id;
 }
 
 /*
  * Drop everything known about the resources of one node so that their
  * status gets detected again.
  *
  * Every entry of the node's resource history is deleted; entries that are
  * remote connection resources first trigger the same procedure for the
  * remote node they connect to.  Afterwards the node's LRM status is erased
  * from the CIB and the "probed" attribute is deleted in attrd.
  */
 static void
 force_reprobe(lrm_state_t *lrm_state, const char *from_sys, const char *from_host, const char *user_name, gboolean is_remote_node)
 {
     GHashTableIter history_iter;
     rsc_history_t *entry = NULL;
 
     crm_info("clearing resource history on node %s", lrm_state->node_name);
 
     g_hash_table_iter_init(&history_iter, lrm_state->resource_history);
     while (g_hash_table_iter_next(&history_iter, NULL, (void **)&entry)) {
         /* only unregister the resource during a reprobe if it is not a remote connection
          * resource. otherwise unregistering the connection will terminate remote-node
          * membership */
         gboolean unregister = TRUE;
 
         if (is_remote_lrmd_ra(NULL, NULL, entry->id)) {
             lrm_state_t *remote_lrm_state = lrm_state_find(entry->id);
 
             unregister = FALSE;
             if (remote_lrm_state != NULL) {
                 /* when forcing a reprobe, make sure to clear remote node before
                  * clearing the remote node's connection resource */
                 force_reprobe(remote_lrm_state, from_sys, from_host, user_name, TRUE);
             }
         }
 
         delete_resource(lrm_state, entry->id, &entry->rsc, &history_iter, from_sys, from_host,
                         user_name, NULL, unregister);
     }
 
     /* Now delete the copy in the CIB */
     erase_status_tag(lrm_state->node_name, XML_CIB_TAG_LRM, cib_scope_local);
 
     /* And finally, _delete_ the value in attrd
      * Setting it to FALSE results in the PE sending us back here again
      */
     update_attrd(lrm_state->node_name, CRM_OP_PROBED, NULL, user_name, is_remote_node);
 }
 
 /*
  * Record a made-up result for an action that could not be handed to the
  * lrmd.
  *
  * lrm_state - state of the target node, or NULL when there is none; with a
  *             state the fake event goes through process_lrm_event(),
  *             without one the resource status is updated directly
  * action    - XML of the action; needs a resource child and a task
  * rc        - result code to report (notify actions always report success)
  *
  * NOTE(review): lrm_state is handed to construct_op() even when it is NULL;
  * confirm that construct_op() copes with that for every operation.
  */
 static void
 synthesize_lrmd_failure(lrm_state_t *lrm_state, xmlNode *action, int rc) 
 {
     lrmd_event_data_t *op = NULL;
     const char *operation = crm_element_value(action, XML_LRM_ATTR_TASK);
     const char *target_node = crm_element_value(action, XML_LRM_ATTR_TARGET);
     xmlNode *xml_rsc = find_xml_node(action, XML_CIB_TAG_RESOURCE, TRUE);
 
     if (xml_rsc == NULL) {
         /* @TODO Should we do something else, like direct ack? */
         crm_info("Skipping %s=%d on %s (%p): no resource",
                  crm_element_value(action, XML_LRM_ATTR_TASK_KEY), rc, target_node, lrm_state);
         return;
     }
 
     if (operation == NULL) {
         /* This probably came from crm_resource -C, nothing to do */
         crm_info("Skipping %s=%d on %s (%p): no operation",
                  crm_element_value(action, XML_ATTR_TRANSITION_KEY), rc, target_node, lrm_state);
         return;
     }
 
     op = construct_op(lrm_state, action, ID(xml_rsc), operation);
     CRM_ASSERT(op != NULL);
 
     op->call_id = get_fake_call_id(lrm_state, op->rsc_id);
     if (!safe_str_eq(operation, RSC_NOTIFY)) {
         op->op_status = PCMK_LRM_OP_ERROR;
         op->rc = rc;
 
     } else {
         /* Notifications can't fail yet */
         op->op_status = PCMK_LRM_OP_DONE;
         op->rc = PCMK_OCF_OK;
     }
     op->t_run = time(NULL);
     op->t_rcchange = op->t_run;
 
     crm_info("Faking result %d for %s_%s_%d on %s (%p)", op->rc, op->rsc_id, op->op_type, op->interval, target_node, lrm_state);
 
     if (lrm_state != NULL) {
         process_lrm_event(lrm_state, op, NULL);
 
     } else {
         /* No lrm state to process the event: describe the resource from
          * the action XML and update its status directly */
         lrmd_rsc_info_t fake_rsc;
 
         fake_rsc.id = strdup(op->rsc_id);
         fake_rsc.type = crm_element_value_copy(xml_rsc, XML_ATTR_TYPE);
         fake_rsc.class = crm_element_value_copy(xml_rsc, XML_AGENT_ATTR_CLASS);
         fake_rsc.provider = crm_element_value_copy(xml_rsc, XML_AGENT_ATTR_PROVIDER);
 
         do_update_resource(target_node, &fake_rsc, op);
 
         free(fake_rsc.id);
         free(fake_rsc.type);
         free(fake_rsc.class);
         free(fake_rsc.provider);
     }
     lrmd_free_event(op);
 }
 
 
 /*	 A_LRM_INVOKE	*/
 /*
  * FSA action handler for requests addressed to the LRM.
  *
  * The request is taken from msg_data.  Its target node (taken from the
  * request XML, defaulting to the local node) selects the lrm state to work
  * on; a request for a remote node without an lrm state is recorded as a
  * failed action.  Depending on the CRM task and the requested operation
  * this then:
  *  - fakes a failure of a resource (CRM_OP_LRM_FAIL),
  *  - refreshes or returns the LRM status (CRM_OP_LRM_REFRESH / _QUERY),
  *  - sets the "probed" attribute or forces a re-probe,
  *  - cancels an operation, deletes a resource, or executes an operation
  *    on a resource.
  * Anything else is registered as an internal FSA error.
  */
 void
 do_lrm_invoke(long long action,
               enum crmd_fsa_cause cause,
               enum crmd_fsa_state cur_state,
               enum crmd_fsa_input current_input, fsa_data_t * msg_data)
 {
     gboolean create_rsc = TRUE;
     lrm_state_t *lrm_state = NULL;
     const char *crm_op = NULL;
     const char *from_sys = NULL;
     const char *from_host = NULL;
     const char *operation = NULL;
     ha_msg_input_t *input = fsa_typed_data(fsa_dt_ha_msg);
     const char *user_name = NULL;
     const char *target_node = NULL;
     gboolean is_remote_node = FALSE;
     gboolean crm_rsc_delete = FALSE;
 
     if (input->xml != NULL) {
         /* Remote node operations are routed here to their remote connections */
         target_node = crm_element_value(input->xml, XML_LRM_ATTR_TARGET);
     }
     if (target_node == NULL) {
         target_node = fsa_our_uname;
     } else if (safe_str_neq(target_node, fsa_our_uname)) {
         is_remote_node = TRUE;
     }
 
     lrm_state = lrm_state_find(target_node);
 
     if (lrm_state == NULL && is_remote_node) {
         crm_err("no lrmd connection for remote node %s found on cluster node %s. Can not process request.",
             target_node, fsa_our_uname);
 
         /* The action must be recorded here and in the CIB as failed */
         synthesize_lrmd_failure(NULL, input->xml, PCMK_OCF_CONNECTION_DIED);
         return;
     }
 
     CRM_ASSERT(lrm_state != NULL);
 
 #if ENABLE_ACL
     user_name = crm_acl_get_set_user(input->msg, F_CRM_USER, NULL);
     crm_trace("LRM command from user '%s'", user_name);
 #endif
 
     crm_op = crm_element_value(input->msg, F_CRM_TASK);
     from_sys = crm_element_value(input->msg, F_CRM_SYS_FROM);
     if (safe_str_neq(from_sys, CRM_SYSTEM_TENGINE)) {
         from_host = crm_element_value(input->msg, F_CRM_HOST_FROM);
     }
 
     crm_trace("LRM command from: %s", from_sys);
 
     /* First pass: work out which operation is requested.  A request to fail
      * a resource is handled completely within this chain. */
     if (safe_str_eq(crm_op, CRM_OP_LRM_DELETE)) {
         /* remember this delete op came from crm_resource */
         crm_rsc_delete = TRUE;
         operation = CRMD_ACTION_DELETE;
 
     } else if (safe_str_eq(crm_op, CRM_OP_LRM_REFRESH)) {
         operation = CRM_OP_LRM_REFRESH;
 
     } else if (safe_str_eq(crm_op, CRM_OP_LRM_FAIL)) {
         lrmd_event_data_t *op = NULL;
         lrmd_rsc_info_t *rsc = NULL;
         xmlNode *xml_rsc = find_xml_node(input->xml, XML_CIB_TAG_RESOURCE, TRUE);
 
         CRM_CHECK(xml_rsc != NULL, return);
 
         /* The lrmd can not fail a resource, it does not understand the
          * concept of success or failure in relation to a resource, it simply
          * executes operations and reports the results. We determine what a failure is.
          * Because of this, if we want to fail a resource we have to fake what we
          * understand a failure to look like.
          *
          * To do this we create a fake lrmd operation event for the resource
          * we want to fail.  We then pass that event to the lrmd client callback
          * so it will be processed as if it actually came from the lrmd. */
         op = construct_op(lrm_state, input->xml, ID(xml_rsc), "asyncmon");
         CRM_ASSERT(op != NULL);
 
         free((char *)op->user_data);
         op->user_data = NULL;
         op->call_id = get_fake_call_id(lrm_state, op->rsc_id);
         op->interval = 0;
         op->op_status = PCMK_LRM_OP_DONE;
         op->rc = PCMK_OCF_UNKNOWN_ERROR;
         op->t_run = time(NULL);
         op->t_rcchange = op->t_run;
 
 #if ENABLE_ACL
         if (user_name && is_privileged(user_name) == FALSE) {
             crm_err("%s does not have permission to fail %s", user_name, ID(xml_rsc));
             send_direct_ack(from_host, from_sys, NULL, op, ID(xml_rsc));
             lrmd_free_event(op);
             return;
         }
 #endif
 
         rsc = get_lrm_resource(lrm_state, xml_rsc, input->xml, create_rsc);
         if (rsc) {
             crm_info("Failing resource %s...", rsc->id);
             process_lrm_event(lrm_state, op, NULL);
             /* The fake failure has been processed; the ack sent below
              * reports that the request itself succeeded */
             op->op_status = PCMK_LRM_OP_DONE;
             op->rc = PCMK_OCF_OK;
             lrmd_free_rsc_info(rsc);
         } else {
             crm_info("Cannot find/create resource in order to fail it...");
             crm_log_xml_warn(input->msg, "bad input");
         }
 
         send_direct_ack(from_host, from_sys, NULL, op, ID(xml_rsc));
         lrmd_free_event(op);
         return;
 
     } else if (input->xml != NULL) {
         operation = crm_element_value(input->xml, XML_LRM_ATTR_TASK);
     }
 
     /* Second pass: carry out the request */
     if (safe_str_eq(crm_op, CRM_OP_LRM_REFRESH)) {
         int rc = pcmk_ok;
         xmlNode *fragment = do_lrm_query_internal(lrm_state, node_update_all);
 
         fsa_cib_update(XML_CIB_TAG_STATUS, fragment, cib_quorum_override, rc, user_name);
         crm_info("Forced a local LRM refresh: call=%d", rc);
 
         if(strcmp(CRM_SYSTEM_CRMD, from_sys) != 0) {
             xmlNode *reply = create_request(
                 CRM_OP_INVOKE_LRM, fragment,
                 from_host, from_sys, CRM_SYSTEM_LRMD, fsa_our_uuid);
 
             crm_debug("ACK'ing refresh from %s (%s)", from_sys, from_host);
 
             if (relay_message(reply, TRUE) == FALSE) {
                 crm_log_xml_err(reply, "Unable to route reply");
             }
             free_xml(reply);
         }
 
         free_xml(fragment);
 
     } else if (safe_str_eq(crm_op, CRM_OP_LRM_QUERY)) {
         xmlNode *data = do_lrm_query_internal(lrm_state, node_update_all);
         xmlNode *reply = create_reply(input->msg, data);
 
         if (relay_message(reply, TRUE) == FALSE) {
             crm_err("Unable to route reply");
             crm_log_xml_err(reply, "reply");
         }
         free_xml(reply);
         free_xml(data);
 
     } else if (safe_str_eq(operation, CRM_OP_PROBED)) {
         update_attrd(lrm_state->node_name, CRM_OP_PROBED, XML_BOOLEAN_TRUE, user_name, is_remote_node);
 
     } else if (safe_str_eq(operation, CRM_OP_REPROBE) || safe_str_eq(crm_op, CRM_OP_REPROBE)) {
         crm_notice("Forcing the status of all resources to be redetected");
 
         force_reprobe(lrm_state, from_sys, from_host, user_name, is_remote_node);
 
         /* NOTE(review): this condition used to repeat the very same
          * comparison twice; a second subsystem was presumably meant to be
          * excluded as well - confirm which one */
         if(strcmp(CRM_SYSTEM_TENGINE, from_sys) != 0) {
             xmlNode *reply = create_request(
                 CRM_OP_INVOKE_LRM, NULL,
                 from_host, from_sys, CRM_SYSTEM_LRMD, fsa_our_uuid);
 
             crm_debug("ACK'ing re-probe from %s (%s)", from_sys, from_host);
 
             if (relay_message(reply, TRUE) == FALSE) {
                 crm_log_xml_err(reply, "Unable to route reply");
             }
             free_xml(reply);
         }
 
     } else if (operation != NULL) {
         lrmd_rsc_info_t *rsc = NULL;
         xmlNode *params = NULL;
         xmlNode *xml_rsc = find_xml_node(input->xml, XML_CIB_TAG_RESOURCE, TRUE);
 
         CRM_CHECK(xml_rsc != NULL, return);
 
         params = find_xml_node(input->xml, XML_TAG_ATTRS, TRUE);
 
         /* A resource that is about to be deleted is never created first */
         if (safe_str_eq(operation, CRMD_ACTION_DELETE)) {
             create_rsc = FALSE;
         }
 
         if(lrm_state_is_connected(lrm_state) == FALSE) {
             synthesize_lrmd_failure(lrm_state, input->xml, PCMK_OCF_CONNECTION_DIED);
             return;
         }
 
         rsc = get_lrm_resource(lrm_state, xml_rsc, input->xml, create_rsc);
         if (rsc == NULL && create_rsc) {
             crm_err("Invalid resource definition for %s", ID(xml_rsc));
             crm_log_xml_warn(input->msg, "bad input");
 
             /* if the operation couldn't complete because we can't register
              * the resource, return a generic error */
             synthesize_lrmd_failure(lrm_state, input->xml, PCMK_OCF_NOT_CONFIGURED);
 
         } else if (rsc == NULL) {
             crm_notice("Not creating resource for a %s event: %s", operation, ID(input->xml));
             delete_rsc_entry(lrm_state, input, ID(xml_rsc), NULL, pcmk_ok, user_name);
 
             /* Deleting something that does not exist is a success */
             send_task_ok_ack(lrm_state, input, ID(xml_rsc), NULL, operation,
                              from_host, from_sys);
 
         } else if (safe_str_eq(operation, CRMD_ACTION_CANCEL)) {
             char *op_key = NULL;
             char *meta_key = NULL;
             int call = 0;
             const char *call_id = NULL;
             const char *op_task = NULL;
             const char *op_interval = NULL;
             gboolean in_progress = FALSE;
 
             CRM_CHECK(params != NULL, crm_log_xml_warn(input->xml, "Bad command");
                       lrmd_free_rsc_info(rsc); return);
 
             meta_key = crm_meta_name(XML_LRM_ATTR_INTERVAL);
             op_interval = crm_element_value(params, meta_key);
             free(meta_key);
 
             meta_key = crm_meta_name(XML_LRM_ATTR_TASK);
             op_task = crm_element_value(params, meta_key);
             free(meta_key);
 
             meta_key = crm_meta_name(XML_LRM_ATTR_CALLID);
             call_id = crm_element_value(params, meta_key);
             free(meta_key);
 
             CRM_CHECK(op_task != NULL, crm_log_xml_warn(input->xml, "Bad command");
                       lrmd_free_rsc_info(rsc); return);
             CRM_CHECK(op_interval != NULL, crm_log_xml_warn(input->xml, "Bad command");
                       lrmd_free_rsc_info(rsc); return);
 
             op_key = generate_op_key(rsc->id, op_task, crm_parse_int(op_interval, "0"));
 
             crm_debug("PE requested op %s (call=%s) be cancelled",
                       op_key, call_id ? call_id : "NA");
             call = crm_parse_int(call_id, "0");
             if (call == 0) {
                 /* the normal case when the PE cancels a recurring op */
                 in_progress = cancel_op_key(lrm_state, rsc, op_key, TRUE);
 
             } else {
                 /* the normal case when the PE cancels an orphan op */
                 in_progress = cancel_op(lrm_state, rsc->id, NULL, call, TRUE);
             }
 
             /* Acknowledge the cancellation operation if it's for a remote connection resource */
             if (in_progress == FALSE || is_remote_lrmd_ra(NULL, NULL, rsc->id)) {
                 char *op_id = make_stop_id(rsc->id, call);
 
                 if (is_remote_lrmd_ra(NULL, NULL, rsc->id) == FALSE) {
                     crm_info("Nothing known about operation %d for %s", call, op_key);
                 }
                 delete_op_entry(lrm_state, NULL, rsc->id, op_key, call);
                 send_task_ok_ack(lrm_state, input, rsc->id, rsc, op_task,
                                  from_host, from_sys);
 
                 /* needed at least for cancellation of a remote operation */
                 g_hash_table_remove(lrm_state->pending_ops, op_id);
                 free(op_id);
 
             } else {
                 /* No ack is needed since abcdaa8, but peers with older versions
                  * in a rolling upgrade need one. We didn't bump the feature set
                  * at that commit, so we can only compare against the previous
                  * CRM version (3.0.8). If any peers have feature set 3.0.9 but
                  * not abcdaa8, they will time out waiting for the ack (no
                  * released versions of Pacemaker are affected).
                  */
                 const char *peer_version = crm_element_value(params, XML_ATTR_CRM_VERSION);
 
                 if (compare_version(peer_version, "3.0.8") <= 0) {
                     crm_info("Sending compatibility ack for %s cancellation to %s (CRM version %s)",
                              op_key, from_host, peer_version);
                     send_task_ok_ack(lrm_state, input, rsc->id, rsc, op_task,
                                      from_host, from_sys);
                 }
             }
 
             free(op_key);
 
         } else if (safe_str_eq(operation, CRMD_ACTION_DELETE)) {
             gboolean unregister = TRUE;
 
 #if ENABLE_ACL
             /* Dry-run the CIB deletion first so that a lack of permission
              * is reported before anything is changed */
             int cib_rc = delete_rsc_status(lrm_state, rsc->id, cib_dryrun | cib_sync_call, user_name);
             if (cib_rc != pcmk_ok) {
                 lrmd_event_data_t *op = NULL;
 
                 crm_err
                     ("Attempted deletion of resource status '%s' from CIB for %s (user=%s) on %s failed: (rc=%d) %s",
                      rsc->id, from_sys, user_name ? user_name : "unknown", from_host, cib_rc,
                      pcmk_strerror(cib_rc));
 
                 op = construct_op(lrm_state, input->xml, rsc->id, operation);
                 /* Same guard as at the other construct_op() call sites */
                 CRM_ASSERT(op != NULL);
                 op->op_status = PCMK_LRM_OP_ERROR;
 
                 if (cib_rc == -EACCES) {
                     op->rc = PCMK_OCF_INSUFFICIENT_PRIV;
                 } else {
                     op->rc = PCMK_OCF_UNKNOWN_ERROR;
                 }
                 send_direct_ack(from_host, from_sys, NULL, op, rsc->id);
                 lrmd_free_event(op);
                 lrmd_free_rsc_info(rsc);
                 return;
             }
 #endif
             /* A delete requested via CRM_OP_LRM_DELETE must not unregister
              * a remote connection resource */
             if (crm_rsc_delete == TRUE && is_remote_lrmd_ra(NULL, NULL, rsc->id)) {
                 unregister = FALSE;
             }
 
             delete_resource(lrm_state, rsc->id, rsc, NULL, from_sys, from_host, user_name, input, unregister);
 
         } else {
             do_lrm_rsc_op(lrm_state, rsc, operation, input->xml, input->msg);
         }
 
         lrmd_free_rsc_info(rsc);
 
     } else {
         crm_err("Operation was neither a lrm_query, nor a rsc op.  %s", crm_str(crm_op));
         register_fsa_error(C_FSA_INTERNAL, I_ERROR, NULL);
     }
 }
 
 /*
  * Build a new executor event describing "operation" on resource "rsc_id".
  *
  * lrm_state  Executor connection state; its resource_history table is
  *            consulted for cached stop parameters when the action is a stop
  * rsc_op     XML of the requested operation, or NULL (expected only for
  *            stop actions), in which case the event carries nothing but
  *            our own CRM feature set as a parameter
  * rsc_id     ID of the resource to act on (asserted non-NULL)
  * operation  Name of the action
  *
  * Returns a newly allocated event; callers in this file release it with
  * lrmd_free_event(). The process asserts if the event cannot be allocated.
  */
 static lrmd_event_data_t *
 construct_op(lrm_state_t * lrm_state, xmlNode * rsc_op, const char *rsc_id, const char *operation)
 {
     lrmd_event_data_t *op = NULL;
     const char *op_delay = NULL;
     const char *op_timeout = NULL;
     const char *op_interval = NULL;
     GHashTable *params = NULL;
     xmlNode *versioned_params = NULL;
 
     const char *transition = NULL;
 
     CRM_ASSERT(rsc_id != NULL);
 
     op = calloc(1, sizeof(lrmd_event_data_t));
     /* Every statement below dereferences op, so fail loudly on allocation
      * failure rather than crash on a NULL pointer */
     CRM_ASSERT(op != NULL);
 
     op->type = lrmd_event_exec_complete;
     op->op_type = strdup(operation);
     op->op_status = PCMK_LRM_OP_PENDING;
     op->rc = -1;
     op->rsc_id = strdup(rsc_id);
     op->interval = 0;
     op->timeout = 0;
     op->start_delay = 0;
 
     if (rsc_op == NULL) {
         CRM_LOG_ASSERT(safe_str_eq(CRMD_ACTION_STOP, operation));
         op->user_data = NULL;
         /* the stop_all_resources() case
          * by definition there is no DC (or they'd be shutting
          *   us down).
          * So we should put our version here.
          */
         op->params = g_hash_table_new_full(crm_str_hash, g_str_equal,
                                            g_hash_destroy_str, g_hash_destroy_str);
 
         g_hash_table_insert(op->params, strdup(XML_ATTR_CRM_VERSION), strdup(CRM_FEATURE_SET));
 
         crm_trace("Constructed %s op for %s", operation, rsc_id);
         return op;
     }
 
     params = xml2list(rsc_op);
     g_hash_table_remove(params, CRM_META "_op_target_rc");
 
     /* Versioned parameters are only picked up for resources that are not
      * remote connection resources */
     if (!is_remote_lrmd_ra(NULL, NULL, rsc_id)) {
         xmlNode *ptr = first_named_child(rsc_op, XML_TAG_VER_ATTRS);
 
         if (ptr) {
             versioned_params = copy_xml(ptr);
         }
     }
 
     op_delay = crm_meta_value(params, XML_OP_ATTR_START_DELAY);
     op_timeout = crm_meta_value(params, XML_ATTR_TIMEOUT);
     op_interval = crm_meta_value(params, XML_LRM_ATTR_INTERVAL);
 
     op->interval = crm_parse_int(op_interval, "0");
     op->timeout = crm_parse_int(op_timeout, "0");
     op->start_delay = crm_parse_int(op_delay, "0");
 
     if (safe_str_neq(operation, RSC_STOP)) {
         /* Not a stop: the event takes ownership of the parsed parameters */
         op->params = params;
         op->versioned_params = versioned_params;
 
     } else {
         rsc_history_t *entry = g_hash_table_lookup(lrm_state->resource_history, rsc_id);
 
         /* If we do not have stop parameters cached, use
          * whatever we are given */
         if (!entry || !entry->stop_params) {
             op->params = params;
             op->versioned_params = versioned_params;
         } else {
             /* Copy the cached parameter list so that we stop the resource
              * with the old attributes, not the new ones */
             op->params = g_hash_table_new_full(crm_str_hash, g_str_equal,
                                                g_hash_destroy_str, g_hash_destroy_str);
 
             g_hash_table_foreach(params, copy_meta_keys, op->params);
             g_hash_table_foreach(entry->stop_params, copy_instance_keys, op->params);
             g_hash_table_destroy(params);
             params = NULL;
 
             /* The freshly parsed versioned parameters are not used with
              * the cached stop parameters, so release them here */
             op->versioned_params = NULL;
             free_xml(versioned_params);
         }
     }
 
     if (op->versioned_params) {
         /* Also pass the versioned parameters along as a text parameter;
          * the hash table takes ownership of the dumped string */
         char *versioned_params_text = dump_xml_unformatted(op->versioned_params);
 
         if (versioned_params_text) {
             g_hash_table_insert(op->params, strdup("#" XML_TAG_VER_ATTRS), versioned_params_text);
         }
     }
 
     /* sanity */
     if (op->interval < 0) {
         op->interval = 0;
     }
     if (op->timeout <= 0) {
         /* No usable timeout was given: fall back to the interval */
         op->timeout = op->interval;
     }
     if (op->start_delay < 0) {
         op->start_delay = 0;
     }
 
     transition = crm_element_value(rsc_op, XML_ATTR_TRANSITION_KEY);
     CRM_CHECK(transition != NULL, return op);
 
     op->user_data = strdup(transition);
 
     if (op->interval != 0) {
         if (safe_str_eq(operation, CRMD_ACTION_START)
             || safe_str_eq(operation, CRMD_ACTION_STOP)) {
             crm_err("Start and Stop actions cannot have an interval: %d", op->interval);
             op->interval = 0;
         }
     }
 
     crm_trace("Constructed %s op for %s: interval=%d", operation, rsc_id, op->interval);
 
     return op;
 }
 
 /*
  * Send the result of "op" straight to another subsystem as a
  * CRM_OP_INVOKE_LRM request wrapping a node-state update.
  *
  * to_host  Destination host, handed unchanged to create_request()
  * to_sys   Destination subsystem; CRM_SYSTEM_TENGINE is used when NULL
  * rsc      Resource details passed to build_operation_update()
  * op       Operation result to report; nothing is sent if NULL
  * rsc_id   Resource ID stored in op->rsc_id when op has none (asserted
  *          non-NULL in that case)
  */
 void
 send_direct_ack(const char *to_host, const char *to_sys,
                 lrmd_rsc_info_t * rsc, lrmd_event_data_t * op, const char *rsc_id)
 {
     crm_node_t *local_node = NULL;
     xmlNode *state_xml = NULL;
     xmlNode *lrm_xml = NULL;
     xmlNode *rsc_list_xml = NULL;
     xmlNode *rsc_xml = NULL;
     xmlNode *ack = NULL;
     const char *target_sys = to_sys;
 
     CRM_CHECK(op != NULL, return);
 
     if (op->rsc_id == NULL) {
         CRM_ASSERT(rsc_id != NULL);
         op->rsc_id = strdup(rsc_id);
     }
 
     if (target_sys == NULL) {
         target_sys = CRM_SYSTEM_TENGINE;
     }
 
     /* Start from a node-state element for the local node ... */
     local_node = crm_get_peer(0, fsa_our_uname);
     state_xml = create_node_state_update(local_node, node_update_none, NULL,
                                          __FUNCTION__);
 
     /* ... and nest lrm -> resources -> resource beneath it */
     lrm_xml = create_xml_node(state_xml, XML_CIB_TAG_LRM);
     crm_xml_add(lrm_xml, XML_ATTR_ID, fsa_our_uuid);
 
     rsc_list_xml = create_xml_node(lrm_xml, XML_LRM_TAG_RESOURCES);
     rsc_xml = create_xml_node(rsc_list_xml, XML_LRM_TAG_RESOURCE);
     crm_xml_add(rsc_xml, XML_ATTR_ID, op->rsc_id);
 
     build_operation_update(rsc_xml, rsc, op, __FUNCTION__);
 
     ack = create_request(CRM_OP_INVOKE_LRM, state_xml, to_host, target_sys,
                          CRM_SYSTEM_LRMD, NULL);
 
     crm_log_xml_trace(state_xml, "ACK Update");
 
     crm_debug("ACK'ing resource op %s_%s_%d from %s: %s",
               op->rsc_id, op->op_type, op->interval, op->user_data,
               crm_element_value(ack, XML_ATTR_REFERENCE));
 
     if (relay_message(ack, TRUE) == FALSE) {
         crm_log_xml_err(ack, "Unable to route reply");
     }
 
     free_xml(state_xml);
     free_xml(ack);
 }
 
 /*
  * Run lrm_state_verify_stopped() against every entry returned by
  * lrm_state_get_list(), then set R_SENT_RSC_STOP in the FSA input register.
  *
  * Returns TRUE only if the check succeeded for every entry.
  */
 gboolean
 verify_stopped(enum crmd_fsa_state cur_state, int log_level)
 {
     gboolean all_stopped = TRUE;
     GList *all_states = lrm_state_get_list();
     GList *node = all_states;
 
     while (node != NULL) {
         lrm_state_t *current = node->data;
 
         /* No early exit on purpose: every entry must be visited even
          * after one of them has reported a failure */
         if (lrm_state_verify_stopped(current, cur_state, log_level) == FALSE) {
             all_stopped = FALSE;
         }
         node = node->next;
     }
 
     set_bit(fsa_input_register, R_SENT_RSC_STOP);
     g_list_free(all_states);
 
     return all_stopped;
 }
 
 /* User data handed to stop_recurring_action_by_rsc() while walking the
  * pending operations table */
 struct stop_recurring_action_s {
     lrmd_rsc_info_t *rsc;       /* resource whose recurring ops are cancelled */
     lrm_state_t *lrm_state;     /* connection state passed on to cancel_op() */
 };
 
 /*
  * Hash table callback (used with g_hash_table_foreach_remove() on the
  * pending operations table): cancel a recurring operation if it belongs to
  * the resource named in user_data.
  *
  * key        Table key of the entry, also passed to cancel_op()
  * value      The struct recurring_op_s being examined
  * user_data  A struct stop_recurring_action_s naming resource and state
  *
  * Returns TRUE (remove the entry) only when a cancel was attempted and
  * cancel_op() returned FALSE.
  */
 static gboolean
 stop_recurring_action_by_rsc(gpointer key, gpointer value, gpointer user_data)
 {
     struct recurring_op_s *candidate = (struct recurring_op_s *)value;
     struct stop_recurring_action_s *target = user_data;
 
     /* One-shot operations are never touched here */
     if (candidate->interval == 0) {
         return FALSE;
     }
 
     /* Operations of other resources are left alone */
     if (!crm_str_eq(candidate->rsc_id, target->rsc->id, TRUE)) {
         return FALSE;
     }
 
     crm_debug("Cancelling op %d for %s (%s)", candidate->call_id, candidate->rsc_id, (char*)key);
     return !cancel_op(target->lrm_state, target->rsc->id, key, candidate->call_id, FALSE);
 }
 
 /*
  * Hash table callback: cancel the given operation if it is recurring,
  * regardless of which resource it belongs to.
  *
  * key        Table key of the entry, also passed to cancel_op()
  * value      The struct recurring_op_s being examined
  * user_data  The lrm_state_t the operation belongs to
  *
  * Returns TRUE (remove the entry) only when a cancel was attempted and
  * cancel_op() returned FALSE.
  *
  * NOTE(review): has the shape of a GLib GHRFunc and is presumably used with
  * g_hash_table_foreach_remove() like stop_recurring_action_by_rsc() --
  * confirm at the call site.
  */
 static gboolean
 stop_recurring_actions(gpointer key, gpointer value, gpointer user_data)
 {
     gboolean remove = FALSE;
     lrm_state_t *lrm_state = user_data;
     struct recurring_op_s *op = (struct recurring_op_s *)value;
 
     if (op->interval != 0) {
         /* key is an untyped gpointer: cast it so the argument matches the
          * %s conversion, as stop_recurring_action_by_rsc() already does */
         crm_info("Cancelling op %d for %s (%s)", op->call_id, op->rsc_id, (char*)key);
         remove = !cancel_op(lrm_state, op->rsc_id, key, op->call_id, FALSE);
     }
 
     return remove;
 }
 
 /*
  * Write a "pending" entry for an operation to the CIB, if the operation
  * asks for it through its XML_OP_ATTR_PENDING meta attribute.
  *
  * node_name  Node the operation runs on
  * rsc        Resource the operation belongs to
  * op         Operation about to be executed; its call_id, op_status, rc and
  *            timestamps are overwritten when a pending entry is recorded
  *
  * Nothing is recorded for cancel or delete actions, for operations without
  * a type or parameters, or when the meta attribute is unset or not true.
  */
 static void
 record_pending_op(const char *node_name, lrmd_rsc_info_t *rsc, lrmd_event_data_t *op)
 {
     const char *pending_flag = NULL;
 
     CRM_CHECK(node_name != NULL, return);
     CRM_CHECK(rsc != NULL, return);
     CRM_CHECK(op != NULL, return);
 
     if (op->op_type == NULL) {
         return;
     }
     if (safe_str_eq(op->op_type, CRMD_ACTION_CANCEL)
         || safe_str_eq(op->op_type, CRMD_ACTION_DELETE)) {
         return;
     }
 
     /* Without parameters there is no meta attribute to consult */
     if (op->params == NULL) {
         return;
     }
 
     pending_flag = crm_meta_value(op->params, XML_OP_ATTR_PENDING);
     if (pending_flag == NULL || !crm_is_true(pending_flag)) {
         return;
     }
 
     /* Mark the operation as not yet executed, stamped with the current time */
     op->call_id = -1;
     op->op_status = PCMK_LRM_OP_PENDING;
     op->rc = PCMK_OCF_UNKNOWN;
 
     op->t_run = time(NULL);
     op->t_rcchange = op->t_run;
 
     /* write a "pending" entry to the CIB, inhibit notification */
     crm_debug("Recording pending op %s_%s_%d on %s in the CIB",
               op->rsc_id, op->op_type, op->interval, node_name);
 
     do_update_resource(node_name, rsc, op);
 }
 
 /*
  * Execute a resource operation through the executor connection.
  *
  * lrm_state  Connection state of the node the operation runs on
  * rsc        Resource to operate on (checked non-NULL)
  * operation  Name of the action (checked non-NULL)
  * msg        XML of the requested operation, or NULL; passed to
  *            construct_op() and used to look up the transition key
  * request    Not used by this function
  *
  * Steps, in order: build the event, cancel the resource's recurring
  * operations where required, refuse (direct NACK) actions that are not
  * acceptable in the current FSA state, optionally record a pending entry in
  * the CIB, hand the operation to lrm_state_exec(), and finally either report
  * the failure or remember the operation in lrm_state->pending_ops.
  */
 static void
 do_lrm_rsc_op(lrm_state_t * lrm_state, lrmd_rsc_info_t * rsc, const char *operation, xmlNode * msg,
               xmlNode * request)
 {
     int call_id = 0;
     char *op_id = NULL;
     lrmd_event_data_t *op = NULL;
     lrmd_key_value_t *params = NULL;
     fsa_data_t *msg_data = NULL;
     const char *transition = NULL;
     gboolean stop_recurring = FALSE;
     bool send_nack = FALSE;
 
     CRM_CHECK(rsc != NULL, return);
     CRM_CHECK(operation != NULL, return);
 
     if (msg != NULL) {
         transition = crm_element_value(msg, XML_ATTR_TRANSITION_KEY);
         if (transition == NULL) {
             crm_log_xml_err(msg, "Missing transition number");
         }
     }
 
     op = construct_op(lrm_state, msg, rsc->id, operation);
     CRM_CHECK(op != NULL, return);
 
     if (is_remote_lrmd_ra(NULL, NULL, rsc->id)
         && op->interval == 0
         && strcmp(operation, CRMD_ACTION_MIGRATE) == 0) {
 
         /* pcmk remote connections are a special use case.
          * We never ever want to stop monitoring a connection resource until
-         * the entire migration has completed. If the connection is ever unexpected
+         * the entire migration has completed. If the connection is unexpectedly
          * severed, even during a migration, this is an event we must detect.*/
         stop_recurring = FALSE;
 
     } else if (op->interval == 0
         && strcmp(operation, CRMD_ACTION_STATUS) != 0
         && strcmp(operation, CRMD_ACTION_NOTIFY) != 0) {
 
         /* stop any previous monitor operations before changing the resource state */
         stop_recurring = TRUE;
     }
 
     if (stop_recurring == TRUE) {
         guint removed = 0;
         struct stop_recurring_action_s data;
 
         data.rsc = rsc;
         data.lrm_state = lrm_state;
         removed = g_hash_table_foreach_remove(
             lrm_state->pending_ops, stop_recurring_action_by_rsc, &data);
 
         if (removed) {
             crm_debug("Stopped %u recurring operations in preparation for %s_%s_%d",
                       removed, rsc->id, operation, op->interval);
         }
     }
 
     /* now do the op */
     crm_info("Performing key=%s op=%s_%s_%d", transition, rsc->id, operation, op->interval);
 
     if (is_set(fsa_input_register, R_SHUTDOWN) && safe_str_eq(operation, RSC_START)) {
         /* Never start anything once a shutdown has been requested */
         register_fsa_input(C_SHUTDOWN, I_SHUTDOWN, NULL);
         send_nack = TRUE;
 
     } else if (fsa_state != S_NOT_DC
                && fsa_state != S_POLICY_ENGINE /* Recalculating */
                && fsa_state != S_TRANSITION_ENGINE
                && safe_str_neq(operation, "fail")
                && safe_str_neq(operation, CRMD_ACTION_STOP)) {
         /* Outside these states only "fail" and stop actions are accepted */
         send_nack = TRUE;
     }
 
     if(send_nack) {
         crm_notice("Discarding attempt to perform action %s on %s in state %s (shutdown=%s)",
                    operation, rsc->id, fsa_state2string(fsa_state),
                    is_set(fsa_input_register, R_SHUTDOWN)?"true":"false");
 
         op->rc = CRM_DIRECT_NACK_RC;
         op->op_status = PCMK_LRM_OP_ERROR;
         send_direct_ack(NULL, NULL, rsc, op, rsc->id);
         lrmd_free_event(op);
         free(op_id);
         return;
     }
 
     record_pending_op(lrm_state->node_name, rsc, op);
 
     op_id = generate_op_key(rsc->id, op->op_type, op->interval);
 
     if (op->interval > 0) {
         /* cancel it so we can then restart it without conflict */
         cancel_op_key(lrm_state, rsc, op_id, FALSE);
     }
 
     if (op->params) {
         /* Flatten the parameter table into the key/value list that
          * lrm_state_exec() takes */
         char *key = NULL;
         char *value = NULL;
         GHashTableIter iter;
 
         g_hash_table_iter_init(&iter, op->params);
         while (g_hash_table_iter_next(&iter, (gpointer *) & key, (gpointer *) & value)) {
             params = lrmd_key_value_add(params, key, value);
         }
     }
 
     call_id = lrm_state_exec(lrm_state,
                              rsc->id,
                              op->op_type,
                              op->user_data, op->interval, op->timeout, op->start_delay, params);
 
     if (call_id <= 0 && lrm_state_is_local(lrm_state)) {
         crm_err("Operation %s on %s failed: %d", operation, rsc->id, call_id);
         register_fsa_error(C_FSA_INTERNAL, I_FAIL, NULL);
 
     } else if (call_id <= 0) {
 
         /* Remote node: report the failure as a completed operation with an
          * error result, using a fake call ID */
         crm_err("Operation %s on resource %s failed to execute on remote node %s: %d", operation, rsc->id, lrm_state->node_name, call_id);
         op->call_id = get_fake_call_id(lrm_state, rsc->id);
         op->op_status = PCMK_LRM_OP_DONE;
         op->rc = PCMK_OCF_UNKNOWN_ERROR;
         op->t_run = time(NULL);
         op->t_rcchange = op->t_run;
         process_lrm_event(lrm_state, op, NULL);
 
     } else {
         /* record all operations so we can wait
          * for them to complete during shutdown
          */
         char *call_id_s = make_stop_id(rsc->id, call_id);
         struct recurring_op_s *pending = NULL;
 
         pending = calloc(1, sizeof(struct recurring_op_s));
         /* Every statement below dereferences pending */
         CRM_ASSERT(pending != NULL);
         crm_trace("Recording pending op: %d - %s %s", call_id, op_id, call_id_s);
 
         pending->call_id = call_id;
         pending->interval = op->interval;
         pending->op_type = strdup(operation);
         pending->op_key = strdup(op_id);
         pending->rsc_id = strdup(rsc->id);
         pending->start_time = time(NULL);
         /* construct_op() leaves user_data NULL when it is given no request
          * XML or no transition key, and strdup(NULL) is undefined */
         pending->user_data = op->user_data? strdup(op->user_data) : NULL;
         g_hash_table_replace(lrm_state->pending_ops, call_id_s, pending);
 
         if (op->interval > 0 && op->start_delay > START_DELAY_THRESHOLD) {
             char *uuid = NULL;
             int dummy = 0, target_rc = 0;
 
             crm_info("Faking confirmation of %s: execution postponed for over 5 minutes", op_id);
 
             decode_transition_key(op->user_data, &uuid, &dummy, &dummy, &target_rc);
             free(uuid);
 
             op->rc = target_rc;
             op->op_status = PCMK_LRM_OP_DONE;
             send_direct_ack(NULL, NULL, rsc, op, rsc->id);
         }
 
         /* The pending entry takes over the parameter table, so detach it
          * from op before op is freed below */
         pending->params = op->params;
         op->params = NULL;
     }
 
     free(op_id);
     lrmd_free_event(op);
     return;
 }
 
 /* Call ID of the most recent resource update sent by do_update_resource();
  * cib_rsc_callback() resets it to 0 once that call's result arrives */
 int last_resource_update = 0;
 
 /*
  * CIB callback for resource updates: log the outcome and, if this was the
  * most recently sent update, clear last_resource_update and trigger the FSA.
  *
  * call_id  ID of the CIB call that completed
  * rc       Result of that call
  *
  * msg, output and user_data are not used.
  */
 static void
 cib_rsc_callback(xmlNode * msg, int call_id, int rc, xmlNode * output, void *user_data)
 {
     /* Diff failures/resyncs are treated like success here */
     if (rc == pcmk_ok
         || rc == -pcmk_err_diff_failed
         || rc == -pcmk_err_diff_resync) {
         crm_trace("Resource update %d complete: rc=%d", call_id, rc);
 
     } else {
         crm_warn("Resource update %d failed: (rc=%d) %s", call_id, rc, pcmk_strerror(rc));
     }
 
     if (call_id != last_resource_update) {
         return;
     }
 
     last_resource_update = 0;
     trigger_fsa(fsa_source);
 }
 
 /*
  * Send the result of an operation to the CIB status section.
  *
  * node_name  Node the operation ran on; anything other than our own uname
  *            is treated as a remote node whose UUID equals its name
  * rsc        Resource details, or NULL if the resource is no longer known,
  *            in which case a direct ack is sent instead of a CIB update
  * op         Operation result to record (checked non-NULL)
  *
  * Returns the value left in rc: 0 if op is NULL or no update was sent,
  * -EINVAL if no UUID could be determined, otherwise whatever
  * fsa_cib_update() stored there (treated below as a call number when
  * positive).
  */
 static int
 do_update_resource(const char *node_name, lrmd_rsc_info_t * rsc, lrmd_event_data_t * op)
 {
 /*
   <status>
   <nodes_status id=uname>
   <lrm>
   <lrm_resources>
   <lrm_resource id=...>
   </...>
 */
     int rc = pcmk_ok;
     xmlNode *update, *iter = NULL;
     int call_opt = crmd_cib_smart_opt();
     const char *uuid = NULL;
 
     CRM_CHECK(op != NULL, return 0);
 
     /* iter is still NULL here, so the status element has no parent;
      * "update" keeps pointing at it while iter descends */
     iter = create_xml_node(iter, XML_CIB_TAG_STATUS);
     update = iter;
     iter = create_xml_node(iter, XML_CIB_TAG_STATE);
 
     if (safe_str_eq(node_name, fsa_our_uname)) {
         uuid = fsa_our_uuid;
 
     } else {
         /* remote nodes uuid and uname are equal */
         uuid = node_name;
         crm_xml_add(iter, XML_NODE_IS_REMOTE, "true");
     }
 
     CRM_LOG_ASSERT(uuid != NULL);
     if(uuid == NULL) {
         rc = -EINVAL;
         goto done;
     }
 
     crm_xml_add(iter, XML_ATTR_UUID,  uuid);
     crm_xml_add(iter, XML_ATTR_UNAME, node_name);
     crm_xml_add(iter, XML_ATTR_ORIGIN, __FUNCTION__);
 
     iter = create_xml_node(iter, XML_CIB_TAG_LRM);
     crm_xml_add(iter, XML_ATTR_ID, uuid);
 
     iter = create_xml_node(iter, XML_LRM_TAG_RESOURCES);
     iter = create_xml_node(iter, XML_LRM_TAG_RESOURCE);
     crm_xml_add(iter, XML_ATTR_ID, op->rsc_id);
 
     /* Note: called before rsc is checked for NULL below */
     build_operation_update(iter, rsc, op, __FUNCTION__);
 
     if (rsc) {
         const char *container = NULL;
 
         crm_xml_add(iter, XML_ATTR_TYPE, rsc->type);
         crm_xml_add(iter, XML_AGENT_ATTR_CLASS, rsc->class);
         crm_xml_add(iter, XML_AGENT_ATTR_PROVIDER, rsc->provider);
 
         if (op->params) {
             container = g_hash_table_lookup(op->params, CRM_META"_"XML_RSC_ATTR_CONTAINER);
         }
         if (container) {
             crm_trace("Resource %s is a part of container resource %s", op->rsc_id, container);
             crm_xml_add(iter, XML_RSC_ATTR_CONTAINER, container);
         }
 
     } else {
         /* No CIB update and no callback registration in this case */
         crm_warn("Resource %s no longer exists in the lrmd", op->rsc_id);
         send_direct_ack(NULL, NULL, rsc, op, op->rsc_id);
         goto cleanup;
     }
 
     crm_log_xml_trace(update, __FUNCTION__);
 
     /* make it an asynchronous call and be done with it
      *
      * Best case:
      *   the resource state will be discovered during
      *   the next signup or election.
      *
      * Bad case:
      *   we are shutting down and there is no DC at the time,
      *   but then why were we shutting down then anyway?
      *   (probably because of an internal error)
      *
      * Worst case:
      *   we get shot for having resources "running" when the really weren't
      *
      * the alternative however means blocking here for too long, which
      * isn't acceptable
      */
     /* NOTE(review): fsa_cib_update() is expected to store the CIB call ID
      * in rc -- confirm against its definition */
     fsa_cib_update(XML_CIB_TAG_STATUS, update, call_opt, rc, NULL);
 
     if (rc > 0) {
         /* Remembered so cib_rsc_callback() can recognise the latest update */
         last_resource_update = rc;
     }
   done:
     /* the return code is a call number, not an error code */
     crm_trace("Sent resource state update message: %d for %s=%d on %s", rc,
               op->op_type, op->interval, op->rsc_id);
     fsa_register_cib_callback(rc, FALSE, NULL, cib_rsc_callback);
 
   cleanup:
     free_xml(update);
     return rc;
 }
 
 /*
  * FSA action handler stub: every argument is ignored and the body is a
  * CRM_CHECK() that always fails and then returns.
  */
 void
 do_lrm_event(long long action,
              enum crmd_fsa_cause cause,
              enum crmd_fsa_state cur_state, enum crmd_fsa_input cur_input, fsa_data_t * msg_data)
 {
     CRM_CHECK(FALSE, return);
 }
 
 /*
  * Handle the result of a resource operation: record or acknowledge it,
  * drop it from the pending operations table where appropriate, log the
  * outcome, send notifications and update the history cache.
  *
  * lrm_state  Connection state of the node the operation ran on
  * op         Operation result (op and op->rsc_id are checked non-NULL);
  *            its op_status may be rewritten from ERROR to DONE, see below
  * pending    Pending-table entry for this operation, or NULL, in which case
  *            it is looked up by stop ID in lrm_state->pending_ops and this
  *            function takes care of removing it from the table
  *
  * Returns FALSE if the argument checks fail, TRUE otherwise.
  */
 gboolean
 process_lrm_event(lrm_state_t * lrm_state, lrmd_event_data_t * op, struct recurring_op_s *pending)
 {
     char *op_id = NULL;
     char *op_key = NULL;
 
     int update_id = 0;
     gboolean remove = FALSE;
     gboolean removed = FALSE;
     lrmd_rsc_info_t *rsc = NULL;
 
     CRM_CHECK(op != NULL, return FALSE);
     CRM_CHECK(op->rsc_id != NULL, return FALSE);
 
     op_id = make_stop_id(op->rsc_id, op->call_id);
     op_key = generate_op_key(op->rsc_id, op->op_type, op->interval);
     rsc = lrm_state_get_rsc_info(lrm_state, op->rsc_id, 0);
     if(pending == NULL) {
         /* Caller did not supply the entry: find it ourselves and remember
          * that removing it from the table is our job */
         remove = TRUE;
         pending = g_hash_table_lookup(lrm_state->pending_ops, op_id);
     }
 
     if (op->op_status == PCMK_LRM_OP_ERROR) {
         switch(op->rc) {
             case PCMK_OCF_NOT_RUNNING:
             case PCMK_OCF_RUNNING_MASTER:
             case PCMK_OCF_DEGRADED:
             case PCMK_OCF_DEGRADED_MASTER:
                 /* Leave it up to the TE/PE to decide if this is an error */
                 op->op_status = PCMK_LRM_OP_DONE;
                 break;
             default:
                 /* Nothing to do */
                 break;
         }
     }
 
     /* Decide how the result is reported: CIB update, direct ack, history
      * deletion, or nothing at all */
     if (op->op_status != PCMK_LRM_OP_CANCELLED) {
         if (safe_str_eq(op->op_type, RSC_NOTIFY)) {
             /* Keep notify ops out of the CIB */
             send_direct_ack(NULL, NULL, NULL, op, op->rsc_id);
         } else {
             update_id = do_update_resource(lrm_state->node_name, rsc, op);
         }
     } else if (op->interval == 0) {
         /* This will occur when "crm resource cleanup" is called while actions are in-flight */
         crm_err("Op %s (call=%d): Cancelled", op_key, op->call_id);
         send_direct_ack(NULL, NULL, NULL, op, op->rsc_id);
 
     } else if (pending == NULL) {
         /* We don't need to do anything for cancelled ops
          * that are not in our pending op list. There are no
          * transition actions waiting on these operations. */
 
     } else if (op->user_data == NULL) {
         /* At this point we have a pending entry, but no transition
          * key present in the user_data field. report this */
         crm_err("Op %s (call=%d): No user data", op_key, op->call_id);
 
     } else if (pending->remove) {
         /* The tengine canceled this op, we have been waiting for the cancel to finish. */
         delete_op_entry(lrm_state, op, op->rsc_id, op_key, op->call_id);
 
     } else if (pending && op->rsc_deleted) {
         /* The tengine initiated this op, but it was cancelled outside of the
          * tengine's control during a resource cleanup/re-probe request. The tengine
          * must be alerted that this operation completed, otherwise the tengine
          * will continue waiting for this update to occur until it is timed out.
          * We don't want this update going to the cib though, so use a direct ack. */
         crm_trace("Op %s (call=%d): cancelled due to rsc deletion", op_key, op->call_id);
         send_direct_ack(NULL, NULL, NULL, op, op->rsc_id);
 
     } else {
         /* Before a stop is called, no need to direct ack */
         crm_trace("Op %s (call=%d): no delete event required", op_key, op->call_id);
     }
 
     /* Drop the entry from the pending table: one-shot operations always,
      * recurring ones only once they have been cancelled */
     if(remove == FALSE) {
         /* The caller will do this afterwards, but keep the logging consistent */
         removed = TRUE;
 
     } else if ((op->interval == 0) && g_hash_table_remove(lrm_state->pending_ops, op_id)) {
         removed = TRUE;
         crm_trace("Op %s (call=%d, stop-id=%s, remaining=%u): Confirmed",
                   op_key, op->call_id, op_id, g_hash_table_size(lrm_state->pending_ops));
 
     } else if(op->interval != 0 && op->op_status == PCMK_LRM_OP_CANCELLED) {
         removed = TRUE;
         g_hash_table_remove(lrm_state->pending_ops, op_id);
     }
 
     /* Log the outcome at a level that depends on the final status */
     switch (op->op_status) {
         case PCMK_LRM_OP_CANCELLED:
             crm_info("Result of %s operation for %s on %s: %s "
                      CRM_XS " call=%d key=%s confirmed=%s",
                      crm_action_str(op->op_type, op->interval),
                      op->rsc_id, lrm_state->node_name,
                      services_lrm_status_str(op->op_status),
                      op->call_id, op_key, (removed? "true" : "false"));
             break;
 
         case PCMK_LRM_OP_DONE:
             /* Results of recurring operations are logged at the lower level */
             do_crm_log(op->interval?LOG_INFO:LOG_NOTICE,
                        "Result of %s operation for %s on %s: %d (%s) "
                        CRM_XS " call=%d key=%s confirmed=%s cib-update=%d",
                        crm_action_str(op->op_type, op->interval),
                        op->rsc_id, lrm_state->node_name,
                        op->rc, services_ocf_exitcode_str(op->rc),
                        op->call_id, op_key, (removed? "true" : "false"),
                        update_id);
             break;
 
         case PCMK_LRM_OP_TIMEOUT:
             crm_err("Result of %s operation for %s on %s: %s "
                     CRM_XS " call=%d key=%s timeout=%dms",
                     crm_action_str(op->op_type, op->interval),
                     op->rsc_id, lrm_state->node_name,
                     services_lrm_status_str(op->op_status),
                     op->call_id, op_key, op->timeout);
             break;
 
         default:
             crm_err("Result of %s operation for %s on %s: %s "
                     CRM_XS " call=%d key=%s confirmed=%s status=%d cib-update=%d",
                     crm_action_str(op->op_type, op->interval),
                     op->rsc_id, lrm_state->node_name,
                     services_lrm_status_str(op->op_status), op->call_id, op_key,
                     (removed? "true" : "false"), op->op_status, update_id);
     }
 
     if (op->output) {
         char *prefix =
             crm_strdup_printf("%s-%s_%s_%d:%d", lrm_state->node_name, op->rsc_id, op->op_type, op->interval, op->call_id);
 
         /* Output of operations with a non-zero rc is logged more prominently */
         if (op->rc) {
             crm_log_output(LOG_NOTICE, prefix, op->output);
         } else {
             crm_log_output(LOG_DEBUG, prefix, op->output);
         }
         free(prefix);
     }
 
     crmd_notify_resource_op(lrm_state->node_name, op);
 
     if (op->rsc_deleted) {
         crm_info("Deletion of resource '%s' complete after %s", op->rsc_id, op_key);
         delete_rsc_entry(lrm_state, NULL, op->rsc_id, NULL, pcmk_ok, NULL);
     }
 
     /* If a shutdown was escalated while operations were pending,
      * then the FSA will be stalled right now... allow it to continue
      */
     mainloop_set_trigger(fsa_source);
     update_history_cache(lrm_state, rsc, op);
 
     lrmd_free_rsc_info(rsc);
     free(op_key);
     free(op_id);
 
     return TRUE;
 }
diff --git a/doc/Pacemaker_Explained/en-US/Ap-Upgrade.txt b/doc/Pacemaker_Explained/en-US/Ap-Upgrade.txt
index f36f8159a3..32c0537618 100644
--- a/doc/Pacemaker_Explained/en-US/Ap-Upgrade.txt
+++ b/doc/Pacemaker_Explained/en-US/Ap-Upgrade.txt
@@ -1,420 +1,408 @@
 [appendix]
 
 == Upgrading ==
 
 [[ap-upgrade]]
 === Upgrading Cluster Software ===
 
 There are three approaches to upgrading a cluster, each with advantages and
 disadvantages.
 
 .Upgrade Methods
 [width="95%",cols="s,6*",options="header",align="center"]
 |=========================================================
 
 |Method
 |Available between all versions
 |Can be used with Pacemaker Remote nodes
 |Service outage during upgrade
 |Service recovery during upgrade
 |Exercises failover logic
 |Allows change of messaging layer
 indexterm:[Cluster,switching between stacks]
 indexterm:[Changing cluster stack]
 footnote:[For example, switching from Heartbeat to Corosync.]
 
 |Complete cluster shutdown
 indexterm:[upgrade,shutdown]
 indexterm:[shutdown upgrade]
 |yes
 |yes
 |always
 |N/A
 |no
 |yes
 
 |Rolling (node by node)
 indexterm:[upgrade,rolling]
 indexterm:[rolling upgrade]
 |no
 |yes
 |always
+footnote:[Any active resources will be moved off the node being upgraded,
+so there will be at least a brief outage unless all resources can be
+migrated "live".]
 |yes
 |yes
 |no
 
 |Detach and reattach
 indexterm:[upgrade,reattach]
 indexterm:[reattach upgrade]
 |yes
 |no
 |only due to failure
 |no
 |no
 |yes
 
 |=========================================================
 
 ==== Complete Cluster Shutdown ====
 
 In this scenario, one shuts down all cluster nodes and resources,
 then upgrades all the nodes before restarting the cluster.
 
 . On each node:
 .. Shut down the cluster software (pacemaker and the messaging layer).
 .. Upgrade the Pacemaker software. This may also include upgrading the
    messaging layer and/or the underlying operating system.
 .. Check the configuration with the `crm_verify` tool.
 . On each node:
 .. Start the cluster software.
    The messaging layer can be either Corosync or Heartbeat and does not need to
    be the same one as before the upgrade.
 
 One variation of this approach is to build a new cluster on new hosts.
 This allows the new version to be tested beforehand, and minimizes downtime by
 having the new nodes ready to be placed in production as soon as the old nodes
 are shut down.
 
 ==== Rolling (node by node) ====
 
 In this scenario, each node is removed from the cluster, upgraded, and then
 brought back online, until all nodes are running the newest version.
 
 If you plan to upgrade other cluster software -- such as the messaging layer --
 at the same time, consult that software's documentation for its compatibility
 with a rolling upgrade.
 
 Pacemaker has three version numbers that affect rolling upgrades:
 
 * *Pacemaker release version:* Rolling upgrades are possible as long as the
   major version number (the _x_ in _x.y.z_) stays the same. For example,
   a rolling upgrade may be done from 1.0.8 to 1.1.15, but not from
   0.6.7 to 1.0.0.
 
 * *CRM feature set:* This version number applies to the communication between
   full cluster nodes.
 +
 It increases when a cluster node running the older version would have
 problems if the cluster's Designated Controller (DC) has the newer version.
 To avoid these problems, Pacemaker ensures that the longest-running node is the
 DC, and that nodes with an older feature set cannot join the cluster.
 +
 Therefore, if the CRM feature set is changing in the Pacemaker version you
 are upgrading to, you should run a mixed-version cluster only during a small
-rolling upgrade window. Otherwise, if one of the older nodes drops out of the
+rolling upgrade window. If one of the older nodes drops out of the
 cluster for any reason, it will not be able to rejoin until it is upgraded.
 
 * *LRMD protocol version:* This version number applies to communication between a
   Pacemaker Remote node and the cluster. It increases when an older cluster
   node would have problems hosting the connection to a newer Pacemaker Remote
   node. To avoid these problems, Pacemaker Remote nodes will accept connections
   only from cluster nodes with the same or newer LRMD protocol version.
 +
 For rolling upgrades, this means that all cluster nodes should be upgraded
 before upgrading any Pacemaker Remote nodes.
 +
 Unlike with CRM feature set differences between full cluster nodes,
 mixed LRMD protocol versions between Pacemaker Remote nodes and full cluster
 nodes are fine, as long as the Pacemaker Remote nodes have the older version.
 This can be useful, for example, to host a legacy application in an
 older operating system version used as a Pacemaker Remote node.
 
 See the ClusterLabs wiki's
 http://clusterlabs.org/wiki/ReleaseCalendar[Release Calendar] to figure out
 whether the CRM feature set and/or LRMD protocol version changed between the
 Pacemaker release versions in your rolling upgrade.
 
 [WARNING]
 ====
 The interpretation of the LRMD protocol version changed in Pacemaker 1.1.15.
 If you are planning a rolling upgrade from an earlier Pacemaker version to
 Pacemaker 1.1.15 or later involving Pacemaker Remote nodes, you will need to
 take special precautions to avoid problems. See
 http://clusterlabs.org/wiki/Upgrading_to_Pacemaker_1.1.15_or_later_from_an_earlier_version[Upgrading
 to Pacemaker 1.1.15 or later from an earlier version] on the ClusterLabs wiki.
 ====
 
 To perform a rolling upgrade, on each node in turn:
 
 . Put the node into standby mode, and wait for any active resources
   to be moved cleanly to another node. (This step is optional, but
   allows you to deal with any resource issues before the upgrade.)
 . Shut down the cluster software (pacemaker and the messaging layer) on the node.
 . Upgrade the Pacemaker software. This may also include upgrading the
   messaging layer and/or the underlying operating system.
 . If this is the first node to be upgraded, check the configuration
   with the `crm_verify` tool.
 . Start the messaging layer.
   This must be the same messaging layer (Corosync or Heartbeat)
   that the rest of the cluster is using.
 
 [NOTE]
 ====
 Rolling upgrades were not always possible with older heartbeat and
 pacemaker versions. Rolling upgrades that cross compatibility
 boundaries listed in the following table must be performed in multiple steps.
 
 .Version Compatibility Table
 [width="95%",cols="2*",options="header",align="center"]
 |=========================================================
 
 |Version being Installed
 |Oldest Compatible Version
 
 |Pacemaker 1.x.y
 |Pacemaker 1.0.0
 
 |Pacemaker 0.7.x
 |Pacemaker 0.6 or Heartbeat 2.1.3
 
 |Pacemaker 0.6.x
 |Heartbeat 2.0.8
 
 |Heartbeat 2.1.3 (or less)
 |Heartbeat 2.0.4
 
 |Heartbeat 2.0.4 (or less)
 |Heartbeat 2.0.0
 
 |Heartbeat 2.0.0
 |None. Use an alternate upgrade strategy.
 
 |=========================================================
 ====
 
 ==== Detach and Reattach ====
 
 The reattach method is a variant of a complete cluster shutdown, where the
 resources are left active and get re-detected when the cluster is restarted.
 
 This method may not be used if the cluster contains any Pacemaker Remote nodes.
 
 . Tell the cluster to stop managing services. This is required to allow the
   services to remain active after the cluster shuts down.
 +
 ----
-# crm_attribute --type rsc_defaults --name is-managed --update false
-----
-
-. For any resource that has a value for +is-managed+, make sure it is
-set to +false+ so that the cluster will not stop it (replacing $rsc_id
-appropriately):
-+
-----
-# crm_resource -t primitive -r $rsc_id -p is-managed -v false
+# crm_attribute --name maintenance-mode --update true
 ----
 
 . On each node, shut down the cluster software (pacemaker and the messaging
   layer), and upgrade the Pacemaker software. This may also include upgrading
   the messaging layer. While the underlying operating system may be upgraded
   at the same time, that will be more likely to cause outages in the detached
   services (certainly, if a reboot is required).
 . Check the configuration with the `crm_verify` tool.
 . On each node, start the cluster software. The messaging layer can be either
   Corosync or Heartbeat and does not need to be the same one as before the
   upgrade.
 . Verify that the cluster re-detected all resources correctly.
 . Allow the cluster to resume managing resources again:
 +
 ----
-# crm_attribute --type rsc_defaults --name is-managed --update true
+# crm_attribute --name maintenance-mode --delete
 ----
 
-. For any resource that has a value for +is-managed+, reset it to
-  +true+ if desired, to allow the cluster can recover the service if it fails:
-+
-----
-# crm_resource -t primitive -r $rsc_id -p is-managed -v true
-----
-
-[IMPORTANT]
+[NOTE]
 ===========
-Always check your existing configuration is still compatible with the
-version you are installing before starting the cluster.
+Support for maintenance mode was added in Pacemaker 1.0.0. If you are upgrading
+from an earlier version, you can detach by setting +is-managed+ to +false+ for
+all resources.
 ===========
 
 === Upgrading the Configuration ===
 
 indexterm:[upgrade,Configuration]
 indexterm:[Configuration,upgrading]
 
 Pacemaker's configuration -- the Configuration Information Base (CIB) -- has
 its own XML schema version, independent of the Pacemaker software version.
 
 After cluster software is upgraded, the cluster will continue to use
 the older schema version that it was previously using. This can be useful, for
 example, when administrators have written tools that modify the configuration,
 and are based on the older syntax.
 
 However, when using an older syntax, new features may be unavailable, and there
 is a performance impact, since the cluster must do a non-persistent
 configuration upgrade before each transition. So while using the old syntax is
 possible, it is not advisable to continue using it indefinitely.
 
 Even if you wish to continue using the old syntax, it is a good idea to
 follow the upgrade procedure outlined below, except for the last step, to ensure
 that the new software has no problems with your existing configuration (since it
 will perform much the same task internally).
 
 If you are brave, it is sufficient simply to run `cibadmin --upgrade`.
 
 A more cautious approach would proceed like this:
 
 . Create a shadow copy of the configuration. The later commands will automatically
   operate on this copy, rather than the live configuration.
 +
 -----
 # crm_shadow --create shadow
 -----
 . Verify the configuration is valid with the new software (which may be
   stricter about syntax mistakes, or may have dropped support for deprecated
   features):
 indexterm:[Configuration,verify]
 indexterm:[verify,Configuration]
 +
 -----
 # crm_verify --live-check
 -----
 . Fix any errors or warnings.
 . Perform the upgrade:
 +
 -----
 # cibadmin --upgrade
 -----
 . If this step fails, there are three main possibilities:
 .. The configuration was not valid to start with (did you do steps 2 and 3?).
 .. The transformation failed - http://bugs.clusterlabs.org/[report a bug] or
    mailto:users@clusterlabs.org?subject=Transformation%20failed%20during%20upgrade[email the project].
 .. The transformation was successful but produced an invalid result.
 +
 If the result of the transformation is invalid, you may see a number of errors
 from the validation library. If these are not helpful, visit the
 http://clusterlabs.org/wiki/Validation_FAQ[Validation FAQ wiki page] and/or try
-the procedure described below under <<s-upgrade-config-manual>>.
+the manual upgrade procedure described below.
 +        
 . Check the changes:
 +
 -----
 # crm_shadow --diff
 -----
 +
 If at this point there is anything about the upgrade that you wish to fine-tune
 (for example, to change some of the automatic IDs), now is the time to do so:
 +
 -----
 # crm_shadow --edit
 -----
 +
 This will open the configuration in your favorite editor (whichever is
 specified by the standard *$EDITOR* environment variable).
 +
 . Preview how the cluster will react:
 +
 ------
 # crm_simulate --live-check --save-dotfile shadow.dot -S
 # graphviz shadow.dot
 ------
 +
 Verify that either no resource actions will occur or that you are
 happy with any that are scheduled.  If the output contains actions you
 do not expect (possibly due to changes to the score calculations), you
 may need to make further manual changes.  See
 <<s-config-testing-changes>> for further details on how to interpret
 the output of `crm_simulate` and `graphviz`.
 +
 . Upload the changes:
 +
 -----
 # crm_shadow --commit shadow --force
 -----
 +
 In the unlikely event this step fails, please report a bug.
 
 [NOTE]
 ====
-[[s-upgrade-config-manual]]
 indexterm:[Configuration,upgrade manually]
 It is also possible to perform the configuration upgrade steps manually:
 
 . Locate the +upgrade*.xsl+ conversion scripts provided with the source code. These will often
   be installed in a location such as +/usr/share/pacemaker+, or may be obtained from
   the https://github.com/ClusterLabs/pacemaker/tree/master/xml[source repository].
           
 . Run the conversion scripts that apply to your older version, for example:
   indexterm:[XML,convert]
 +
 -----
 # xsltproc /path/to/upgrade06.xsl config06.xml > config10.xml
 -----
 +          
 . Locate the +pacemaker.rng+ script (from the same location as the xsl files).
 . Check the XML validity: indexterm:[validate configuration]indexterm:[Configuration,validate XML]
 +
 ----
 # xmllint --relaxng /path/to/pacemaker.rng config10.xml
 ----
 
 The advantage of this method is that it can be performed without the
 cluster running, and any validation errors are often more informative.
 ====
 
 === What Changed in 1.0 ===
 
 ==== New ====
 
 * Failure timeouts. See <<s-failure-migration>>
 * New section for resource and operation defaults. See <<s-resource-defaults>> and <<s-operation-defaults>>
 * Tool for making offline configuration changes. See <<s-config-sandboxes>>
 * +Rules, instance_attributes, meta_attributes+ and sets of operations can be defined once and referenced in multiple places. See <<s-reusing-config-elements>>
 * The CIB now accepts XPath-based create/modify/delete operations. See the pass:[<command>cibadmin</command>] help text.
 * Multi-dimensional colocation and ordering constraints. See <<s-resource-sets-ordering>> and <<s-resource-sets-colocation>>
 * The ability to connect to the CIB from non-cluster machines. See <<s-remote-connection>>
 * Allow recurring actions to be triggered at known times. See <<s-recurring-start>>
 
 
 ==== Changed ====
 
 * Syntax
 ** All resource and cluster options now use dashes (-) instead of underscores (_)
 ** +master_slave+ was renamed to +master+
 ** The +attributes+ container tag was removed
 ** The operation field +pre-req+ has been renamed +requires+
 ** All operations must have an +interval+, +start+/+stop+ must have it set to zero
 * The +stonith-enabled+ option now defaults to true.
 * The cluster will refuse to start resources if +stonith-enabled+ is true (or unset) and no STONITH resources have been defined
 * The attributes of colocation and ordering constraints were renamed for clarity. See <<s-resource-ordering>> and <<s-resource-colocation>>
 * +resource-failure-stickiness+ has been replaced by +migration-threshold+. See <<s-failure-migration>>
 * The parameters for command-line tools have been made consistent
 * Switched to 'RelaxNG' schema validation and 'libxml2' parser
 ** id fields are now XML IDs which have the following limitations:
 *** id's cannot contain colons (:)
 *** id's cannot begin with a number
 *** id's must be globally unique (not just unique for that tag)
 ** Some fields (such as those in constraints that refer to resources) are IDREFs.
 +
 This means that they must reference existing resources or objects in
 order for the configuration to be valid.  Removing an object which is
 referenced elsewhere will therefore fail.
 +              
 ** The CIB representation, from which an MD5 digest is calculated to verify CIBs on the nodes, has changed.
 +
 This means that every CIB update will require a full refresh on any
 upgraded nodes until the cluster is fully upgraded to 1.0.  This will
 result in significant performance degradation and it is therefore
 highly inadvisable to run a mixed 1.0/0.6 cluster for any longer than
 absolutely necessary.
 +              
 * Ping node information no longer needs to be added to _ha.cf_.
 +
 Simply include the lists of hosts in your ping resource(s).
 
 
 ==== Removed ====
 
 
 * Syntax
 ** It is no longer possible to set resource meta options as top-level
    attributes.  Use meta attributes instead.
 ** Resource and operation defaults are no longer read from
    +crm_config+.  See <<s-resource-defaults>> and
    <<s-operation-defaults>> instead.
diff --git a/doc/Pacemaker_Explained/en-US/Ch-Advanced-Resources.txt b/doc/Pacemaker_Explained/en-US/Ch-Advanced-Resources.txt
index 3fe9d35a10..5f5d0f9192 100644
--- a/doc/Pacemaker_Explained/en-US/Ch-Advanced-Resources.txt
+++ b/doc/Pacemaker_Explained/en-US/Ch-Advanced-Resources.txt
@@ -1,1035 +1,1035 @@
 = Advanced Resource Types =
 
 [[group-resources]]
 == Groups - A Syntactic Shortcut ==
 indexterm:[Group Resources]
 indexterm:[Resources,Groups]
 
 
 One of the most common elements of a cluster is a set of resources
 that need to be located together, start sequentially, and stop in the
 reverse order.  To simplify this configuration, we support the concept
 of groups.
 
 .A group of two primitive resources
 ======
 [source,XML]
 -------
 <group id="shortcut">
    <primitive id="Public-IP" class="ocf" type="IPaddr" provider="heartbeat">
     <instance_attributes id="params-public-ip">
        <nvpair id="public-ip-addr" name="ip" value="192.0.2.2"/>
     </instance_attributes>
    </primitive>
    <primitive id="Email" class="lsb" type="exim"/>
 </group> 
 -------
 ======
 
 
 Although the example above contains only two resources, there is no
 limit to the number of resources a group can contain.  The example is
 also sufficient to explain the fundamental properties of a group:
 
 * Resources are started in the order they appear in (+Public-IP+
   first, then +Email+)
 * Resources are stopped in the reverse of the order in which they appear
   (+Email+ first, then +Public-IP+)
 
 If a resource in the group can't run anywhere, then nothing after that
 is allowed to run, either.
 
 * If +Public-IP+ can't run anywhere, neither can +Email+;
 * but if +Email+ can't run anywhere, this does not affect +Public-IP+
   in any way
 
 The group above is logically equivalent to writing:
 
 .How the cluster sees a group resource
 ======
 [source,XML]
 -------
 <configuration>
    <resources>
     <primitive id="Public-IP" class="ocf" type="IPaddr" provider="heartbeat">
      <instance_attributes id="params-public-ip">
         <nvpair id="public-ip-addr" name="ip" value="192.0.2.2"/>
      </instance_attributes>
     </primitive>
     <primitive id="Email" class="lsb" type="exim"/>
    </resources>
    <constraints>
       <rsc_colocation id="xxx" rsc="Email" with-rsc="Public-IP" score="INFINITY"/>
       <rsc_order id="yyy" first="Public-IP" then="Email"/>
    </constraints>
 </configuration> 
 -------
 ======
 
 Obviously as the group grows bigger, the reduced configuration effort
 can become significant.
 
 Another (typical) example of a group is a DRBD volume, the filesystem
 mount, an IP address, and an application that uses them.
 
 === Group Properties ===
 .Properties of a Group Resource
 [width="95%",cols="3m,5<",options="header",align="center"]
 |=========================================================
 
 |Field
 |Description
 
 |id
 |A unique name for the group
  indexterm:[id,Group Resource Property]
  indexterm:[Resource,Group Property,id]
 
 |=========================================================
 
 === Group Options ===
 
 Groups inherit the +priority+, +target-role+, and +is-managed+ properties
 from primitive resources. See <<s-resource-options>> for information about
 those properties.
 
 === Group Instance Attributes ===
 
 Groups have no instance attributes. However, any that are set for the group
 object will be inherited by the group's children.
 
 === Group Contents ===
 
 Groups may only contain a collection of cluster resources (see
 <<primitive-resource>>).  To refer to a child of a group resource, just use
 the child's +id+ instead of the group's.
 
 === Group Constraints ===
 
 Although it is possible to reference a group's children in
 constraints, it is usually preferable to reference the group itself.
 
 .Some constraints involving groups
 ======
 [source,XML]
 -------
 <constraints>
     <rsc_location id="group-prefers-node1" rsc="shortcut" node="node1" score="500"/>
     <rsc_colocation id="webserver-with-group" rsc="Webserver" with-rsc="shortcut"/>
     <rsc_order id="start-group-then-webserver" first="shortcut" then="Webserver"/>
 </constraints> 
 -------
 ======
 
 === Group Stickiness ===
 indexterm:[resource-stickiness,Groups]
 
 Stickiness, the measure of how much a resource wants to stay where it
 is, is additive in groups.  Every active resource of the group will
 contribute its stickiness value to the group's total.  So if the
 default +resource-stickiness+ is 100, and a group has seven members,
 five of which are active, then the group as a whole will prefer its
 current location with a score of 500.
 
 [[s-resource-clone]]
 == Clones - Resources That Get Active on Multiple Hosts ==
 indexterm:[Clone Resources]
 indexterm:[Resources,Clones]
 
 Clones were initially conceived as a convenient way to start multiple
 instances of an IP address resource and have them distributed throughout the
 cluster for load balancing.  They have turned out to be quite useful for
 a number of purposes including integrating with the Distributed Lock Manager
 (used by many cluster filesystems), the fencing subsystem, and OCFS2.
 
 You can clone any resource, provided the resource agent supports it.
 
 Three types of cloned resources exist:
 
 * Anonymous
 * Globally unique
 * Stateful
 
 'Anonymous' clones are the simplest.  These behave
 completely identically everywhere they are running.  Because of this,
 there can be only one copy of an anonymous clone active per machine.
       
 'Globally unique' clones are distinct entities.  A copy of the clone
 running on one machine is not equivalent to another instance on
 another node, nor would any two copies on the same node be
 equivalent.
 
 'Stateful' clones are covered later in <<s-resource-multistate>>.
 
 .A clone of an LSB resource
 ======
 [source,XML]
 -------
 <clone id="apache-clone">
     <meta_attributes id="apache-clone-meta">
        <nvpair id="apache-unique" name="globally-unique" value="false"/>
     </meta_attributes>
     <primitive id="apache" class="lsb" type="apache"/>
 </clone> 
 -------
 ======
 
 === Clone Properties ===
 
 .Properties of a Clone Resource
 [width="95%",cols="3m,5<",options="header",align="center"]
 |=========================================================
 
 |Field
 |Description
 
 |id
 |A unique name for the clone
  indexterm:[id,Clone Property]
  indexterm:[Clone,Property,id]
 
 |=========================================================
 
 === Clone Options ===
 
 Options inherited from <<s-resource-options,primitive>> resources:
 +priority, target-role, is-managed+
 
 .Clone-specific configuration options
 [width="95%",cols="1m,1,3<",options="header",align="center"]
 |=========================================================
 
 |Field
 |Default
 |Description
 
 |clone-max
 |number of nodes in cluster
 |How many copies of the resource to start
  indexterm:[clone-max,Clone Option]
  indexterm:[Clone,Option,clone-max]
 
 |clone-node-max
 |1
 |How many copies of the resource can be started on a single node
  indexterm:[clone-node-max,Clone Option]
  indexterm:[Clone,Option,clone-node-max]
   
 |clone-min
 |1
 |Require at least this number of clone instances to be runnable before allowing
 resources depending on the clone to be runnable '(since 1.1.14)'
  indexterm:[clone-min,Clone Option]
  indexterm:[Clone,Option,clone-min]
 
 |notify
 |true
 |When stopping or starting a copy of the clone, tell all the other
  copies beforehand and again when the action was successful. Allowed values:
  +false+, +true+
  indexterm:[notify,Clone Option]
  indexterm:[Clone,Option,notify]
 
 |globally-unique
 |false
 |Does each copy of the clone perform a different function? Allowed
  values: +false+, +true+
  indexterm:[globally-unique,Clone Option]
  indexterm:[Clone,Option,globally-unique]
   
 |ordered
 |false
 |Should the copies be started in series (instead of in
  parallel)? Allowed values: +false+, +true+
  indexterm:[ordered,Clone Option]
  indexterm:[Clone,Option,ordered]
 
 |interleave
 |false
 |If this clone depends on another clone via an ordering constraint,
 is it allowed to start after the local instance of the other clone
 starts, rather than wait for all instances of the other clone to start?
 Allowed values: +false+, +true+
  indexterm:[interleave,Clone Option]
  indexterm:[Clone,Option,interleave]
 
 |=========================================================
 
 === Clone Instance Attributes ===
 
 Clones have no instance attributes; however, any that are set here
 will be inherited by the clone's children.
 
 === Clone Contents ===
 
 Clones must contain exactly one primitive or group resource.
 
 [WARNING]
 You should never reference the name of a clone's child.
 If you think you need to do this, you probably need to re-evaluate your design.
 
 === Clone Constraints ===
 
 In most cases, a clone will have a single copy on each active cluster
 node.  If this is not the case, you can indicate which nodes the
 cluster should preferentially assign copies to with resource location
 constraints.  These constraints are written no differently from those
 for primitive resources except that the clone's +id+ is used.
 
 .Some constraints involving clones
 ======
 [source,XML]
 -------
 <constraints>
     <rsc_location id="clone-prefers-node1" rsc="apache-clone" node="node1" score="500"/>
     <rsc_colocation id="stats-with-clone" rsc="apache-stats" with-rsc="apache-clone"/>
     <rsc_order id="start-clone-then-stats" first="apache-clone" then="apache-stats"/>
 </constraints> 
 -------
 ======
 
 Ordering constraints behave slightly differently for clones.  In the
 example above, +apache-stats+ will wait until all copies of +apache-clone+
 that need to be started have done so before being started itself.
 Only if _no_ copies can be started will +apache-stats+ be prevented
 from being active.  Additionally, the clone will wait for
 +apache-stats+ to be stopped before stopping itself.
 
 Colocation of a primitive or group resource with a clone means that
 the resource can run on any machine with an active copy of the clone.
 The cluster will choose a copy based on where the clone is running and
 the resource's own location preferences.
 
 Colocation between clones is also possible.  If one clone +A+ is colocated
 with another clone +B+, the set of allowed locations for +A+ is limited to
 nodes on which +B+ is (or will be) active.  Placement is then performed
 normally.
 
 [[s-clone-stickiness]]
 === Clone Stickiness ===
 
 indexterm:[resource-stickiness,Clones]
 
 To achieve a stable allocation pattern, clones are slightly sticky by
 default.  If no value for +resource-stickiness+ is provided, the clone
 will use a value of 1.  Being a small value, it causes minimal
 disturbance to the score calculations of other resources but is enough
 to prevent Pacemaker from needlessly moving copies around the cluster.
 
 [NOTE]
 ====
 For globally unique clones, this may result in multiple instances of the
 clone staying on a single node, even after another eligible node becomes
 active (for example, after being put into standby mode then made active again).
 If you do not want this behavior, specify a +resource-stickiness+ of 0
 for the clone temporarily and let the cluster adjust, then set it back
 to 1 if you want the default behavior to apply again.
 ====
 
 === Clone Resource Agent Requirements ===
 
 Any resource can be used as an anonymous clone, as it requires no
 additional support from the resource agent.  Whether it makes sense to
 do so depends on your resource and its resource agent.
 
 Globally unique clones do require some additional support in the
 resource agent.  In particular, it must only respond with
 +$\{OCF_SUCCESS}+ if the node has that exact instance active.  All
 other probes for instances of the clone should result in
 +$\{OCF_NOT_RUNNING}+ (or one of the other OCF error codes if
 they are failed).
 
 Individual instances of a clone are identified by appending a colon and a
 numerical offset, e.g. +apache:2+.
 
 Resource agents can find out how many copies there are by examining
 the +OCF_RESKEY_CRM_meta_clone_max+ environment variable and which
 copy it is by examining +OCF_RESKEY_CRM_meta_clone+.
 
 The resource agent must not make any assumptions (based on
 +OCF_RESKEY_CRM_meta_clone+) about which numerical instances are active.  In
 particular, the list of active copies will not always be an unbroken
 sequence, nor always start at 0.
 
 ==== Clone Notifications ====
 
 Supporting notifications requires the +notify+ action to be
 implemented.  If supported, the notify action will be passed a
 number of extra variables which, when combined with additional
 context, can be used to calculate the current state of the cluster and
 what is about to happen to it.
 
 .Environment variables supplied with Clone notify actions
 [width="95%",cols="5,3<",options="header",align="center"]
 |=========================================================
 
 |Variable
 |Description
 
 |OCF_RESKEY_CRM_meta_notify_type
 |Allowed values: +pre+, +post+
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,type]
  indexterm:[type,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_operation
 |Allowed values: +start+, +stop+
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,operation]
  indexterm:[operation,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_start_resource
 |Resources to be started
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,start_resource]
  indexterm:[start_resource,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_stop_resource
 |Resources to be stopped
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,stop_resource]
  indexterm:[stop_resource,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_active_resource
 |Resources that are running
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,active_resource]
  indexterm:[active_resource,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_inactive_resource
 |Resources that are not running
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,inactive_resource]
  indexterm:[inactive_resource,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_start_uname
 |Nodes on which resources will be started
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,start_uname]
  indexterm:[start_uname,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_stop_uname
 |Nodes on which resources will be stopped
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,stop_uname]
  indexterm:[stop_uname,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_active_uname
 |Nodes on which resources are running
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,active_uname]
  indexterm:[active_uname,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_inactive_uname
 |Nodes on which resources are not running
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,inactive_uname]
  indexterm:[inactive_uname,Notification Environment Variable]
 
 |=========================================================
 
 The variables come in pairs, such as
 +OCF_RESKEY_CRM_meta_notify_start_resource+ and
 +OCF_RESKEY_CRM_meta_notify_start_uname+ and should be treated as an
 array of whitespace-separated elements.
 
 Thus in order to indicate that +clone:0+ will be started on +sles-1+,
 +clone:2+ will be started on +sles-3+, and +clone:3+ will be started
 on +sles-2+, the cluster would set
 
 .Notification variables
 ======
 [source,Bash]
 -------
 OCF_RESKEY_CRM_meta_notify_start_resource="clone:0 clone:2 clone:3"
 OCF_RESKEY_CRM_meta_notify_start_uname="sles-1 sles-3 sles-2"
 -------
 ======
 
 ==== Proper Interpretation of Notification Environment Variables ====
 
 .Pre-notification (stop):
 
 * Active resources: +$OCF_RESKEY_CRM_meta_notify_active_resource+
 * Inactive resources: +$OCF_RESKEY_CRM_meta_notify_inactive_resource+
 * Resources to be started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources to be stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 
 
 .Post-notification (stop) / Pre-notification (start):
 
 * Active resources
 ** +$OCF_RESKEY_CRM_meta_notify_active_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 * Inactive resources
 ** +$OCF_RESKEY_CRM_meta_notify_inactive_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_stop_resource+ 
 * Resources that were started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources that were stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 
 
 .Post-notification (start):
 
 * Active resources:
 ** +$OCF_RESKEY_CRM_meta_notify_active_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Inactive resources:
 ** +$OCF_RESKEY_CRM_meta_notify_inactive_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources that were started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources that were stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 
 [[s-resource-multistate]]
 == Multi-state - Resources That Have Multiple Modes ==
 
 indexterm:[Multi-state Resources]
 indexterm:[Resources,Multi-state]
 
 Multi-state resources are a specialization of clone resources; please
 ensure you understand <<s-resource-clone>> before continuing!
 
 Multi-state resources allow the instances to be in one of two operating modes
 (called 'roles'). The roles are called 'master' and 'slave', but can mean
 whatever you wish them to mean. The only limitation is that when an instance is
 started, it must come up in the slave role.
 
 === Multi-state Properties ===
 
 .Properties of a Multi-State Resource
 [width="95%",cols="3m,5<",options="header",align="center"]
 |=========================================================
 
 |Field
 |Description
 
 |id
 |Your name for the multi-state resource
  indexterm:[id,Multi-State Property]
  indexterm:[Multi-State,Property,id]
 
 |=========================================================
 
 === Multi-state Options ===
 
 Options inherited from <<s-resource-options,primitive>> resources:
 +priority+, +target-role+, +is-managed+
 
 Options inherited from <<s-resource-clone,clone>> resources:
 +clone-max+, +clone-node-max+, +notify+, +globally-unique+, +ordered+,
 +interleave+
 
 .Multi-state-specific resource configuration options
 [width="95%",cols="1m,1,3<",options="header",align="center"]
 |=========================================================
 
 |Field
 |Default
 |Description
 
 |master-max
 |1
 |How many copies of the resource can be promoted to the +master+ role
  indexterm:[master-max,Multi-State Option]
  indexterm:[Multi-State,Option,master-max]
 
 |master-node-max
 |1
 |How many copies of the resource can be promoted to the +master+ role on
  a single node
  indexterm:[master-node-max,Multi-State Option]
  indexterm:[Multi-State,Option,master-node-max]
 
 |=========================================================
 
 === Multi-state Instance Attributes ===
 
 Multi-state resources have no instance attributes; however, any that
 are set here will be inherited by a master's children.
 
 === Multi-state Contents ===
 
 Masters must contain exactly one primitive or group resource.
 
 [WARNING]
 You should never reference the name of a master's child.
 If you think you need to do this, you probably need to re-evaluate your design.
 
 === Monitoring Multi-State Resources ===
 
 The usual monitor actions are insufficient to monitor a multi-state resource,
 because pacemaker needs to verify not only that the resource is active, but
 also that its actual role matches its intended one.
 
 Define two monitoring actions: the usual one will cover the slave role,
 and an additional one with +role="Master"+ will cover the master role.
 
 .Monitoring both states of a multi-state resource
 ======
 [source,XML]
 -------
 <master id="myMasterRsc">
    <primitive id="myRsc" class="ocf" type="myApp" provider="myCorp">
     <operations>
      <op id="public-ip-slave-check" name="monitor" interval="60"/>
      <op id="public-ip-master-check" name="monitor" interval="61" role="Master"/>
     </operations>
    </primitive>
 </master> 
 -------
 ======
 
 [IMPORTANT]
 ===========
 It is crucial that _every_ monitor operation has a different interval!
 Pacemaker currently differentiates between operations
 only by resource and interval; so if (for example) a master/slave resource had
 the same monitor interval for both roles, Pacemaker would ignore the
 role when checking the status -- which would cause unexpected return
 codes, and therefore unnecessary complications.
 ===========
 
 === Multi-state Constraints ===
 
 In most cases, multi-state resources will have a single copy on each
 active cluster node.  If this is not the case, you can indicate which
 nodes the cluster should preferentially assign copies to with resource
 location constraints.  These constraints are written no differently from
 those for primitive resources except that the master's +id+ is used.
 
 When considering multi-state resources in constraints, for most
 purposes it is sufficient to treat them as clones. The exception is
 that the +first-action+ and/or +then-action+ fields for ordering constraints
 may be set to +promote+ or +demote+ to constrain the master role,
 and colocation constraints may contain +rsc-role+ and/or +with-rsc-role+
 fields.
           
 .Additional colocation constraint options for multi-state resources
 [width="95%",cols="1m,1,3<",options="header",align="center"]
 |=========================================================
 
 |Field
 |Default
 |Description
 
 |rsc-role
 |Started
 |An additional attribute of colocation constraints that specifies the
  role that +rsc+ must be in.  Allowed values: +Started+, +Master+,
  +Slave+.
  indexterm:[rsc-role,Colocation Constraints]
  indexterm:[Constraints,Colocation,rsc-role]
 
 |with-rsc-role
 |Started
 |An additional attribute of colocation constraints that specifies the
  role that +with-rsc+ must be in.  Allowed values: +Started+,
  +Master+, +Slave+.
  indexterm:[with-rsc-role,Colocation Constraints]
  indexterm:[Constraints,Colocation,with-rsc-role]
 
 |=========================================================
 
 .Constraints involving multi-state resources       
 ======
 [source,XML]
 -------
 <constraints>
    <rsc_location id="db-prefers-node1" rsc="database" node="node1" score="500"/>
    <rsc_colocation id="backup-with-db-slave" rsc="backup"
      with-rsc="database" with-rsc-role="Slave"/>
    <rsc_colocation id="myapp-with-db-master" rsc="myApp"
      with-rsc="database" with-rsc-role="Master"/>
    <rsc_order id="start-db-before-backup" first="database" then="backup"/>
    <rsc_order id="promote-db-then-app" first="database" first-action="promote"
      then="myApp" then-action="start"/>
 </constraints> 
 -------
 ======
 
 In the example above, +myApp+ will wait until one of the database
 copies has been started and promoted to master before being started
 itself on the same node.  Only if no copies can be promoted will +myApp+ be
 prevented from being active.  Additionally, the cluster will wait for
 +myApp+ to be stopped before demoting the database.
 
 Colocation of a primitive or group resource with a multi-state
 resource means that it can run on any machine with an active copy of
 the multi-state resource that has the specified role (+master+ or
 +slave+).  In the example above, the cluster will choose a location based on
 where database is running as a +master+, and if there are multiple
 +master+ instances it will also factor in +myApp+'s own location
 preferences when deciding which location to choose.
 
 Colocation with regular clones and other multi-state resources is also
 possible.  In such cases, the set of allowed locations for the +rsc+
 clone is (after role filtering) limited to nodes on which the
 +with-rsc+ multi-state resource is (or will be) in the specified role.
 Placement is then performed as normal.
 
 ==== Using Multi-state Resources in Colocation Sets ====
 
 .Additional colocation set options relevant to multi-state resources
 [width="95%",cols="1m,1,6<",options="header",align="center"]
 |=========================================================
 
 |Field
 |Default
 |Description
 
 |role
 |Started
 |The role that 'all members' of the set must be in.  Allowed values: +Started+, +Master+,
  +Slave+.
  indexterm:[role,Colocation Constraints]
  indexterm:[Constraints,Colocation,role]
 
 |=========================================================
 
 In the following example +B+'s master must be located on the same node as +A+'s master.
 Additionally resources +C+ and +D+ must be located on the same node as +A+'s
 and +B+'s masters.
 
 .Colocate C and D with A's and B's master instances
 ======
 [source,XML]
 -------
 <constraints>
     <rsc_colocation id="coloc-1" score="INFINITY" >
       <resource_set id="colocated-set-example-1" sequential="true" role="Master">
         <resource_ref id="A"/>
         <resource_ref id="B"/>
       </resource_set>
       <resource_set id="colocated-set-example-2" sequential="true">
         <resource_ref id="C"/>
         <resource_ref id="D"/>
       </resource_set>
     </rsc_colocation>
 </constraints>
 -------
 ======
 
 ==== Using Multi-state Resources in Ordering Sets ====
 
 .Additional ordered set options relevant to multi-state resources
 [width="95%",cols="1m,1,3<",options="header",align="center"]
 |=========================================================
 
 |Field
 |Default
 |Description
 
 |action
 |value of +first-action+
 |An additional attribute of ordering constraint sets that specifies the
  action that applies to 'all members' of the set.  Allowed
  values: +start+, +stop+, +promote+, +demote+.
  indexterm:[action,Ordering Constraints]
  indexterm:[Constraints,Ordering,action]
 
 |=========================================================
 
 .Start C and D after first promoting A and B
 ======
 [source,XML]
 -------
 <constraints>
     <rsc_order id="order-1" score="INFINITY" >
       <resource_set id="ordered-set-1" sequential="true" action="promote">
         <resource_ref id="A"/>
         <resource_ref id="B"/>
       </resource_set>
       <resource_set id="ordered-set-2" sequential="true" action="start">
         <resource_ref id="C"/>
         <resource_ref id="D"/>
       </resource_set>
     </rsc_order>
 </constraints>
 -------
 ======
 
 In the above example, +B+ cannot be promoted to a master role until +A+ has
 been promoted. Additionally, resources +C+ and +D+ must wait until +A+ and +B+
 have been promoted before they can start.
 
 
 === Multi-state Stickiness ===
 
 indexterm:[resource-stickiness,Multi-State]
 As with regular clones, multi-state resources are
 slightly sticky by default. See <<s-clone-stickiness>> for details.
 
 === Which Resource Instance is Promoted ===
 
 During the start operation, most resource agents should call
 the `crm_master` utility.  This tool automatically detects both the
 resource and host and should be used to set a preference for being
 promoted.  Based on this, +master-max+, and +master-node-max+, the
 instance(s) with the highest preference will be promoted.
 
 An alternative is to create a location constraint that
 indicates which nodes are most preferred as masters.
 
 .Explicitly preferring node1 to be promoted to master
 ======
 [source,XML]
 -------
 <rsc_location id="master-location" rsc="myMasterRsc">
     <rule id="master-rule" score="100" role="Master">
       <expression id="master-exp" attribute="#uname" operation="eq" value="node1"/>
     </rule>
 </rsc_location> 
 -------
 ======
 
 === Requirements for Multi-state Resource Agents ===
 
 Since multi-state resources are an extension of cloned resources, all
 the requirements for resource agents that support clones are also requirements
 for resource agents that support multi-state resources.
 
 Additionally, multi-state resources require two extra
 actions, +demote+ and +promote+, which are responsible for
 changing the state of the resource.  Like +start+ and +stop+, they
 should return +$\{OCF_SUCCESS}+ if they completed successfully or a
 relevant error code if they did not.
 
 The states can mean whatever you wish, but when the resource is
 started, it must come up in the mode called +slave+.  From there the
 cluster will decide which instances to promote to +master+.
 
 In addition to the clone requirements for monitor actions, agents must
 also _accurately_ report which state they are in.  The cluster relies
 on the agent to report its status (including role) accurately and does
 not indicate to the agent what role it currently believes it to be in.
 
 .Role implications of OCF return codes
 [width="95%",cols="1,1<",options="header",align="center"]
 |=========================================================
 
 |Monitor Return Code
 |Description
 
 |OCF_NOT_RUNNING
 |Stopped
  indexterm:[Return Code,OCF_NOT_RUNNING]
  
 |OCF_SUCCESS
 |Running (Slave)
  indexterm:[Return Code,OCF_SUCCESS]
  
 |OCF_RUNNING_MASTER
 |Running (Master)
  indexterm:[Return Code,OCF_RUNNING_MASTER]
 
 |OCF_FAILED_MASTER
 |Failed (Master)
  indexterm:[Return Code,OCF_FAILED_MASTER]
  
 |Other
 |Failed (Slave)
 
 |=========================================================
 
 ==== Multi-state Notifications ====
 
 Like clones, supporting notifications requires the +notify+ action to
 be implemented.  If supported, the notify action will be passed a
 number of extra variables which, when combined with additional
 context, can be used to calculate the current state of the cluster and
 what is about to happen to it.
           
 .Environment variables supplied with multi-state notify actions footnote:[Emphasized variables are specific to +Master+ resources, and all behave in the same manner as described for Clone resources.]
 [width="95%",cols="5,3<",options="header",align="center"]
 |=========================================================
 
 |Variable
 |Description
 
 |OCF_RESKEY_CRM_meta_notify_type
 |Allowed values: +pre+, +post+
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,type]
  indexterm:[type,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_operation
 |Allowed values: +start+, +stop+, +promote+, +demote+
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,operation]
  indexterm:[operation,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_active_resource
-|Resources the that are running
+|Resources that are running
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,active_resource]
  indexterm:[active_resource,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_inactive_resource
-|Resources the that are not running
+|Resources that are not running
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,inactive_resource]
  indexterm:[inactive_resource,Notification Environment Variable]
   
 |_OCF_RESKEY_CRM_meta_notify_master_resource_
 |Resources that are running in +Master+ mode
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,master_resource]
  indexterm:[master_resource,Notification Environment Variable]
 
 |_OCF_RESKEY_CRM_meta_notify_slave_resource_
 |Resources that are running in +Slave+ mode
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,slave_resource]
  indexterm:[slave_resource,Notification Environment Variable]
    
 |OCF_RESKEY_CRM_meta_notify_start_resource
 |Resources to be started
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,start_resource]
  indexterm:[start_resource,Notification Environment Variable]
   
-|indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,stop_resource]
- indexterm:[stop_resource,Notification Environment Variable]
-  OCF_RESKEY_CRM_meta_notify_stop_resource
+|OCF_RESKEY_CRM_meta_notify_stop_resource
 |Resources to be stopped
+ indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,stop_resource]
+ indexterm:[stop_resource,Notification Environment Variable]
 
 |_OCF_RESKEY_CRM_meta_notify_promote_resource_
 |Resources to be promoted
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,promote_resource]
  indexterm:[promote_resource,Notification Environment Variable]
    
 |_OCF_RESKEY_CRM_meta_notify_demote_resource_
 |Resources to be demoted
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,demote_resource]
  indexterm:[demote_resource,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_start_uname
 |Nodes on which resources will be started
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,start_uname]
  indexterm:[start_uname,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_stop_uname
 |Nodes on which resources will be stopped
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,stop_uname]
  indexterm:[stop_uname,Notification Environment Variable]
 
 |_OCF_RESKEY_CRM_meta_notify_promote_uname_
-|Nodes on which resources will be promote
+|Nodes on which resources will be promoted
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,promote_uname]
  indexterm:[promote_uname,Notification Environment Variable]
 
 |_OCF_RESKEY_CRM_meta_notify_demote_uname_
 |Nodes on which resources will be demoted
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,demote_uname]
  indexterm:[demote_uname,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_active_uname
 |Nodes on which resources are running
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,active_uname]
  indexterm:[active_uname,Notification Environment Variable]
 
 |OCF_RESKEY_CRM_meta_notify_inactive_uname
 |Nodes on which resources are not running
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,inactive_uname]
  indexterm:[inactive_uname,Notification Environment Variable]
 
 |_OCF_RESKEY_CRM_meta_notify_master_uname_
 |Nodes on which resources are running in +Master+ mode
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,master_uname]
  indexterm:[master_uname,Notification Environment Variable]
 
 |_OCF_RESKEY_CRM_meta_notify_slave_uname_
 |Nodes on which resources are running in +Slave+ mode
  indexterm:[Environment Variable,OCF_RESKEY_CRM_meta_notify_,slave_uname]
  indexterm:[slave_uname,Notification Environment Variable]
 
 |=========================================================
 
 ==== Proper Interpretation of Multi-state Notification Environment Variables ====
 
 
 .Pre-notification (demote):
 
 * +Active+ resources: +$OCF_RESKEY_CRM_meta_notify_active_resource+
 * +Master+ resources: +$OCF_RESKEY_CRM_meta_notify_master_resource+
 * +Slave+ resources: +$OCF_RESKEY_CRM_meta_notify_slave_resource+
 * Inactive resources: +$OCF_RESKEY_CRM_meta_notify_inactive_resource+
 * Resources to be started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources to be promoted: +$OCF_RESKEY_CRM_meta_notify_promote_resource+
 * Resources to be demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 * Resources to be stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 
 
 .Post-notification (demote) / Pre-notification (stop):
 
 * +Active+ resources: +$OCF_RESKEY_CRM_meta_notify_active_resource+
 * +Master+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_master_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_demote_resource+ 
 * +Slave+ resources: +$OCF_RESKEY_CRM_meta_notify_slave_resource+
 * Inactive resources: +$OCF_RESKEY_CRM_meta_notify_inactive_resource+
 * Resources to be started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources to be promoted: +$OCF_RESKEY_CRM_meta_notify_promote_resource+
 * Resources to be demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 * Resources to be stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 * Resources that were demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 
 
 .Post-notification (stop) / Pre-notification (start)
 
 * +Active+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_active_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_stop_resource+ 
 * +Master+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_master_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_demote_resource+ 
 * +Slave+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_slave_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_stop_resource+ 
 * Inactive resources:
 ** +$OCF_RESKEY_CRM_meta_notify_inactive_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_stop_resource+ 
 * Resources to be started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources to be promoted: +$OCF_RESKEY_CRM_meta_notify_promote_resource+
 * Resources to be demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 * Resources to be stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 * Resources that were demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 * Resources that were stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 
 
 .Post-notification (start) / Pre-notification (promote)
 
 * +Active+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_active_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_start_resource+ 
 * +Master+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_master_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_demote_resource+ 
 * +Slave+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_slave_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_start_resource+ 
 * Inactive resources:
 ** +$OCF_RESKEY_CRM_meta_notify_inactive_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_start_resource+           
 * Resources to be started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources to be promoted: +$OCF_RESKEY_CRM_meta_notify_promote_resource+
 * Resources to be demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 * Resources to be stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 * Resources that were started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources that were demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 * Resources that were stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 
 .Post-notification (promote)
 
 * +Active+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_active_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_start_resource+ 
 * +Master+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_master_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_promote_resource+
 * +Slave+ resources:
 ** +$OCF_RESKEY_CRM_meta_notify_slave_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_start_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_promote_resource+ 
 * Inactive resources:
 ** +$OCF_RESKEY_CRM_meta_notify_inactive_resource+
 ** plus +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 ** minus +$OCF_RESKEY_CRM_meta_notify_start_resource+ 
 * Resources to be started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources to be promoted: +$OCF_RESKEY_CRM_meta_notify_promote_resource+
 * Resources to be demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 * Resources to be stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
 * Resources that were started: +$OCF_RESKEY_CRM_meta_notify_start_resource+
 * Resources that were promoted: +$OCF_RESKEY_CRM_meta_notify_promote_resource+
 * Resources that were demoted: +$OCF_RESKEY_CRM_meta_notify_demote_resource+
 * Resources that were stopped: +$OCF_RESKEY_CRM_meta_notify_stop_resource+
diff --git a/doc/Pacemaker_Remote/en-US/Ch-Options.txt b/doc/Pacemaker_Remote/en-US/Ch-Options.txt
index 0879be57be..87663f8727 100644
--- a/doc/Pacemaker_Remote/en-US/Ch-Options.txt
+++ b/doc/Pacemaker_Remote/en-US/Ch-Options.txt
@@ -1,136 +1,136 @@
 = Configuration Explained =
 
 The walk-through examples use some of these options, but don't explain exactly
 what they mean or do.  This section is meant to be the go-to resource for all
 the options available for configuring pacemaker_remote-based nodes.
 (((configuration)))
 
 == Resource Meta-Attributes for Guest Nodes ==
 
 When configuring a virtual machine as a guest node, the virtual machine is
 created using one of the usual resource agents for that purpose (for example,
 ocf:heartbeat:VirtualDomain or ocf:heartbeat:Xen), with additional metadata
 parameters.
 
 No restrictions are enforced on what agents may be used to create a guest node,
 but obviously the agent must create a distinct environment capable of running
 the pacemaker_remote daemon and cluster resources. An additional requirement is
 that fencing the host running the guest node resource must be sufficient for
 ensuring the guest node is stopped. This means, for example, that not all
 hypervisors supported by VirtualDomain may be used to create guest nodes; if
 the guest can survive the hypervisor being fenced, it may not be used as a
 guest node.
 
 Below are the metadata options available to enable a resource as a guest node
 and define its connection parameters.
 
 .Meta-attributes for configuring VM resources as guest nodes
 [width="95%",cols="2m,1,4<",options="header",align="center"]
 |=========================================================
 
 |Option
 |Default
 |Description
 
 |remote-node
 |'none'
 |The node name of the guest node this resource defines. This both enables the
 resource as a guest node and defines the unique name used to identify the
 guest node. If no other parameters are set, this value will also be assumed as
 the hostname to use when connecting to pacemaker_remote on the VM. This value
 *must not* overlap with any resource or node IDs.
 
 |remote-port
 |3121
 |The port on the virtual machine that the cluster will use to connect to
 pacemaker_remote.
 
 |remote-addr
 |'value of' +remote-node+
 |The IP address or hostname to use when connecting to pacemaker_remote on the VM.
 
 |remote-connect-timeout
 |60s
 |How long before a pending guest connection will time out.
 
 |=========================================================
 
 == Connection Resources for Remote Nodes ==
 
 A remote node is defined by a connection resource. That connection resource
 has instance attributes that define where the remote node is located on the
 network and how to communicate with it.
 
 Descriptions of these instance attributes can be retrieved using the following
 `pcs` command:
 ----
 # pcs resource describe remote
 ocf:pacemaker:remote - remote resource agent
 
 Resource options:
   server: Server location to connect to. This can be an ip address or hostname.
   port: tcp port to connect to.
   reconnect_interval: Interval in seconds at which Pacemaker will attempt to
 		      reconnect to a remote node after an active connection to
 		      the remote node has been severed. When this value is
 		      nonzero, Pacemaker will retry the connection
 		      indefinitely, at the specified interval. As with any
 		      time-based actions, this is not guaranteed to be checked
 		      more frequently than the value of the
                       cluster-recheck-interval cluster option.
 ----
 
 When defining a remote node's connection resource, it is common and recommended
 to name the connection resource the same as the remote node's hostname. By
 default, if no *server* option is provided, the cluster will attempt to contact
 the remote node using the resource name as the hostname.
 
 Example defining a remote node with the hostname *remote1*:
 ----
 # pcs resource create remote1 remote
 ----
 
 Example defining a remote node to connect to a specific IP address and port:
 ----
 # pcs resource create remote1 remote server=192.168.122.200 port=8938
 ----
 
 == Environment Variables for Daemon Start-up ==
 
 Authentication and encryption of the connection between cluster nodes
 and nodes running pacemaker_remote is achieved using
 https://en.wikipedia.org/wiki/TLS-PSK[TLS-PSK] encryption/authentication
 over TCP (port 3121 by default). This means that both the cluster node and
 remote node must share the same private key. By default, this
 key is placed at +/etc/pacemaker/authkey+ on each node.
 
 You can change the default port and/or key location for Pacemaker and
 pacemaker_remote via environment variables. How these variables are set varies
 by OS, but usually they are set in the +/etc/sysconfig/pacemaker+ or
 +/etc/default/pacemaker+ file.
 
 ----
 #==#==# Pacemaker Remote
 # Use a custom directory for finding the authkey.
 PCMK_authkey_location=/etc/pacemaker/authkey
 #
 # Specify a custom port for Pacemaker Remote connections
 PCMK_remote_port=3121
 ----
 
 == Removing Remote Nodes and Guest Nodes ==
 
 If the resource creating a guest node, or the *ocf:pacemaker:remote* resource
 creating a connection to a remote node, is removed from the configuration, the
 affected node will continue to show up in output as an offline node.
 
 If you want to get rid of that output, run (replacing $NODE_NAME appropriately):
 ----
 # crm_node --force --remove $NODE_NAME
 ----
 
 [WARNING]
 =========
-Be absolutely sure that the node's resource has been deleted from the
-configuration first.
+Be absolutely sure that there are no references to the node's resource in the
+configuration before running the above command.
 =========
diff --git a/tools/crm_node.c b/tools/crm_node.c
index e8a71cf937..d927f31764 100644
--- a/tools/crm_node.c
+++ b/tools/crm_node.c
@@ -1,1003 +1,1002 @@
 /* 
  * Copyright (C) 2004 Andrew Beekhof <andrew@beekhof.net>
  * 
  * This program is free software; you can redistribute it and/or
  * modify it under the terms of the GNU General Public
  * License as published by the Free Software Foundation; either
  * version 2 of the License, or (at your option) any later version.
  * 
  * This software is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * General Public License for more details.
  * 
  * You should have received a copy of the GNU General Public
  * License along with this library; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
  */
 
 #include <crm_internal.h>
 
 #include <sys/param.h>
 #include <stdio.h>
 #include <sys/types.h>
 #include <unistd.h>
 
 #include <stdlib.h>
 #include <errno.h>
 #include <fcntl.h>
 
 #include <libgen.h>             /* for basename() */
 
 #include <crm/crm.h>
 #include <crm/cluster/internal.h>
 #include <crm/common/mainloop.h>
 #include <crm/msg_xml.h>
 #include <crm/cib.h>
 #include <crm/attrd.h>
 
 /*
  * File-scope state for the tool.
  * 'command' is compared against option characters ('q', 'l', 'p', 'i') in
  * node_mcp_dispatch(); presumably it is set during option parsing, which is
  * not visible here -- confirm.
  */
 int command = 0;
 int ccm_fd = 0;
 gboolean do_quiet = FALSE;
 
 /* target_uname is the node handed to tools_remove_node_cache() by the 'R'
  * command in try_pacemaker(); the remaining values are used elsewhere in
  * the file */
 char *target_uuid = NULL;
 char *target_uname = NULL;
 const char *standby_value = NULL;
 const char *standby_scope = NULL;
 
 /* *INDENT-OFF* */
 /*
  * Command-line options understood by this tool.  Which stack-selection
  * entries are present depends on the SUPPORT_* build-time macros.
  * NOTE(review): the meaning of each positional field is defined by
  * struct crm_option (declared elsewhere); entries named "-spacer-" appear
  * to carry only help-text headings -- confirm against the option parser.
  */
 static struct crm_option long_options[] = {
     /* Top-level Options */
     {"help",       0, 0, '?', "\tThis text"},
     {"version",    0, 0, '$', "\tVersion information"  },
     {"verbose",    0, 0, 'V', "\tIncrease debug output"},
     {"quiet",      0, 0, 'Q', "\tEssential output only"},
 
     {"-spacer-",   1, 0, '-', "\nStack:"},
 #if SUPPORT_CMAN
     {"cman",       0, 0, 'c', "\tOnly try connecting to a cman-based cluster"},
 #endif
 #if SUPPORT_COROSYNC
     {"openais",    0, 0, 'A', "\tOnly try connecting to an OpenAIS-based cluster"},
 #endif
 #ifdef SUPPORT_CS_QUORUM
     {"corosync",   0, 0, 'C', "\tOnly try connecting to an Corosync-based cluster"},
 #endif
 #ifdef SUPPORT_HEARTBEAT
     {"heartbeat",  0, 0, 'H', "Only try connecting to a Heartbeat-based cluster"},
 #endif
     
     {"-spacer-",      1, 0, '-', "\nCommands:"},
     {"name",	      0, 0, 'n', "\tDisplay the name used by the cluster for this node"},
     {"name-for-id",   1, 0, 'N', "\tDisplay the name used by the cluster for the node with the specified id"},
     {"epoch",	      0, 0, 'e', "\tDisplay the epoch during which this node joined the cluster"},
     {"quorum",        0, 0, 'q', "\tDisplay a 1 if our partition has quorum, 0 if not"},
     {"list",          0, 0, 'l', "\tDisplay all known members (past and present) of this cluster (Not available for heartbeat clusters)"},
     {"partition",     0, 0, 'p', "Display the members of this partition"},
     {"cluster-id",    0, 0, 'i', "Display this node's cluster id"},
     {"remove",        1, 0, 'R', "(Advanced) Remove the (stopped) node with the specified name from Pacemaker's configuration and caches"},
     {"-spacer-",      1, 0, '-', "In the case of Heartbeat, CMAN and Corosync 2.0, requires that the node has already been removed from the underlying cluster"},
 
     {"-spacer-", 1, 0, '-', "\nAdditional Options:"},
     {"force",	 0, 0, 'f'},
 
     {0, 0, 0, 0}
 };
 /* *INDENT-ON* */
 
 /*
  * Delete a node's entries from the nodes and status sections of the CIB.
  *
  * id:   cluster node id, or 0 if it is not known
  * name: node name, or NULL if it is not known
  *
  * Returns -ENOTUNIQ when neither identifier was supplied.  Otherwise the
  * result of the status-section deletion is returned; a failed deletion
  * from the nodes section is reported on stdout but does not change the
  * return value.
  */
 static int
 cib_remove_node(uint32_t id, const char *name)
 {
     int rc;
     cib_t *cib = NULL;
     xmlNode *node = NULL;
     xmlNode *node_state = NULL;
 
     crm_trace("Removing %s from the CIB", name);
 
-    /* TODO: Use 'id' instead */
     if(name == NULL && id == 0) {
         return -ENOTUNIQ;
     }
 
     /* Build one match object per CIB section we are going to prune */
     node = create_xml_node(NULL, XML_CIB_TAG_NODE);
     node_state = create_xml_node(NULL, XML_CIB_TAG_STATE);
 
     crm_xml_add(node, XML_ATTR_UNAME, name);
     crm_xml_add(node_state, XML_ATTR_UNAME, name);
     if(id) {
         char buffer[64];
         if(snprintf(buffer, 63, "%u", id) > 0) {
             crm_xml_add(node, XML_ATTR_ID, buffer);
             crm_xml_add(node_state, XML_ATTR_ID, buffer);
         }
     }
 
     cib = cib_new();
     cib->cmds->signon(cib, crm_system_name, cib_command);
 
     rc = cib->cmds->delete(cib, XML_CIB_TAG_NODES, node, cib_sync_call);
     if (rc != pcmk_ok) {
         printf("Could not remove %s/%u from " XML_CIB_TAG_NODES ": %s", name, id, pcmk_strerror(rc));
     }
     rc = cib->cmds->delete(cib, XML_CIB_TAG_STATUS, node_state, cib_sync_call);
     if (rc != pcmk_ok) {
         printf("Could not remove %s/%u from " XML_CIB_TAG_STATUS ": %s", name, id, pcmk_strerror(rc));
     }
 
     cib->cmds->signoff(cib);
     cib_delete(cib);
 
     /* The match objects were created by this function, so release them */
     free_xml(node);
     free_xml(node_state);
     return rc;
 }
 
 int tools_remove_node_cache(const char *node, const char *target);
 
 /*
  * Ask one daemon to drop a node from its peer cache and, if the request
  * was sent successfully, remove the node from the CIB as well.
  *
  * node:   node name, or a node id written as a decimal string
  * target: IPC name of the daemon to contact (CRM_SYSTEM_CRMD and T_ATTRD
  *         get daemon-specific message formats)
  *
  * Returns 0 or a negative error code: -ENOTCONN if the daemon cannot be
  * reached, -ENOMEM if memory could not be allocated, otherwise the result
  * of the IPC send or of cib_remove_node().
  */
 int tools_remove_node_cache(const char *node, const char *target)
 {
     int n = 0;
     int rc = -1;
     char *name = NULL;
     char *admin_uuid = NULL;
     crm_ipc_t *conn = crm_ipc_new(target, 0);
     xmlNode *cmd = NULL;
     xmlNode *hello = NULL;
     char *endptr = NULL;
 
     if (!conn) {
         return -ENOTCONN;
     }
 
     if (!crm_ipc_connect(conn)) {
         crm_perror(LOG_ERR, "Connection to %s failed", target);
         crm_ipc_destroy(conn);
         return -ENOTCONN;
     }
 
     if(safe_str_eq(target, CRM_SYSTEM_CRMD)) {
         /* The crmd is sent a hello message identifying us by PID first */
         admin_uuid = calloc(1, 11);
         if (admin_uuid == NULL) {
             crm_ipc_close(conn);
             crm_ipc_destroy(conn);
             return -ENOMEM;
         }
         snprintf(admin_uuid, 10, "%d", getpid());
         admin_uuid[10] = '\0';
 
         hello = create_hello_message(admin_uuid, "crm_node", "0", "1");
         rc = crm_ipc_send(conn, hello, 0, 0, NULL);
 
         free_xml(hello);
         if (rc < 0) {
             /* Do not leak the open connection on this early exit */
             crm_ipc_close(conn);
             crm_ipc_destroy(conn);
             free(admin_uuid);
             return rc;
         }
     }
 
 
     /* A fully numeric argument is treated as a node id, anything else as a
      * node name */
     errno = 0;
     n = strtol(node, &endptr, 10);
     if (errno != 0 || endptr == node || *endptr != '\0') {
         /* Argument was not a nodeid */
         n = 0;
         name = strdup(node);
     } else {
         name = get_node_name(n);
     }
 
     crm_trace("Removing %s aka. %s (%u) from the membership cache", name, node, n);
 
     if(safe_str_eq(target, T_ATTRD)) {
         cmd = create_xml_node(NULL, __FUNCTION__);
 
         crm_xml_add(cmd, F_TYPE, T_ATTRD);
         crm_xml_add(cmd, F_ORIG, crm_system_name);
 
         crm_xml_add(cmd, F_ATTRD_TASK, ATTRD_OP_PEER_REMOVE);
         crm_xml_add(cmd, F_ATTRD_HOST, name);
 
         if (n) {
             char buffer[64];
             if(snprintf(buffer, 63, "%u", n) > 0) {
                 crm_xml_add(cmd, F_ATTRD_HOST_ID, buffer);
             }
         }
 
     } else {
         cmd = create_request(CRM_OP_RM_NODE_CACHE,
                              NULL, NULL, target, crm_system_name, admin_uuid);
         if (n) {
             char buffer[64];
             if(snprintf(buffer, 63, "%u", n) > 0) {
                 crm_xml_add(cmd, XML_ATTR_ID, buffer);
             }
         }
         crm_xml_add(cmd, XML_ATTR_UNAME, name);
     }
 
     rc = crm_ipc_send(conn, cmd, 0, 0, NULL);
     crm_debug("%s peer cache cleanup for %s (%u): %d", target, name, n, rc);
 
     /* Only touch the CIB once the daemon has accepted the request */
     if (rc > 0) {
         rc = cib_remove_node(n, name);
     }
 
     if (conn) {
         crm_ipc_close(conn);
         crm_ipc_destroy(conn);
     }
     free(admin_uuid);
     free_xml(cmd);
     free(name);
     return rc > 0 ? 0 : rc;
 }
 
 /*
  * GLib comparison callback ordering two crm_node_t objects by uname.
  * A node without a uname is compared as if its name were the empty string.
  */
 static gint
 compare_node_uname(gconstpointer a, gconstpointer b)
 {
     const crm_node_t *lhs = a;
     const crm_node_t *rhs = b;
     const char *lhs_name = "";
     const char *rhs_name = "";
 
     if (lhs->uname) {
         lhs_name = lhs->uname;
     }
     if (rhs->uname) {
         rhs_name = rhs->uname;
     }
     return strcmp(lhs_name, rhs_name);
 }
 
 /*
  * IPC dispatch callback (registered in try_pacemaker()) that handles the
  * node list sent back by pacemakerd.
  *
  * The buffer is parsed as XML and handled according to the global
  * 'command':
  *   'q' - print the "quorate" attribute, or exit with 1 if it is absent
  *   'l' - print "<id> <uname> <state>" for every node in the reply
  *   'p' - print the names of nodes whose state is CRM_NODE_MEMBER
  *   'i' - print the ids of nodes whose state is CRM_NODE_MEMBER
  * Nodes are listed in uname order.
  *
  * The process exits once a parsable reply has been handled; 0 is returned
  * only when the buffer could not be parsed.
  */
 static int
 node_mcp_dispatch(const char *buffer, ssize_t length, gpointer userdata)
 {
     xmlNode *msg = string2xml(buffer);
 
     if (msg) {
         xmlNode *node = NULL;
         GListPtr nodes = NULL;
         GListPtr iter = NULL;
         const char *quorate = crm_element_value(msg, "quorate");
 
         crm_log_xml_trace(msg, "message");
         if (command == 'q' && quorate != NULL) {
             fprintf(stdout, "%s\n", quorate);
             crm_exit(pcmk_ok);
 
         } else if(command == 'q') {
             crm_exit(1);
         }
 
         for (node = __xml_first_child(msg); node != NULL; node = __xml_next(node)) {
             crm_node_t *peer = calloc(1, sizeof(crm_node_t));
 
             if (peer == NULL) {
                 crm_exit(ENOMEM);
             }
 
             /* Fill in the peer before inserting it: compare_node_uname()
              * orders by uname, so the name must already be set for the
              * sorted insert to have any effect */
             peer->uname = (char*)crm_element_value_copy(node, "uname");
             peer->state = (char*)crm_element_value_copy(node, "state");
             crm_element_value_int(node, "id", (int*)&peer->id);
 
             nodes = g_list_insert_sorted(nodes, peer, compare_node_uname);
         }
 
         for(iter = nodes; iter; iter = iter->next) {
             crm_node_t *peer = iter->data;
             if (command == 'l') {
                 fprintf(stdout, "%u %s %s\n", peer->id, peer->uname, peer->state?peer->state:"");
 
             } else if (command == 'p') {
                 if(safe_str_eq(peer->state, CRM_NODE_MEMBER)) {
                     fprintf(stdout, "%s ", peer->uname);
                 }
 
             } else if (command == 'i') {
                 if(safe_str_eq(peer->state, CRM_NODE_MEMBER)) {
                     fprintf(stdout, "%u ", peer->id);
                 }
             }
         }
 
         g_list_free_full(nodes, free);
         free_xml(msg);
 
         if (command == 'p') {
             fprintf(stdout, "\n");
         }
 
         crm_exit(pcmk_ok);
     }
 
     return 0;
 }
 
 /*
  * Destroy callback registered for the pacemakerd IPC connection in
  * try_pacemaker(): exits the process with ENOTCONN.  'user_data' is not used.
  */
 static void
 node_mcp_destroy(gpointer user_data)
 {
     const int exit_code = ENOTCONN;
 
     crm_exit(exit_code);
 }
 
 /*
  * Process 'command' using the Pacemaker daemons.
  *
  *   'e'              prints "1" and exits (age only applies to heartbeat)
  *   'R'              asks each daemon in turn to drop 'target_uname' from its
  *                    node cache, then exits
  *   'i' 'l' 'q' 'p'  connects to pacemakerd, sends a "poke" and runs a main
  *                    loop; node_mcp_dispatch() prints the reply and exits
  *
  * Returns FALSE whenever it returns at all: for heartbeat stacks, for commands
  * it does not handle, and when the pacemakerd connection cannot be created.
  */
 static gboolean
 try_pacemaker(int command, enum cluster_type_e stack)
 {
     struct ipc_client_callbacks node_callbacks = {
         .dispatch = node_mcp_dispatch,
         .destroy = node_mcp_destroy
     };
 
     if (stack == pcmk_cluster_heartbeat) {
         /* Nothing to do for them */
         return FALSE;
     }
 
     switch (command) {
         case 'e':
             /* Age only applies to heartbeat clusters */
             fprintf(stdout, "1\n");
             crm_exit(pcmk_ok);
 
         case 'R':
             {
                 int lpc = 0;
                 const char *daemons[] = {
                     CRM_SYSTEM_CRMD,
                     "stonith-ng",
                     T_ATTRD,
                     CRM_SYSTEM_MCP,
                 };
 
                 for(lpc = 0; lpc < DIMOF(daemons); lpc++) {
                     if (tools_remove_node_cache(target_uname, daemons[lpc])) {
                         crm_err("Failed to connect to %s to remove node '%s'", daemons[lpc], target_uname);
                         crm_exit(pcmk_err_generic);
                     }
                 }
                 crm_exit(pcmk_ok);
             }
             break;
 
         case 'i':
         case 'l':
         case 'q':
         case 'p':
             /* Go to pacemakerd */
             {
                 GMainLoop *amainloop = g_main_loop_new(NULL, FALSE);
                 mainloop_io_t *ipc =
                     mainloop_add_ipc_client(CRM_SYSTEM_MCP, G_PRIORITY_DEFAULT, 0, NULL, &node_callbacks);
                 if (ipc != NULL) {
                     /* Sending anything will get us a list of nodes */
                     xmlNode *poke = create_xml_node(NULL, "poke");
 
                     crm_ipc_send(mainloop_get_ipc_client(ipc), poke, 0, 0, NULL);
                     free_xml(poke);
                     g_main_loop_run(amainloop);
                 }
                 /* Reached when the connection failed (or the loop was stopped):
                  * release the loop rather than leaking it to the caller's fallbacks */
                 g_main_loop_unref(amainloop);
             }
             break;
 
         default:
             /* Not a command pacemakerd can answer */
             break;
     }
     return FALSE;
 }
 
 #if SUPPORT_HEARTBEAT
 #  include <ocf/oc_event.h>
 #  include <ocf/oc_membership.h>
 #  include <clplumbing/cl_uuid.h>
 
 #  define UUID_LEN 16
 
 /* CCM event token: filled in by the "oc_ev_register" call in ccm_age_connect()
  * and handed to the other CCM entry points used in this section */
 oc_ev_t *ccm_token = NULL;
 /* Handle passed by address to every find_library_function() lookup in
  * CCM_LIBRARY -- NOTE(review): presumably caches the opened library; confirm */
 static void *ccm_library = NULL;
 /* Prototype only: the code in this section reaches "oc_ev_special" through a
  * function pointer looked up by name in ccm_age_connect() */
 void oc_ev_special(const oc_ev_t *, oc_ev_class_t, int);
 
 /*
  * Print the local heartbeat UUID, read from UUID_FILE, on stdout.
  *
  * Returns TRUE once the UUID has been printed and FALSE when UUID_FILE cannot
  * be opened.  Every other problem ends the process: abort() when the file is
  * not exactly UUID_LEN bytes long, crm_exit(pcmk_err_generic) when seeking
  * back or reading the file fails.
  */
 static gboolean
 read_local_hb_uuid(void)
 {
     cl_uuid_t uuid;
     char buffer[50] = { 0 };    /* receives the text written by cl_uuid_unparse() */
     long start = 0, read_len = 0;
 
     FILE *input = fopen(UUID_FILE, "r");
 
     if (input == NULL) {
         crm_info("Could not open UUID file %s", UUID_FILE);
         return FALSE;
     }
 
     /* see how big the file is */
     start = ftell(input);
     fseek(input, 0L, SEEK_END);
     if (UUID_LEN != ftell(input)) {
         fprintf(stderr, "%s must contain exactly %d bytes\n", UUID_FILE, UUID_LEN);
         abort();
     }
 
     /* Return to the saved position: the offset is the second argument of
      * fseek(), the third one selects what the offset is relative to */
     fseek(input, start, SEEK_SET);
     if (start != ftell(input)) {
         fprintf(stderr, "fseek not behaving: %ld vs. %ld\n", start, ftell(input));
         crm_exit(pcmk_err_generic);
     }
 
     read_len = fread(uuid.uuid, 1, UUID_LEN, input);
     fclose(input);
 
     if (read_len != UUID_LEN) {
         fprintf(stderr, "Expected and read bytes differ: %d vs. %ld\n", UUID_LEN, read_len);
         crm_exit(pcmk_err_generic);
         return FALSE;
     }
 
     cl_uuid_unparse(&uuid, buffer);
     fprintf(stdout, "%s\n", buffer);
     return TRUE;
 }
 
 /*
  * CCM membership callback installed by ccm_age_connect().
  *
  * Depending on the global 'command' it prints:
  *   'q'  "1" or "0" according to ccm_have_quorum(event)
  *   'p'  the uname of every entry in the member section of the event data
  *   'e'  the node_born_on value of the member that oc_ev_is_my_nodeid()
  *        reports as the local node
  * It then acknowledges the event with oc_ev_callback_done(), flushes stdout
  * and exits the process.  'size' is not used.
  */
 static void
 ccm_age_callback(oc_ed_t event, void *cookie, size_t size, const void *data)
 {
     int lpc;
     int node_list_size;
     const oc_ev_membership_t *oc = (const oc_ev_membership_t *)data;
     int (*ccm_api_is_my_nodeid) (const oc_ev_t * token, const oc_node_t * node) = NULL;
 
     int (*ccm_api_callback_done) (void *cookie) =
         find_library_function(&ccm_library, CCM_LIBRARY, "oc_ev_callback_done", 1);
 
     node_list_size = oc->m_n_member;
     if (command == 'q') {
         crm_debug("Processing \"%s\" event.",
                   event == OC_EV_MS_NEW_MEMBERSHIP ? "NEW MEMBERSHIP" :
                   event == OC_EV_MS_NOT_PRIMARY ? "NOT PRIMARY" :
                   event == OC_EV_MS_PRIMARY_RESTORED ? "PRIMARY RESTORED" :
                   event == OC_EV_MS_EVICTED ? "EVICTED" : "NO QUORUM MEMBERSHIP");
         if (ccm_have_quorum(event)) {
             fprintf(stdout, "1\n");
         } else {
             fprintf(stdout, "0\n");
         }
 
     } else if (command == 'e') {
         crm_debug("Searching %d members for our birth", oc->m_n_member);
     }
     for (lpc = 0; lpc < node_list_size; lpc++) {
         /* Members start at m_memb_idx within m_array; use the same entry for
          * the "is this me?" test and for the values that get printed */
         const oc_node_t *member = &(oc->m_array[oc->m_memb_idx + lpc]);
 
         if (command == 'p') {
             fprintf(stdout, "%s ", member->node_uname);
 
         } else if (command == 'e') {
             if (ccm_api_is_my_nodeid == NULL) {
                 /* Resolve the symbol on first use instead of once per member */
                 ccm_api_is_my_nodeid =
                     find_library_function(&ccm_library, CCM_LIBRARY, "oc_ev_is_my_nodeid", 1);
             }
             if ((*ccm_api_is_my_nodeid) (ccm_token, member)) {
                 crm_debug("MATCH: nodeid=%d, uname=%s, born=%d",
                           member->node_id, member->node_uname, member->node_born_on);
                 fprintf(stdout, "%d\n", member->node_born_on);
             }
         }
     }
 
     (*ccm_api_callback_done) (cookie);
 
     if (command == 'p') {
         fprintf(stdout, "\n");
     }
     fflush(stdout);
     crm_exit(pcmk_ok);
 }
 
 static gboolean
 ccm_age_connect(int *ccm_fd)
 {
     gboolean did_fail = FALSE;
     int ret = 0;
 
     int (*ccm_api_register) (oc_ev_t ** token) =
         find_library_function(&ccm_library, CCM_LIBRARY, "oc_ev_register", 1);
 
     int (*ccm_api_set_callback) (const oc_ev_t * token,
                                  oc_ev_class_t class,
                                  oc_ev_callback_t * fn,
                                  oc_ev_callback_t ** prev_fn) =
         find_library_function(&ccm_library, CCM_LIBRARY, "oc_ev_set_callback", 1);
 
     void (*ccm_api_special) (const oc_ev_t *, oc_ev_class_t, int) =
         find_library_function(&ccm_library, CCM_LIBRARY, "oc_ev_special", 1);
     int (*ccm_api_activate) (const oc_ev_t * token, int *fd) =
         find_library_function(&ccm_library, CCM_LIBRARY, "oc_ev_activate", 1);
 
     crm_debug("Registering with CCM");
     ret = (*ccm_api_register) (&ccm_token);
     if (ret != 0) {
         crm_info("CCM registration failed: %d", ret);
         did_fail = TRUE;
     }
 
     if (did_fail == FALSE) {
         crm_debug("Setting up CCM callbacks");
         ret = (*ccm_api_set_callback) (ccm_token, OC_EV_MEMB_CLASS, ccm_age_callback, NULL);
         if (ret != 0) {
             crm_warn("CCM callback not set: %d", ret);
             did_fail = TRUE;
         }
     }
     if (did_fail == FALSE) {
         (*ccm_api_special) (ccm_token, OC_EV_MEMB_CLASS, 0 /*don't care */ );
 
         crm_debug("Activating CCM token");
         ret = (*ccm_api_activate) (ccm_token, ccm_fd);
         if (ret != 0) {
             crm_warn("CCM Activation failed: %d", ret);
             did_fail = TRUE;
         }
     }
 
     return !did_fail;
 }
 
 /*
  * Process 'command' on a heartbeat cluster.
  *
  *   'i'    prints the local UUID via read_local_hb_uuid() and exits on success
  *   'R'    asks the crmd to drop 'target_uname' from its node cache, then exits
  *   other  connects to CCM and keeps handling events; ccm_age_callback()
  *          prints the answer and exits the process
  *
  * Returns FALSE when the command could not be completed.
  */
 static gboolean
 try_heartbeat(int command, enum cluster_type_e stack)
 {
     int (*handle_event) (const oc_ev_t * token) = NULL;
 
     crm_debug("Attempting to process %c command", command);
 
     if (command == 'i') {
         if (read_local_hb_uuid()) {
             crm_exit(pcmk_ok);
         }
         return FALSE;
     }
 
     if (command == 'R') {
         if (tools_remove_node_cache(target_uname, CRM_SYSTEM_CRMD)) {
             crm_err("Failed to connect to "CRM_SYSTEM_CRMD" to remove node '%s'", target_uname);
             crm_exit(pcmk_err_generic);
         }
         crm_exit(pcmk_ok);
         return FALSE;
     }
 
     if (!ccm_age_connect(&ccm_fd)) {
         return FALSE;
     }
 
     handle_event = find_library_function(&ccm_library, CCM_LIBRARY, "oc_ev_handle_event", 1);
 
     for (;;) {
         int ready = 0;
         fd_set readable;
 
         sleep(1);
         FD_ZERO(&readable);
         FD_SET(ccm_fd, &readable);
 
         /* Cleared so that the EINTR test below only sees select()'s own error */
         errno = 0;
         ready = select(ccm_fd + 1, &readable, NULL, NULL, NULL);
 
         if (ready > 0) {
             if ((*handle_event) (ccm_token) != 0) {
                 crm_err("oc_ev_handle_event failed");
                 return FALSE;
             }
 
         } else if (ready < 0 && errno != EINTR) {
             crm_perror(LOG_ERR, "select failed: %d", ready);
             return FALSE;
         }
     }
 
     return FALSE;
 }
 #endif
 
 #if SUPPORT_CMAN
 #  include <libcman.h>
 #  define MAX_NODES 256
 /*
  * Tell whether 'name' is a real node name rather than the "Node<id>"
  * placeholder built from 'nodeid'.
  *
  * Returns FALSE (and logs a notice) when 'name' equals the placeholder,
  * TRUE otherwise.
  */
 static bool
 valid_cman_name(const char *name, uint32_t nodeid)
 {
     /* Yes, %d, because that's what CMAN does */
     char *placeholder = crm_strdup_printf("Node%d", nodeid);
     const bool is_placeholder = crm_str_eq(placeholder, name, TRUE);
 
     if (is_placeholder) {
         crm_notice("Ignoring inferred name from cman: %s", placeholder);
     }
 
     free(placeholder);
     return !is_placeholder;
 }
 
 static gboolean
 try_cman(int command, enum cluster_type_e stack)
 {
 
     int rc = -1, lpc = 0, node_count = 0;
     cman_node_t node;
     cman_cluster_t cluster;
     cman_handle_t cman_handle = NULL;
     cman_node_t cman_nodes[MAX_NODES];
 
     memset(&cluster, 0, sizeof(cluster));
 
     cman_handle = cman_init(NULL);
     if (cman_handle == NULL || cman_is_active(cman_handle) == FALSE) {
         crm_info("Couldn't connect to cman");
         return FALSE;
     }
 
     switch (command) {
         case 'R':
             try_pacemaker(command, stack);
             break;
 
         case 'e':
             /* Age makes no sense (yet?) in a cman cluster */
             fprintf(stdout, "1\n");
             break;
 
         case 'q':
             fprintf(stdout, "%d\n", cman_is_quorate(cman_handle));
             break;
 
         case 'l':
         case 'p':
             memset(cman_nodes, 0, MAX_NODES * sizeof(cman_node_t));
             rc = cman_get_nodes(cman_handle, MAX_NODES, &node_count, cman_nodes);
             if (rc != 0) {
                 fprintf(stderr, "Couldn't query cman node list: %d %d", rc, errno);
                 goto cman_bail;
             }
 
             for (lpc = 0; lpc < node_count; lpc++) {
                 if(valid_cman_name(cman_nodes[lpc].cn_name, cman_nodes[lpc].cn_nodeid) == FALSE) {
                     /* The name was invented, but we need to print something, make it the id instead */
                     printf("%u ", cman_nodes[lpc].cn_nodeid);
 
                 } if (command == 'l') {
                     printf("%s ", cman_nodes[lpc].cn_name);
 
                 } else if (cman_nodes[lpc].cn_nodeid != 0 && cman_nodes[lpc].cn_member) {
                     /* Never allow node ID 0 to be considered a member #315711 */
                     printf("%s ", cman_nodes[lpc].cn_name);
                 }
             }
             printf("\n");
             break;
 
         case 'i':
             memset(&node, 0, sizeof(cman_node_t));
             rc = cman_get_node(cman_handle, CMAN_NODEID_US, &node);
             if (rc != 0) {
                 fprintf(stderr, "Couldn't query cman node id: %d %d", rc, errno);
                 goto cman_bail;
             }
             fprintf(stdout, "%u\n", node.cn_nodeid);
             break;
 
         default:
             fprintf(stderr, "Unknown option '%c'\n", command);
             crm_help('?', EX_USAGE);
     }
     cman_finish(cman_handle);
     crm_exit(pcmk_ok);
 
   cman_bail:
     cman_finish(cman_handle);
     return crm_exit(EINVAL);
 }
 #endif
 
 #if HAVE_CONFDB
 /*
  * Destroy callback installed on the cluster connection by try_openais():
  * logs the loss of the connection, resets ais_fd_sync to -1 and exits the
  * process with ENOTCONN.  'user_data' is not used.
  */
 static void
 ais_membership_destroy(gpointer user_data)
 {
     const int exit_code = ENOTCONN;
 
     crm_err("AIS connection terminated");
     ais_fd_sync = -1;
     crm_exit(exit_code);
 }
 
 /*
  * List comparison function: orders two crm_node_t entries by uname using
  * strcmp().  Both unames must be non-NULL; crm_add_member() only inserts
  * named nodes.
  */
 static gint
 member_sort(gconstpointer a, gconstpointer b)
 {
     const char *lhs = ((const crm_node_t *) a)->uname;
     const char *rhs = ((const crm_node_t *) b)->uname;
 
     return strcmp(lhs, rhs);
 }
 
 /*
  * Hash table iterator: adds the node in 'value' to the GList that 'user_data'
  * points at, keeping the list ordered by member_sort().  Nodes without a
  * uname are left out.  'key' is not used.
  */
 static void
 crm_add_member(gpointer key, gpointer value, gpointer user_data)
 {
     crm_node_t *peer = value;
     GList **sorted = user_data;
 
     if (peer->uname == NULL) {
         return;
     }
 
     *sorted = g_list_insert_sorted(*sorted, peer, member_sort);
 }
 
 /*
  * CPG delivery callback installed by try_openais().
  *
  * Messages whose kind is not crm_class_members, crm_class_notify or
  * crm_class_quorum are dropped.  For any other message the answer to the
  * global 'command' is printed and the process exits:
  *   'q'  "1" or "0" according to crm_have_quorum
  *   'l'  "id uname state" for every named node in crm_peer_cache
  *   'p'  the uname of every named node whose state is CRM_NODE_MEMBER
  * Both listings are ordered by uname and followed by a newline.
  */
 static void
 ais_membership_dispatch(cpg_handle_t handle,
                           const struct cpg_name *groupName,
                           uint32_t nodeid, uint32_t pid, void *msg, size_t msg_len)
 {
     uint32_t kind = 0;
     const char *from = NULL;
     char *data = pcmk_message_common_cs(handle, nodeid, pid, msg, &kind, &from);
 
     switch (kind) {
         case crm_class_members:
         case crm_class_notify:
         case crm_class_quorum:
             break;
         default:
             free(data);
             return;
     }
 
     if (command == 'q') {
         if (crm_have_quorum) {
             fprintf(stdout, "1\n");
         } else {
             fprintf(stdout, "0\n");
         }
 
     } else if (command == 'l' || command == 'p') {
         GList *nodes = NULL;
         GListPtr lpc = NULL;
 
         g_hash_table_foreach(crm_peer_cache, crm_add_member, &nodes);
         for (lpc = nodes; lpc != NULL; lpc = lpc->next) {
             crm_node_t *node = (crm_node_t *) lpc->data;
 
             if (command == 'l') {
                 /* A peer may have no recorded state; never hand NULL to %s */
                 fprintf(stdout, "%u %s %s\n", node->id, node->uname,
                         node->state ? node->state : "");
 
             } else if (node->uname && safe_str_eq(node->state, CRM_NODE_MEMBER)) {
                 fprintf(stdout, "%s ", node->uname);
             }
         }
         fprintf(stdout, "\n");
 
         /* Only the list cells are ours; the nodes still belong to crm_peer_cache */
         g_list_free(nodes);
     }
 
     free(data);
     crm_exit(pcmk_ok);
 }
 #endif
 
 #ifdef SUPPORT_CS_QUORUM
 #  include <corosync/quorum.h>
 #  include <corosync/cpg.h>
 
 /*
  * Process 'command' on a corosync cluster.
  *
  *   'q'    prints "1" or "0" from the Quorum API and exits
  *   'i'    prints the local node ID from the CPG API and exits
  *   other  handed to try_pacemaker()
  *
  * Returns FALSE when the required corosync API could not be reached or
  * queried, and whenever try_pacemaker() returns.
  */
 static gboolean
 try_corosync(int command, enum cluster_type_e stack)
 {
     int rc = 0;
     int quorate = 0;
     uint32_t quorum_type = 0;
     unsigned int nodeid = 0;
     cpg_handle_t c_handle = 0;
     quorum_handle_t q_handle = 0;
 
     switch (command) {
         case 'q':
             /* Go direct to the Quorum API */
             rc = quorum_initialize(&q_handle, NULL, &quorum_type);
             if (rc != CS_OK) {
                 crm_err("Could not connect to the Quorum API: %d", rc);
                 return FALSE;
             }
 
             rc = quorum_getquorate(q_handle, &quorate);
             if (rc != CS_OK) {
                 crm_err("Could not obtain the current Quorum API state: %d", rc);
                 /* The connection was established: release it before giving up */
                 quorum_finalize(q_handle);
                 return FALSE;
             }
 
             if (quorate) {
                 fprintf(stdout, "1\n");
             } else {
                 fprintf(stdout, "0\n");
             }
             quorum_finalize(q_handle);
             crm_exit(pcmk_ok);
 
         case 'i':
             /* Go direct to the CPG API */
             rc = cpg_initialize(&c_handle, NULL);
             if (rc != CS_OK) {
                 crm_err("Could not connect to the Cluster Process Group API: %d", rc);
                 return FALSE;
             }
 
             rc = cpg_local_get(c_handle, &nodeid);
             if (rc != CS_OK) {
                 crm_err("Could not get local node id from the CPG API");
                 /* The connection was established: release it before giving up */
                 cpg_finalize(c_handle);
                 return FALSE;
             }
 
             fprintf(stdout, "%u\n", nodeid);
             cpg_finalize(c_handle);
             crm_exit(pcmk_ok);
 
         default:
             try_pacemaker(command, stack);
             break;
     }
     return FALSE;
 }
 #endif
 
 #if HAVE_CONFDB
 /*
  * Process 'command' on a plugin-based (classic AIS) cluster.
  *
  * After connecting with init_cs_connection_once():
  *   'R'      sends a crm_class_rmpeer message for 'target_uname', removes the
  *            node from the CIB and exits
  *   'e'      prints "1" and exits
  *   'i'      prints the node ID recorded in the cluster object and exits
  *   'q'      sends a crm_class_quorum request
  *   'l' 'p'  send a crm_class_members request
  * For the request commands a main loop is then run so that
  * ais_membership_dispatch() can print the reply.
  *
  * Returns FALSE when the connection could not be established.
  */
 static gboolean
 try_openais(int command, enum cluster_type_e stack)
 {
     static crm_cluster_t cluster;
     GMainLoop *amainloop = NULL;
 
     cluster.destroy = ais_membership_destroy;
     cluster.cpg.cpg_deliver_fn = ais_membership_dispatch;
     cluster.cpg.cpg_confchg_fn = NULL;
 
     if (!init_cs_connection_once(&cluster)) {
         return FALSE;
     }
 
     switch (command) {
         case 'R':
             send_cluster_text(crm_class_rmpeer, target_uname, TRUE, NULL, crm_msg_ais);
             cib_remove_node(0, target_uname);
             crm_exit(pcmk_ok);
 
         case 'e':
             /* Age makes no sense (yet) in an AIS cluster */
             fprintf(stdout, "1\n");
             crm_exit(pcmk_ok);
 
         case 'q':
             send_cluster_text(crm_class_quorum, NULL, TRUE, NULL, crm_msg_ais);
             break;
 
         case 'l':
         case 'p':
             crm_info("Requesting the list of configured nodes");
             send_cluster_text(crm_class_members, __FUNCTION__, TRUE, NULL, crm_msg_ais);
             break;
 
         case 'i':
             printf("%u\n", cluster.nodeid);
             crm_exit(pcmk_ok);
 
         default:
             fprintf(stderr, "Unknown option '%c'\n", command);
             crm_help('?', EX_USAGE);
     }
 
     /* Wait for the reply; the dispatch callback ends the process */
     amainloop = g_main_new(FALSE);
     g_main_run(amainloop);
 
     return FALSE;
 }
 #endif
 
 /* Prototype for the call main() makes when -H, -A, -C or -c selects the
  * cluster stack explicitly -- NOTE(review): presumably not declared by the
  * included headers; confirm before removing */
 int set_cluster_type(enum cluster_type_e type);
 
 /*
  * Entry point of crm_node.
  *
  * Parses the command line into the global 'command' (plus 'target_uname',
  * 'do_quiet' and an optional forced cluster type), answers -n and -N
  * directly, refuses -R without --force, and then hands the command to the
  * handler for the detected cluster type, falling back to try_pacemaker().
  * Handlers normally exit the process themselves; 1 is returned if none did.
  */
 int
 main(int argc, char **argv)
 {
     int opt = 0;
     int option_index = 0;
     int bad_args = 0;
     uint32_t nodeid = 0;
     gboolean forced = FALSE;
     gboolean needs_force = FALSE;
     enum cluster_type_e try_stack = pcmk_cluster_unknown;
 
     crm_peer_init();
     crm_log_cli_init("crm_node");
     crm_set_options(NULL, "command [options]", long_options,
                     "Tool for displaying low-level node information");
 
     do {
         opt = crm_get_option(argc, argv, &option_index);
 
         switch (opt) {
             case -1:
                 /* End of options */
                 break;
 
             /* Generic options */
             case 'V':
                 crm_bump_log_level(argc, argv);
                 break;
             case '$':
             case '?':
                 crm_help(opt, EX_OK);
                 break;
             case 'Q':
                 do_quiet = TRUE;
                 break;
             case 'f':
                 forced = TRUE;
                 break;
 
             /* Explicit cluster stack selection */
             case 'H':
                 set_cluster_type(pcmk_cluster_heartbeat);
                 break;
             case 'A':
                 set_cluster_type(pcmk_cluster_classic_ais);
                 break;
             case 'C':
                 set_cluster_type(pcmk_cluster_corosync);
                 break;
             case 'c':
                 set_cluster_type(pcmk_cluster_cman);
                 break;
 
             /* Commands that take an argument */
             case 'R':
                 command = opt;
                 needs_force = TRUE;
                 target_uname = optarg;
                 break;
             case 'N':
                 command = opt;
                 nodeid = crm_parse_int(optarg, NULL);
                 break;
 
             /* Commands without an argument */
             case 'p':
             case 'e':
             case 'q':
             case 'i':
             case 'l':
             case 'n':
                 command = opt;
                 break;
 
             default:
                 bad_args++;
                 break;
         }
     } while (opt >= 0);
 
     if (optind > argc) {
         bad_args++;
     }
 
     if (bad_args) {
         crm_help('?', EX_USAGE);
     }
 
     /* Name lookups need no help from a cluster-specific handler */
     switch (command) {
         case 'n':
             fprintf(stdout, "%s\n", get_local_node_name());
             crm_exit(pcmk_ok);
             break;
 
         case 'N':
             fprintf(stdout, "%s\n", get_node_name(nodeid));
             crm_exit(pcmk_ok);
             break;
 
         default:
             break;
     }
 
     if (needs_force && !forced) {
         fprintf(stderr, "The supplied command is considered dangerous."
                 "  To prevent accidental destruction of the cluster,"
                 " the --force flag is required in order to proceed.\n");
         fflush(stderr);
         crm_exit(EINVAL);
     }
 
     try_stack = get_cluster_type();
     crm_debug("Attempting to process -%c command for cluster type: %s", command,
               name_for_cluster_type(try_stack));
 
 #if SUPPORT_CMAN
     if (try_stack == pcmk_cluster_cman) {
         try_cman(command, try_stack);
     }
 #endif
 
 #ifdef SUPPORT_CS_QUORUM
     if (try_stack == pcmk_cluster_corosync) {
         try_corosync(command, try_stack);
     }
 #endif
 
 #if HAVE_CONFDB
     /* Only an option if we're using the plugins */
     if (try_stack == pcmk_cluster_classic_ais) {
         try_openais(command, try_stack);
     }
 #endif
 
 #if SUPPORT_HEARTBEAT
     if (try_stack == pcmk_cluster_heartbeat) {
         try_heartbeat(command, try_stack);
     }
 #endif
 
     /* Last resort for anything the handlers above returned from */
     try_pacemaker(command, try_stack);
 
     return 1;
 }