dlm: add recovery callbacks
[linux-block.git] / fs / dlm / member.c
index eebc52aae82e1613f5a1b1669dab666403708d8e..862640a36d5cbba1762ad47317dffbd72eab0531 100644 (file)
@@ -1,7 +1,7 @@
 /******************************************************************************
 *******************************************************************************
 **
-**  Copyright (C) 2005-2009 Red Hat, Inc.  All rights reserved.
+**  Copyright (C) 2005-2011 Red Hat, Inc.  All rights reserved.
 **
 **  This copyrighted material is made available to anyone wishing to use,
 **  modify, copy, or redistribute it subject to the terms and conditions
@@ -27,7 +27,7 @@ int dlm_slots_version(struct dlm_header *h)
 }
 
 void dlm_slot_save(struct dlm_ls *ls, struct dlm_rcom *rc,
-                 struct dlm_member *memb)
+                  struct dlm_member *memb)
 {
        struct rcom_config *rf = (struct rcom_config *)rc->rc_buf;
 
@@ -317,59 +317,51 @@ static void add_ordered_member(struct dlm_ls *ls, struct dlm_member *new)
        }
 }
 
-static int dlm_add_member(struct dlm_ls *ls, int nodeid)
+static int dlm_add_member(struct dlm_ls *ls, struct dlm_config_node *node)
 {
        struct dlm_member *memb;
-       int w, error;
+       int error;      /* result of dlm_lowcomms_connect_node() */
 
        memb = kzalloc(sizeof(struct dlm_member), GFP_NOFS);
        if (!memb)
                return -ENOMEM;
 
-       w = dlm_node_weight(ls->ls_name, nodeid);
-       if (w < 0) {
-               kfree(memb);
-               return w;
-       }
-
-       error = dlm_lowcomms_connect_node(nodeid);
+       error = dlm_lowcomms_connect_node(node->nodeid);
        if (error < 0) {
                kfree(memb);
                return error;
        }
 
-       memb->nodeid = nodeid;
-       memb->weight = w;
+       memb->nodeid = node->nodeid;    /* member fields are copied from @node */
+       memb->weight = node->weight;
+       memb->comm_seq = node->comm_seq; /* compared in dlm_lsop_recover_slot() */
        add_ordered_member(ls, memb);
        ls->ls_num_nodes++;
        return 0;
 }
 
-static void dlm_remove_member(struct dlm_ls *ls, struct dlm_member *memb)
-{
-       list_move(&memb->list, &ls->ls_nodes_gone);
-       ls->ls_num_nodes--;
-}
-
-int dlm_is_member(struct dlm_ls *ls, int nodeid)
+static struct dlm_member *find_memb(struct list_head *head, int nodeid)
 {
        struct dlm_member *memb;
 
-       list_for_each_entry(memb, &ls->ls_nodes, list) {
+       list_for_each_entry(memb, head, list) { /* head: ls_nodes or ls_nodes_gone */
                if (memb->nodeid == nodeid)
-                       return 1;
+                       return memb;    /* first entry with this nodeid */
        }
+       return NULL;    /* nodeid is not on this list */
+}
+
+int dlm_is_member(struct dlm_ls *ls, int nodeid)
+{
+       if (find_memb(&ls->ls_nodes, nodeid))   /* 1 if nodeid is on ls_nodes */
+               return 1;
        return 0;
 }
 
 int dlm_is_removed(struct dlm_ls *ls, int nodeid)
 {
-       struct dlm_member *memb;
-
-       list_for_each_entry(memb, &ls->ls_nodes_gone, list) {
-               if (memb->nodeid == nodeid)
-                       return 1;
-       }
+       if (find_memb(&ls->ls_nodes_gone, nodeid)) /* 1 if on the departed list */
+               return 1;
        return 0;
 }
 
@@ -460,10 +452,88 @@ static int ping_members(struct dlm_ls *ls)
        return error;
 }
 
+static void dlm_lsop_recover_prep(struct dlm_ls *ls)
+{
+       /* recover_prep is an optional hook: do nothing unless one is set */
+       if (ls->ls_ops && ls->ls_ops->recover_prep)
+               ls->ls_ops->recover_prep(ls->ls_ops_arg);
+}
+
+static void dlm_lsop_recover_slot(struct dlm_ls *ls, struct dlm_member *memb)
+{
+       struct dlm_slot failed;
+       uint32_t cur_seq;
+       int rv;
+
+       /* The recover_slot hook is optional; nothing to report without it. */
+       if (!ls->ls_ops || !ls->ls_ops->recover_slot)
+               return;
+
+       /* A departed member counts as failed when its comms connection
+          is gone (lookup error) or has been replaced since the member
+          was added (sequence mismatch).  An unchanged connection means
+          the node was removed due to dlm_release_lockspace, which is
+          not reported through this callback. */
+
+       rv = dlm_comm_seq(memb->nodeid, &cur_seq);
+
+       if (rv || cur_seq != memb->comm_seq) {
+               failed.nodeid = memb->nodeid;
+               failed.slot = memb->slot;
+
+               ls->ls_ops->recover_slot(ls->ls_ops_arg, &failed);
+       }
+}
+
+void dlm_lsop_recover_done(struct dlm_ls *ls)
+{
+       struct dlm_member *memb;
+       struct dlm_slot *slots;
+       int i, num;
+
+       if (!ls->ls_ops || !ls->ls_ops->recover_done)
+               return;
+
+       /* snapshot member slots; kcalloc zeroes and overflow-checks num * size */
+       num = ls->ls_num_nodes;
+       slots = kcalloc(num, sizeof(*slots), GFP_KERNEL);
+       if (!slots)
+               return;
+
+       i = 0;
+       list_for_each_entry(memb, &ls->ls_nodes, list) {
+               if (i == num) {
+                       log_error(ls, "dlm_lsop_recover_done bad num %d", num);
+                       goto out;       /* more members than ls_num_nodes */
+               }
+               slots[i].nodeid = memb->nodeid;
+               slots[i].slot = memb->slot;
+               i++;
+       }
+       /* slots is freed as soon as the callback returns */
+       ls->ls_ops->recover_done(ls->ls_ops_arg, slots, num,
+                                ls->ls_slot, ls->ls_generation);
+ out:
+       kfree(slots);
+}
+
+static struct dlm_config_node *find_config_node(struct dlm_recover *rv,
+                                               int nodeid)
+{
+       int idx = 0;
+
+       /* linear search of rv->nodes; NULL when nodeid has no entry */
+       while (idx < rv->nodes_count && rv->nodes[idx].nodeid != nodeid)
+               idx++;
+
+       return idx < rv->nodes_count ? &rv->nodes[idx] : NULL;
+}
+
 int dlm_recover_members(struct dlm_ls *ls, struct dlm_recover *rv, int *neg_out)
 {
        struct dlm_member *memb, *safe;
-       int i, error, found, pos = 0, neg = 0, low = -1;
+       struct dlm_config_node *node;
+       int i, error, neg = 0, low = -1;
 
        /* previously removed members that we've not finished removing need to
           count as a negative change so the "neg" recovery steps will happen */
@@ -476,46 +546,32 @@ int dlm_recover_members(struct dlm_ls *ls, struct dlm_recover *rv, int *neg_out)
        /* move departed members from ls_nodes to ls_nodes_gone */
 
        list_for_each_entry_safe(memb, safe, &ls->ls_nodes, list) {
-               found = 0;
-               for (i = 0; i < rv->node_count; i++) {
-                       if (memb->nodeid == rv->nodeids[i]) {
-                               found = 1;
-                               break;
-                       }
-               }
+               node = find_config_node(rv, memb->nodeid);
+               if (node && !node->new)
+                       continue;
 
-               if (!found) {
-                       neg++;
-                       dlm_remove_member(ls, memb);
+               if (!node) {
                        log_debug(ls, "remove member %d", memb->nodeid);
+               } else {
+                       /* removed and re-added */
+                       log_debug(ls, "remove member %d comm_seq %u %u",
+                                 memb->nodeid, memb->comm_seq, node->comm_seq);
                }
-       }
-
-       /* Add an entry to ls_nodes_gone for members that were removed and
-          then added again, so that previous state for these nodes will be
-          cleared during recovery. */
 
-       for (i = 0; i < rv->new_count; i++) {
-               if (!dlm_is_member(ls, rv->new[i]))
-                       continue;
-               log_debug(ls, "new nodeid %d is a re-added member", rv->new[i]);
-
-               memb = kzalloc(sizeof(struct dlm_member), GFP_NOFS);
-               if (!memb)
-                       return -ENOMEM;
-               memb->nodeid = rv->new[i];
-               list_add_tail(&memb->list, &ls->ls_nodes_gone);
                neg++;
+               list_move(&memb->list, &ls->ls_nodes_gone);
+               ls->ls_num_nodes--;
+               dlm_lsop_recover_slot(ls, memb);
        }
 
        /* add new members to ls_nodes */
 
-       for (i = 0; i < rv->node_count; i++) {
-               if (dlm_is_member(ls, rv->nodeids[i]))
+       for (i = 0; i < rv->nodes_count; i++) {
+               node = &rv->nodes[i];
+               if (dlm_is_member(ls, node->nodeid))
                        continue;
-               dlm_add_member(ls, rv->nodeids[i]);
-               pos++;
-               log_debug(ls, "add member %d", rv->nodeids[i]);
+               dlm_add_member(ls, node);
+               log_debug(ls, "add member %d", node->nodeid);
        }
 
        list_for_each_entry(memb, &ls->ls_nodes, list) {
@@ -609,21 +665,22 @@ int dlm_ls_stop(struct dlm_ls *ls)
 
        if (!ls->ls_recover_begin)
                ls->ls_recover_begin = jiffies;
+
+       dlm_lsop_recover_prep(ls);
        return 0;
 }
 
 int dlm_ls_start(struct dlm_ls *ls)
 {
        struct dlm_recover *rv = NULL, *rv_old;
-       int *ids = NULL, *new = NULL;
-       int error, ids_count = 0, new_count = 0;
+       struct dlm_config_node *nodes;
+       int error, count;
 
        rv = kzalloc(sizeof(struct dlm_recover), GFP_NOFS);
        if (!rv)
                return -ENOMEM;
 
-       error = dlm_nodeid_list(ls->ls_name, &ids, &ids_count,
-                               &new, &new_count);
+       error = dlm_config_nodes(ls->ls_name, &nodes, &count);
        if (error < 0)
                goto fail;
 
@@ -638,10 +695,8 @@ int dlm_ls_start(struct dlm_ls *ls)
                goto fail;
        }
 
-       rv->nodeids = ids;
-       rv->node_count = ids_count;
-       rv->new = new;
-       rv->new_count = new_count;
+       rv->nodes = nodes;
+       rv->nodes_count = count;
        rv->seq = ++ls->ls_recover_seq;
        rv_old = ls->ls_recover_args;
        ls->ls_recover_args = rv;
@@ -649,9 +704,8 @@ int dlm_ls_start(struct dlm_ls *ls)
 
        if (rv_old) {
                log_error(ls, "unused recovery %llx %d",
-                         (unsigned long long)rv_old->seq, rv_old->node_count);
-               kfree(rv_old->nodeids);
-               kfree(rv_old->new);
+                         (unsigned long long)rv_old->seq, rv_old->nodes_count);
+               kfree(rv_old->nodes);
                kfree(rv_old);
        }
 
@@ -660,8 +714,7 @@ int dlm_ls_start(struct dlm_ls *ls)
 
  fail:
        kfree(rv);
-       kfree(ids);
-       kfree(new);
+       kfree(nodes);
        return error;
 }