drbd: Avoid NetworkFailure state during disconnect
authorPhilipp Reisner <philipp.reisner@linbit.com>
Wed, 8 Aug 2012 19:19:09 +0000 (21:19 +0200)
committerPhilipp Reisner <philipp.reisner@linbit.com>
Fri, 9 Nov 2012 13:08:18 +0000 (14:08 +0100)
Disconnecting is a cluster wide state change. In case the peer node agrees
to the state transition, it sends back the fact on the meta-data connection
and closes both sockets.

In case the node node that initiated the state transfer sees the closing
action on the data-socket, before the P_STATE_CHG_REPLY packet, it was
going into one of the network failure states.

At least with the fencing option set to something else thatn "dont-care",
the unclean shutdown of the connection causes a short IO freeze or
a fence operation.

Signed-off-by: Philipp Reisner <philipp.reisner@linbit.com>
Signed-off-by: Lars Ellenberg <lars.ellenberg@linbit.com>
drivers/block/drbd/drbd_int.h
drivers/block/drbd/drbd_receiver.c
drivers/block/drbd/drbd_state.c

index b83398d64a9ca12987745fa43fc1331039f0bbf6..37ae87e468ae66af17c58f3c212b116871316ac2 100644 (file)
@@ -816,6 +816,7 @@ enum {
                                 * so shrink_page_list() would not recurse into,
                                 * and potentially deadlock on, this drbd worker.
                                 */
+       DISCONNECT_SENT,
 };
 
 struct drbd_tconn {                    /* is a resource from the config file */
index 0eefbeb65664c49d7b8a85e8124cc874699482c2..1a8f698021a2bfe3bb2fcc90a7ceef52e916b40d 100644 (file)
@@ -522,7 +522,6 @@ static int drbd_recv(struct drbd_tconn *tconn, void *buf, size_t size)
                                conn_err(tconn, "sock_recvmsg returned %d\n", rv);
                        break;
                } else if (rv == 0) {
-                       conn_info(tconn, "sock was shut down by peer\n");
                        break;
                } else  {
                        /* signal came in, or peer/link went down,
@@ -535,9 +534,25 @@ static int drbd_recv(struct drbd_tconn *tconn, void *buf, size_t size)
 
        set_fs(oldfs);
 
+       if (rv == 0) {
+               if (test_bit(DISCONNECT_SENT, &tconn->flags)) {
+                       long t;
+                       rcu_read_lock();
+                       t = rcu_dereference(tconn->net_conf)->ping_timeo * HZ/10;
+                       rcu_read_unlock();
+
+                       t = wait_event_timeout(tconn->ping_wait, tconn->cstate < C_WF_REPORT_PARAMS, t);
+
+                       if (t)
+                               goto out;
+               }
+               conn_info(tconn, "sock was shut down by peer\n");
+       }
+
        if (rv != size)
                conn_request_state(tconn, NS(conn, C_BROKEN_PIPE), CS_HARD);
 
+out:
        return rv;
 }
 
@@ -894,6 +909,7 @@ static int conn_connect(struct drbd_tconn *tconn)
                .door_bell = COMPLETION_INITIALIZER_ONSTACK(ad.door_bell),
        };
 
+       clear_bit(DISCONNECT_SENT, &tconn->flags);
        if (conn_request_state(tconn, NS(conn, C_WF_CONNECTION), CS_VERBOSE) < SS_SUCCESS)
                return -2;
 
@@ -5316,6 +5332,18 @@ int drbd_asender(struct drbd_thread *thi)
                        received += rv;
                        buf      += rv;
                } else if (rv == 0) {
+                       if (test_bit(DISCONNECT_SENT, &tconn->flags)) {
+                               long t;
+                               rcu_read_lock();
+                               t = rcu_dereference(tconn->net_conf)->ping_timeo * HZ/10;
+                               rcu_read_unlock();
+
+                               t = wait_event_timeout(tconn->ping_wait,
+                                                      tconn->cstate < C_WF_REPORT_PARAMS,
+                                                      t);
+                               if (t)
+                                       break;
+                       }
                        conn_err(tconn, "meta connection shut down by peer.\n");
                        goto reconnect;
                } else if (rv == -EAGAIN) {
index c16349aec23c8c41188b3779e82089307639016a..4fda4e2024ecc24c5c5cd4590e51c94b6bab3ff1 100644 (file)
@@ -1742,6 +1742,9 @@ conn_cl_wide(struct drbd_tconn *tconn, union drbd_state mask, union drbd_state v
                goto abort;
        }
 
+       if (val.conn == C_DISCONNECTING)
+               set_bit(DISCONNECT_SENT, &tconn->flags);
+
        wait_event(tconn->ping_wait, (rv = _conn_rq_cond(tconn, mask, val)));
        clear_bit(CONN_WD_ST_CHG_REQ, &tconn->flags);