drbd: ignore "all zero" peer volume sizes in handshake
author Lars Ellenberg <lars.ellenberg@linbit.com>
Thu, 20 Dec 2018 16:23:31 +0000 (17:23 +0100)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Thu, 5 Dec 2019 14:37:44 +0000 (15:37 +0100)
[ Upstream commit 94c43a13b8d6e3e0dd77b3536b5e04a84936b762 ]

During handshake, if we are diskless ourselves, we used to accept any size
presented by the peer.

That size could be zero if the peer was just brought up and connected
to us without having a disk attached first, in which case both
peers would just "flip" their volume sizes.

Now, even a diskless node will ignore "zero" sizes
presented by a diskless peer.

Also, a currently Diskless Primary will refuse to shrink during handshake:
it may be frozen, and waiting for a "suitable" local disk or peer to
re-appear (on-no-data-accessible suspend-io). If the peer is smaller
than what we used to be, it is not suitable.

The logic for a diskless node during handshake is now supposed to be:
believe the peer, if
 - I don't have a current size myself
 - we agree on the size anyways
 - I do have a current size, am Secondary, and he has the only disk
 - I do have a current size, am Primary, and he has the only disk,
   which is larger than my current size

Signed-off-by: Lars Ellenberg <lars.ellenberg@linbit.com>
Signed-off-by: Jens Axboe <axboe@kernel.dk>
Signed-off-by: Sasha Levin <sashal@kernel.org>
drivers/block/drbd/drbd_receiver.c

index 8fbdfaacc222676cc2650c5579ce206072aa40e1..08586bc5219bfe1dbf5519cf62505362f87d4155 100644 (file)
@@ -3977,6 +3977,7 @@ static int receive_sizes(struct drbd_connection *connection, struct packet_info
        struct o_qlim *o = (connection->agreed_features & DRBD_FF_WSAME) ? p->qlim : NULL;
        enum determine_dev_size dd = DS_UNCHANGED;
        sector_t p_size, p_usize, p_csize, my_usize;
+       sector_t new_size, cur_size;
        int ldsc = 0; /* local disk size changed */
        enum dds_flags ddsf;
 
@@ -3984,6 +3985,7 @@ static int receive_sizes(struct drbd_connection *connection, struct packet_info
        if (!peer_device)
                return config_unknown_volume(connection, pi);
        device = peer_device->device;
+       cur_size = drbd_get_capacity(device->this_bdev);
 
        p_size = be64_to_cpu(p->d_size);
        p_usize = be64_to_cpu(p->u_size);
@@ -3994,7 +3996,6 @@ static int receive_sizes(struct drbd_connection *connection, struct packet_info
        device->p_size = p_size;
 
        if (get_ldev(device)) {
-               sector_t new_size, cur_size;
                rcu_read_lock();
                my_usize = rcu_dereference(device->ldev->disk_conf)->disk_size;
                rcu_read_unlock();
@@ -4012,7 +4013,6 @@ static int receive_sizes(struct drbd_connection *connection, struct packet_info
                /* Never shrink a device with usable data during connect.
                   But allow online shrinking if we are connected. */
                new_size = drbd_new_dev_size(device, device->ldev, p_usize, 0);
-               cur_size = drbd_get_capacity(device->this_bdev);
                if (new_size < cur_size &&
                    device->state.disk >= D_OUTDATED &&
                    device->state.conn < C_CONNECTED) {
@@ -4077,9 +4077,36 @@ static int receive_sizes(struct drbd_connection *connection, struct packet_info
                 *
                 * However, if he sends a zero current size,
                 * take his (user-capped or) backing disk size anyways.
+                *
+                * Unless of course he does not have a disk himself.
+                * In which case we ignore this completely.
                 */
+               sector_t new_size = p_csize ?: p_usize ?: p_size;
                drbd_reconsider_queue_parameters(device, NULL, o);
-               drbd_set_my_capacity(device, p_csize ?: p_usize ?: p_size);
+               if (new_size == 0) {
+                       /* Ignore, peer does not know anything. */
+               } else if (new_size == cur_size) {
+                       /* nothing to do */
+               } else if (cur_size != 0 && p_size == 0) {
+                       drbd_warn(device, "Ignored diskless peer device size (peer:%llu != me:%llu sectors)!\n",
+                                       (unsigned long long)new_size, (unsigned long long)cur_size);
+               } else if (new_size < cur_size && device->state.role == R_PRIMARY) {
+                       drbd_err(device, "The peer's device size is too small! (%llu < %llu sectors); demote me first!\n",
+                                       (unsigned long long)new_size, (unsigned long long)cur_size);
+                       conn_request_state(peer_device->connection, NS(conn, C_DISCONNECTING), CS_HARD);
+                       return -EIO;
+               } else {
+                       /* I believe the peer, if
+                        *  - I don't have a current size myself
+                        *  - we agree on the size anyways
+                        *  - I do have a current size, am Secondary,
+                        *    and he has the only disk
+                        *  - I do have a current size, am Primary,
+                        *    and he has the only disk,
+                        *    which is larger than my current size
+                        */
+                       drbd_set_my_capacity(device, new_size);
+               }
        }
 
        if (get_ldev(device)) {