ocfs2: fix a tiny race that leads file system read-only

author Jiufei Xue <xuejiufei@huawei.com>

Tue, 15 Mar 2016 21:53:20 +0000 (14:53 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Tue, 15 Mar 2016 23:55:16 +0000 (16:55 -0700)
author Jiufei Xue <xuejiufei@huawei.com>
Tue, 15 Mar 2016 21:53:20 +0000 (14:53 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Tue, 15 Mar 2016 23:55:16 +0000 (16:55 -0700)
diff --git a/fs/ocfs2/dlm/dlmcommon.h b/fs/ocfs2/dlm/dlmcommon.h

index 3b77862fc85d39eac5e03babde712e177caf3d6a..004f2cbe8f71e7c4ffb8833f8cc1e249680f99c4 100644 (file)
--- a/fs/ocfs2/dlm/dlmcommon.h
+++ b/fs/ocfs2/dlm/dlmcommon.h
@@ -282,6 +282,7 @@ static inline void __dlm_set_joining_node(struct dlm_ctxt *dlm,
  #define DLM_LOCK_RES_DROPPING_REF         0x00000040
  #define DLM_LOCK_RES_BLOCK_DIRTY          0x00001000
  #define DLM_LOCK_RES_SETREF_INPROG        0x00002000
+#define DLM_LOCK_RES_RECOVERY_WAITING     0x00004000
  
  /* max milliseconds to wait to sync up a network failure with a node death */
  #define DLM_NODE_DEATH_WAIT_MAX (5 * 1000)
@@ -804,7 +805,8 @@ __dlm_lockres_state_to_status(struct dlm_lock_resource *res)
  
         assert_spin_locked(&res->spinlock);
  
-       if (res->state & DLM_LOCK_RES_RECOVERING)
+       if (res->state & (DLM_LOCK_RES_RECOVERING|
+                       DLM_LOCK_RES_RECOVERY_WAITING))
                 status = DLM_RECOVERING;
         else if (res->state & DLM_LOCK_RES_MIGRATING)
                 status = DLM_MIGRATING;
@@ -1026,6 +1028,7 @@ static inline void __dlm_wait_on_lockres(struct dlm_lock_resource *res)
  {
         __dlm_wait_on_lockres_flags(res, (DLM_LOCK_RES_IN_PROGRESS|
                                           DLM_LOCK_RES_RECOVERING|
+                                         DLM_LOCK_RES_RECOVERY_WAITING|
                                           DLM_LOCK_RES_MIGRATING));
  }
  
diff --git a/fs/ocfs2/dlm/dlmmaster.c b/fs/ocfs2/dlm/dlmmaster.c

index 87e22541850e3138b506cb4032dc94671c12a157..9aed6e2022014afb71988de025e583b38aea3892 100644 (file)
--- a/fs/ocfs2/dlm/dlmmaster.c
+++ b/fs/ocfs2/dlm/dlmmaster.c
@@ -2550,7 +2550,8 @@ static int dlm_is_lockres_migrateable(struct dlm_ctxt *dlm,
                 return 0;
  
         /* delay migration when the lockres is in RECOCERING state */
-       if (res->state & DLM_LOCK_RES_RECOVERING)
+       if (res->state & (DLM_LOCK_RES_RECOVERING|
+                       DLM_LOCK_RES_RECOVERY_WAITING))
                 return 0;
  
         if (res->owner != dlm->node_num)
diff --git a/fs/ocfs2/dlm/dlmrecovery.c b/fs/ocfs2/dlm/dlmrecovery.c

index 213279db3f282021e3f4a3647e1aea460eecf56d..cd38488a10fc104fba6339cc2d6c9501a4251dfe 100644 (file)
--- a/fs/ocfs2/dlm/dlmrecovery.c
+++ b/fs/ocfs2/dlm/dlmrecovery.c
@@ -2175,6 +2175,13 @@ static void dlm_finish_local_lockres_recovery(struct dlm_ctxt *dlm,
         for (i = 0; i < DLM_HASH_BUCKETS; i++) {
                 bucket = dlm_lockres_hash(dlm, i);
                 hlist_for_each_entry(res, bucket, hash_node) {
+                       if (res->state & DLM_LOCK_RES_RECOVERY_WAITING) {
+                               spin_lock(&res->spinlock);
+                               res->state &= ~DLM_LOCK_RES_RECOVERY_WAITING;
+                               spin_unlock(&res->spinlock);
+                               wake_up(&res->wq);
+                       }
+
                         if (!(res->state & DLM_LOCK_RES_RECOVERING))
                                 continue;
  
@@ -2312,6 +2319,7 @@ static void dlm_free_dead_locks(struct dlm_ctxt *dlm,
                              res->lockname.len, res->lockname.name, freed, dead_node);
                         __dlm_print_one_lock_resource(res);
                 }
+               res->state |= DLM_LOCK_RES_RECOVERY_WAITING;
                 dlm_lockres_clear_refmap_bit(dlm, res, dead_node);
         } else if (test_bit(dead_node, res->refmap)) {
                 mlog(0, "%s:%.*s: dead node %u had a ref, but had "
diff --git a/fs/ocfs2/dlm/dlmthread.c b/fs/ocfs2/dlm/dlmthread.c

index 22e6eb8b8d22f9f9f15aa886467cabca6649ce48..68d239ba0c63c8c925644755d16a1f020298bfba 100644 (file)
--- a/fs/ocfs2/dlm/dlmthread.c
+++ b/fs/ocfs2/dlm/dlmthread.c
@@ -106,7 +106,8 @@ int __dlm_lockres_unused(struct dlm_lock_resource *res)
         if (!list_empty(&res->dirty) || res->state & DLM_LOCK_RES_DIRTY)
                 return 0;
  
-       if (res->state & DLM_LOCK_RES_RECOVERING)
+       if (res->state & (DLM_LOCK_RES_RECOVERING|
+                       DLM_LOCK_RES_RECOVERY_WAITING))
                 return 0;
  
         /* Another node has this resource with this node as the master */
@@ -707,7 +708,8 @@ static int dlm_thread(void *data)
                          * dirty for a short while. */
                         BUG_ON(res->state & DLM_LOCK_RES_MIGRATING);
                         if (res->state & (DLM_LOCK_RES_IN_PROGRESS |
-                                         DLM_LOCK_RES_RECOVERING)) {
+                                         DLM_LOCK_RES_RECOVERING |
+                                         DLM_LOCK_RES_RECOVERY_WAITING)) {
                                 /* move it to the tail and keep going */
                                 res->state &= ~DLM_LOCK_RES_DIRTY;
                                 spin_unlock(&res->spinlock);
author	Jiufei Xue <xuejiufei@huawei.com>
	Tue, 15 Mar 2016 21:53:20 +0000 (14:53 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Tue, 15 Mar 2016 23:55:16 +0000 (16:55 -0700)
fs/ocfs2/dlm/dlmcommon.h		patch \| blob \| blame \| history
fs/ocfs2/dlm/dlmmaster.c		patch \| blob \| blame \| history
fs/ocfs2/dlm/dlmrecovery.c		patch \| blob \| blame \| history
fs/ocfs2/dlm/dlmthread.c		patch \| blob \| blame \| history