[Ocfs2-devel] [PATCH 2/2] ocfs2: o2dlm fix race in purge lockres and newlock (orabug 9094491) -backport to 1.2
Sunil Mushran
sunil.mushran at oracle.com
Sun Jun 27 11:47:03 PDT 2010
Just to be clear: this is only an interim patch for 1.2. It is not for
inclusion in mainline.
On 06/26/2010 04:32 AM, Wengang Wang wrote:
> This patch fixes the following hole.
> dlmlock tries to create a new lock on a lockres that is on the purge list. It
> calls dlm_get_lock_resource and later adds a lock to the blocked list. But in
> this window, dlm_thread can purge the lockres and unhash it. This will cause a
> BUG because, when the AST comes back from the master, the lockres is not found.
>
> This patch marks the lockres with a new state, DLM_LOCK_RES_IN_USE, which
> prevents dlm_thread from purging the lockres while it is in use.
>
> Signed-off-by: Srinivas Eeda<srinivas.eeda at oracle.com>
> Signed-off-by: Sunil Mushran<sunil.mushran at oracle.com>
> ---
> dlmcommon.h | 1 +
> dlmlock.c | 4 ++++
> dlmmaster.c | 5 ++++-
> dlmthread.c | 1 +
> 4 files changed, 10 insertions(+), 1 deletion(-)
>
> diff -upr ocfs2-1.2.9-8-test/fs/ocfs2/dlm/dlmcommon.h ocfs2-1.2.9-8.2/fs/ocfs2/dlm/dlmcommon.h
> --- ocfs2-1.2.9-8-test/fs/ocfs2/dlm/dlmcommon.h 2010-06-26 19:04:32.000000000 +0800
> +++ ocfs2-1.2.9-8.2/fs/ocfs2/dlm/dlmcommon.h 2010-06-26 19:18:33.000000000 +0800
> @@ -218,6 +218,7 @@ static inline void __dlm_set_joining_nod
> #define DLM_LOCK_RES_IN_PROGRESS 0x00000010
> #define DLM_LOCK_RES_MIGRATING 0x00000020
> #define DLM_LOCK_RES_DROPPING_REF 0x00000040
> +#define DLM_LOCK_RES_IN_USE 0x00000100
> #define DLM_LOCK_RES_BLOCK_DIRTY 0x00001000
> #define DLM_LOCK_RES_SETREF_INPROG 0x00002000
>
> diff -upr ocfs2-1.2.9-8-test/fs/ocfs2/dlm/dlmlock.c ocfs2-1.2.9-8.2/fs/ocfs2/dlm/dlmlock.c
> --- ocfs2-1.2.9-8-test/fs/ocfs2/dlm/dlmlock.c 2010-06-26 19:04:22.000000000 +0800
> +++ ocfs2-1.2.9-8.2/fs/ocfs2/dlm/dlmlock.c 2010-06-26 19:21:06.000000000 +0800
> @@ -116,6 +116,8 @@ static enum dlm_status dlmlock_master(st
> if (status != DLM_NORMAL&&
> lock->ml.node != dlm->node_num) {
> /* erf. state changed after lock was dropped. */
> + /* DLM_LOCK_RES_IN_USE is set in dlm_get_lock_resource */
> + res->state&= ~DLM_LOCK_RES_IN_USE;
> spin_unlock(&res->spinlock);
> dlm_error(status);
> return status;
> @@ -162,6 +164,7 @@ static enum dlm_status dlmlock_master(st
> kick_thread = 1;
> }
> }
> + res->state&= ~DLM_LOCK_RES_IN_USE;
> /* reduce the inflight count, this may result in the lockres
> * being purged below during calc_usage */
> if (lock->ml.node == dlm->node_num)
> @@ -228,6 +231,7 @@ static enum dlm_status dlmlock_remote(st
>
> spin_lock(&res->spinlock);
> res->state&= ~DLM_LOCK_RES_IN_PROGRESS;
> + res->state&= ~DLM_LOCK_RES_IN_USE;
> lock->lock_pending = 0;
> if (status != DLM_NORMAL) {
> if (status == DLM_RECOVERING&&
> diff -upr ocfs2-1.2.9-8-test/fs/ocfs2/dlm/dlmmaster.c ocfs2-1.2.9-8.2/fs/ocfs2/dlm/dlmmaster.c
> --- ocfs2-1.2.9-8-test/fs/ocfs2/dlm/dlmmaster.c 2010-06-26 19:04:22.000000000 +0800
> +++ ocfs2-1.2.9-8.2/fs/ocfs2/dlm/dlmmaster.c 2010-06-26 19:23:57.000000000 +0800
> @@ -804,12 +804,15 @@ lookup:
> if (tmpres) {
> int dropping_ref = 0;
>
> + tmpres->state |= DLM_LOCK_RES_IN_USE;
> spin_lock(&tmpres->spinlock);
> if (tmpres->owner == dlm->node_num) {
> BUG_ON(tmpres->state& DLM_LOCK_RES_DROPPING_REF);
> dlm_lockres_grab_inflight_ref(dlm, tmpres);
> - } else if (tmpres->state& DLM_LOCK_RES_DROPPING_REF)
> + } else if (tmpres->state& DLM_LOCK_RES_DROPPING_REF) {
> + tmpres->state&= ~DLM_LOCK_RES_IN_USE;
> dropping_ref = 1;
> + }
> spin_unlock(&tmpres->spinlock);
> spin_unlock(&dlm->spinlock);
>
> diff -upr ocfs2-1.2.9-8-test/fs/ocfs2/dlm/dlmthread.c ocfs2-1.2.9-8.2/fs/ocfs2/dlm/dlmthread.c
> --- ocfs2-1.2.9-8-test/fs/ocfs2/dlm/dlmthread.c 2010-06-26 19:04:32.000000000 +0800
> +++ ocfs2-1.2.9-8.2/fs/ocfs2/dlm/dlmthread.c 2010-06-26 19:25:06.000000000 +0800
> @@ -97,6 +97,7 @@ int __dlm_lockres_has_locks(struct dlm_l
> int __dlm_lockres_unused(struct dlm_lock_resource *res)
> {
> if (!__dlm_lockres_has_locks(res)&&
> + !(res->state& DLM_LOCK_RES_IN_USE)&&
> (list_empty(&res->dirty)&& !(res->state& DLM_LOCK_RES_DIRTY))) {
> /* try not to scan the bitmap unless the first two
> * conditions are already true */
>
> _______________________________________________
> Ocfs2-devel mailing list
> Ocfs2-devel at oss.oracle.com
> http://oss.oracle.com/mailman/listinfo/ocfs2-devel
>
More information about the Ocfs2-devel
mailing list