summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorDavid Teigland <teigland@redhat.com>2015-10-14 14:36:46 -0500
committerDavid Teigland <teigland@redhat.com>2015-10-14 14:39:29 -0500
commitdf34fcdafd20ac195e588a06c8fc5a904fa71669 (patch)
tree46d12ef446979f9e1160a824a731d7ba5bb3ec9e
parenta6d1c8ac651ecdc6fbdfa20f892ba318c2dddeda (diff)
downloadlvm2-df34fcdafd20ac195e588a06c8fc5a904fa71669.tar.gz
lvmlockd: use flag to avoid blocking in sanlock_acquire
If a host failed while holding a sanlock lease, sanlock_acquire will by default block and wait for the lease to expire before returning. We want it to return with an error so we can retry instead of blocking, which allows us to process other lock operations. (Enclose this in an ifdef until the new flag appears in a sanlock release.)
-rw-r--r--daemons/lvmlockd/lvmlockd-sanlock.c29
1 files changed, 29 insertions, 0 deletions
diff --git a/daemons/lvmlockd/lvmlockd-sanlock.c b/daemons/lvmlockd/lvmlockd-sanlock.c
index 1e691eb94..e1a85b4cc 100644
--- a/daemons/lvmlockd/lvmlockd-sanlock.c
+++ b/daemons/lvmlockd/lvmlockd-sanlock.c
@@ -1392,6 +1392,15 @@ int lm_lock_sanlock(struct lockspace *ls, struct resource *r, int ld_mode,
if (adopt)
flags |= SANLK_ACQUIRE_ORPHAN_ONLY;
+#ifdef SANLOCK_HAS_ACQUIRE_OWNER_NOWAIT
+ /*
+ * Don't wait for a lease held by a failed host to expire: doing so
+ * makes sanlock_acquire block for a long time, which would prevent this
+ * thread from processing other lock requests.
+ */
+ flags |= SANLK_ACQUIRE_OWNER_NOWAIT;
+#endif
+
rv = sanlock_acquire(lms->sock, -1, flags, 1, &rs, NULL);
if (rv == -EAGAIN) {
@@ -1462,6 +1471,26 @@ int lm_lock_sanlock(struct lockspace *ls, struct resource *r, int ld_mode,
return -EAGAIN;
}
+#ifdef SANLOCK_HAS_ACQUIRE_OWNER_NOWAIT
+ if (rv == SANLK_ACQUIRE_OWNED_RETRY) {
+ /*
+ * The lock is held by a failed host, and will eventually
+ * expire. If we retry we'll eventually acquire the lock
+ * (or find someone else has acquired it). The EAGAIN retry
+ * attempts for SH locks above would not be sufficient for
+ * the length of expiration time. We could add a longer
+ * retry time here to cover the full expiration time and block
+ * the activation command for that long. For now just return
+ * the standard error indicating that another host still owns
+ * the lease. FIXME: return a different error number so the
+ * command can print a different error indicating that the
+ * owner of the lease is in the process of expiring?
+ */
+ log_debug("S %s R %s lock_san acquire mode %d rv %d", ls->name, r->name, ld_mode, rv);
+ *retry = 0;
+ return -EAGAIN;
+ }
+#endif
if (rv < 0) {
log_error("S %s R %s lock_san acquire error %d",
ls->name, r->name, rv);