file-posix: Skip effectiveless OFD lock operations

If we know we've already locked the bytes, don't do it again; similarly
don't unlock a byte if we haven't locked it. This doesn't change the
behavior, but fixes a corner case explained below.

Libvirt had an error handling bug that an image can get its (ownership,
file mode, SELinux) permissions changed (RHBZ 1584982) by mistake behind
QEMU. Specifically, an image in use by Libvirt VM has:

    $ ls -lhZ b.img
    -rw-r--r--. qemu qemu system_u:object_r:svirt_image_t:s0:c600,c690 b.img

Trying to attach it a second time won't work because of image locking.
And after the error, it becomes:

    $ ls -lhZ b.img
    -rw-r--r--. root root system_u:object_r:virt_image_t:s0 b.img

Then, we won't be able to do OFD lock operations with the existing fd.
In other words, the code such as in blk_detach_dev:

    blk_set_perm(blk, 0, BLK_PERM_ALL, &error_abort);

can abort() QEMU, out of environmental changes.

This patch is an easy fix to this and the change is regardlessly
reasonable, so do it.

Signed-off-by: Fam Zheng <famz@redhat.com>
Reviewed-by: Max Reitz <mreitz@redhat.com>
Signed-off-by: Kevin Wolf <kwolf@redhat.com>
This commit is contained in:
Fam Zheng 2018-10-11 15:21:33 +08:00 committed by Kevin Wolf
parent a883d6a0bc
commit 2996ffad3a

View File

@ -152,6 +152,11 @@ typedef struct BDRVRawState {
uint64_t perm; uint64_t perm;
uint64_t shared_perm; uint64_t shared_perm;
/* The perms bits whose corresponding bytes are already locked in
* s->lock_fd. */
uint64_t locked_perm;
uint64_t locked_shared_perm;
#ifdef CONFIG_XFS #ifdef CONFIG_XFS
bool is_xfs:1; bool is_xfs:1;
#endif #endif
@ -689,43 +694,72 @@ typedef enum {
* file; if @unlock == true, also unlock the unneeded bytes. * file; if @unlock == true, also unlock the unneeded bytes.
* @shared_perm_lock_bits is the mask of all permissions that are NOT shared. * @shared_perm_lock_bits is the mask of all permissions that are NOT shared.
*/ */
static int raw_apply_lock_bytes(int fd, static int raw_apply_lock_bytes(BDRVRawState *s, int fd,
uint64_t perm_lock_bits, uint64_t perm_lock_bits,
uint64_t shared_perm_lock_bits, uint64_t shared_perm_lock_bits,
bool unlock, Error **errp) bool unlock, Error **errp)
{ {
int ret; int ret;
int i; int i;
uint64_t locked_perm, locked_shared_perm;
if (s) {
locked_perm = s->locked_perm;
locked_shared_perm = s->locked_shared_perm;
} else {
/*
* We don't have the previous bits, just lock/unlock for each of the
* requested bits.
*/
if (unlock) {
locked_perm = BLK_PERM_ALL;
locked_shared_perm = BLK_PERM_ALL;
} else {
locked_perm = 0;
locked_shared_perm = 0;
}
}
PERM_FOREACH(i) { PERM_FOREACH(i) {
int off = RAW_LOCK_PERM_BASE + i; int off = RAW_LOCK_PERM_BASE + i;
if (perm_lock_bits & (1ULL << i)) { uint64_t bit = (1ULL << i);
if ((perm_lock_bits & bit) && !(locked_perm & bit)) {
ret = qemu_lock_fd(fd, off, 1, false); ret = qemu_lock_fd(fd, off, 1, false);
if (ret) { if (ret) {
error_setg(errp, "Failed to lock byte %d", off); error_setg(errp, "Failed to lock byte %d", off);
return ret; return ret;
} else if (s) {
s->locked_perm |= bit;
} }
} else if (unlock) { } else if (unlock && (locked_perm & bit) && !(perm_lock_bits & bit)) {
ret = qemu_unlock_fd(fd, off, 1); ret = qemu_unlock_fd(fd, off, 1);
if (ret) { if (ret) {
error_setg(errp, "Failed to unlock byte %d", off); error_setg(errp, "Failed to unlock byte %d", off);
return ret; return ret;
} else if (s) {
s->locked_perm &= ~bit;
} }
} }
} }
PERM_FOREACH(i) { PERM_FOREACH(i) {
int off = RAW_LOCK_SHARED_BASE + i; int off = RAW_LOCK_SHARED_BASE + i;
if (shared_perm_lock_bits & (1ULL << i)) { uint64_t bit = (1ULL << i);
if ((shared_perm_lock_bits & bit) && !(locked_shared_perm & bit)) {
ret = qemu_lock_fd(fd, off, 1, false); ret = qemu_lock_fd(fd, off, 1, false);
if (ret) { if (ret) {
error_setg(errp, "Failed to lock byte %d", off); error_setg(errp, "Failed to lock byte %d", off);
return ret; return ret;
} else if (s) {
s->locked_shared_perm |= bit;
} }
} else if (unlock) { } else if (unlock && (locked_shared_perm & bit) &&
!(shared_perm_lock_bits & bit)) {
ret = qemu_unlock_fd(fd, off, 1); ret = qemu_unlock_fd(fd, off, 1);
if (ret) { if (ret) {
error_setg(errp, "Failed to unlock byte %d", off); error_setg(errp, "Failed to unlock byte %d", off);
return ret; return ret;
} else if (s) {
s->locked_shared_perm &= ~bit;
} }
} }
} }
@ -793,7 +827,7 @@ static int raw_handle_perm_lock(BlockDriverState *bs,
switch (op) { switch (op) {
case RAW_PL_PREPARE: case RAW_PL_PREPARE:
ret = raw_apply_lock_bytes(s->lock_fd, s->perm | new_perm, ret = raw_apply_lock_bytes(s, s->lock_fd, s->perm | new_perm,
~s->shared_perm | ~new_shared, ~s->shared_perm | ~new_shared,
false, errp); false, errp);
if (!ret) { if (!ret) {
@ -808,7 +842,7 @@ static int raw_handle_perm_lock(BlockDriverState *bs,
op = RAW_PL_ABORT; op = RAW_PL_ABORT;
/* fall through to unlock bytes. */ /* fall through to unlock bytes. */
case RAW_PL_ABORT: case RAW_PL_ABORT:
raw_apply_lock_bytes(s->lock_fd, s->perm, ~s->shared_perm, raw_apply_lock_bytes(s, s->lock_fd, s->perm, ~s->shared_perm,
true, &local_err); true, &local_err);
if (local_err) { if (local_err) {
/* Theoretically the above call only unlocks bytes and it cannot /* Theoretically the above call only unlocks bytes and it cannot
@ -818,7 +852,7 @@ static int raw_handle_perm_lock(BlockDriverState *bs,
} }
break; break;
case RAW_PL_COMMIT: case RAW_PL_COMMIT:
raw_apply_lock_bytes(s->lock_fd, new_perm, ~new_shared, raw_apply_lock_bytes(s, s->lock_fd, new_perm, ~new_shared,
true, &local_err); true, &local_err);
if (local_err) { if (local_err) {
/* Theoretically the above call only unlocks bytes and it cannot /* Theoretically the above call only unlocks bytes and it cannot
@ -2220,7 +2254,7 @@ raw_co_create(BlockdevCreateOptions *options, Error **errp)
shared = BLK_PERM_ALL & ~BLK_PERM_RESIZE; shared = BLK_PERM_ALL & ~BLK_PERM_RESIZE;
/* Step one: Take locks */ /* Step one: Take locks */
result = raw_apply_lock_bytes(fd, perm, ~shared, false, errp); result = raw_apply_lock_bytes(NULL, fd, perm, ~shared, false, errp);
if (result < 0) { if (result < 0) {
goto out_close; goto out_close;
} }
@ -2264,7 +2298,7 @@ raw_co_create(BlockdevCreateOptions *options, Error **errp)
} }
out_unlock: out_unlock:
raw_apply_lock_bytes(fd, 0, 0, true, &local_err); raw_apply_lock_bytes(NULL, fd, 0, 0, true, &local_err);
if (local_err) { if (local_err) {
/* The above call should not fail, and if it does, that does /* The above call should not fail, and if it does, that does
* not mean the whole creation operation has failed. So * not mean the whole creation operation has failed. So