Skip to content

Commit 9875201

Browse files
committed
rbd: fix use-after free of rbd_dev->disk
Removing a device deallocates the disk, unschedules the watch, and finally cleans up the rbd_dev structure. rbd_dev_refresh(), called from the watch callback, updates the disk size and rbd_dev structure. With no locking between them, rbd_dev_refresh() may use the device or rbd_dev after they've been freed. To fix this, check whether RBD_DEV_FLAG_REMOVING is set before updating the disk size in rbd_dev_refresh(). In order to prevent a race where rbd_dev_refresh() is already revalidating the disk when rbd_remove() is called, move the call to rbd_bus_del_dev() after the watch is unregistered and all notifies are complete. It's safe to defer deleting this structure because no new requests can be submitted once the RBD_DEV_FLAG_REMOVING is set, since the device cannot be opened. Fixes: http://tracker.ceph.com/issues/5636 Signed-off-by: Josh Durgin <[email protected]> Reviewed-by: Alex Elder <[email protected]>
1 parent 20e0af6 commit 9875201

File tree

1 file changed

+33
-7
lines changed

1 file changed

+33
-7
lines changed

drivers/block/rbd.c

Lines changed: 33 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -3325,6 +3325,31 @@ static void rbd_exists_validate(struct rbd_device *rbd_dev)
33253325
clear_bit(RBD_DEV_FLAG_EXISTS, &rbd_dev->flags);
33263326
}
33273327

3328+
static void rbd_dev_update_size(struct rbd_device *rbd_dev)
3329+
{
3330+
sector_t size;
3331+
bool removing;
3332+
3333+
/*
3334+
* Don't hold the lock while doing disk operations,
3335+
* or lock ordering will conflict with the bdev mutex via:
3336+
* rbd_add() -> blkdev_get() -> rbd_open()
3337+
*/
3338+
spin_lock_irq(&rbd_dev->lock);
3339+
removing = test_bit(RBD_DEV_FLAG_REMOVING, &rbd_dev->flags);
3340+
spin_unlock_irq(&rbd_dev->lock);
3341+
/*
3342+
* If the device is being removed, rbd_dev->disk has
3343+
* been destroyed, so don't try to update its size
3344+
*/
3345+
if (!removing) {
3346+
size = (sector_t)rbd_dev->mapping.size / SECTOR_SIZE;
3347+
dout("setting size to %llu sectors", (unsigned long long)size);
3348+
set_capacity(rbd_dev->disk, size);
3349+
revalidate_disk(rbd_dev->disk);
3350+
}
3351+
}
3352+
33283353
static int rbd_dev_refresh(struct rbd_device *rbd_dev)
33293354
{
33303355
u64 mapping_size;
@@ -3344,12 +3369,7 @@ static int rbd_dev_refresh(struct rbd_device *rbd_dev)
33443369
up_write(&rbd_dev->header_rwsem);
33453370

33463371
if (mapping_size != rbd_dev->mapping.size) {
3347-
sector_t size;
3348-
3349-
size = (sector_t)rbd_dev->mapping.size / SECTOR_SIZE;
3350-
dout("setting size to %llu sectors", (unsigned long long)size);
3351-
set_capacity(rbd_dev->disk, size);
3352-
revalidate_disk(rbd_dev->disk);
3372+
rbd_dev_update_size(rbd_dev);
33533373
}
33543374

33553375
return ret;
@@ -5160,7 +5180,6 @@ static ssize_t rbd_remove(struct bus_type *bus,
51605180
if (ret < 0 || already)
51615181
return ret;
51625182

5163-
rbd_bus_del_dev(rbd_dev);
51645183
ret = rbd_dev_header_watch_sync(rbd_dev, false);
51655184
if (ret)
51665185
rbd_warn(rbd_dev, "failed to cancel watch event (%d)\n", ret);
@@ -5171,6 +5190,13 @@ static ssize_t rbd_remove(struct bus_type *bus,
51715190
*/
51725191
dout("%s: flushing notifies", __func__);
51735192
ceph_osdc_flush_notifies(&rbd_dev->rbd_client->client->osdc);
5193+
/*
5194+
* Don't free anything from rbd_dev->disk until after all
5195+
* notifies are completely processed. Otherwise
5196+
* rbd_bus_del_dev() will race with rbd_watch_cb(), resulting
5197+
* in a potential use after free of rbd_dev->disk or rbd_dev.
5198+
*/
5199+
rbd_bus_del_dev(rbd_dev);
51745200
rbd_dev_image_release(rbd_dev);
51755201
module_put(THIS_MODULE);
51765202

0 commit comments

Comments
 (0)