Donate to e Foundation | Murena handsets with /e/OS | Own a part of Murena! Learn more

Commit e9ff04dd authored by Linus Torvalds's avatar Linus Torvalds
Browse files
Pull ceph fixes from Sage Weil:
 "These fix several bugs with RBD from 3.11 that didn't get tested in
  time for the merge window: some error handling, a use-after-free, and
  a sequencing issue when unmapping and image races with a notify
  operation.

  There is also a patch fixing a problem with the new ceph + fscache
  code that just went in"

* 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/sage/ceph-client:
  fscache: check consistency does not decrement refcount
  rbd: fix error handling from rbd_snap_name()
  rbd: ignore unmapped snapshots that no longer exist
  rbd: fix use-after free of rbd_dev->disk
  rbd: make rbd_obj_notify_ack() synchronous
  rbd: complete notifies before cleaning up osd_client and rbd_dev
  libceph: add function to ensure notifies are complete
parents ed24fee2 9c89d629
Loading
Loading
Loading
Loading
+59 −18
Original line number Original line Diff line number Diff line
@@ -931,12 +931,14 @@ static const char *rbd_dev_v1_snap_name(struct rbd_device *rbd_dev,
					u64 snap_id)
					u64 snap_id)
{
{
	u32 which;
	u32 which;
	const char *snap_name;


	which = rbd_dev_snap_index(rbd_dev, snap_id);
	which = rbd_dev_snap_index(rbd_dev, snap_id);
	if (which == BAD_SNAP_INDEX)
	if (which == BAD_SNAP_INDEX)
		return NULL;
		return ERR_PTR(-ENOENT);


	return _rbd_dev_v1_snap_name(rbd_dev, which);
	snap_name = _rbd_dev_v1_snap_name(rbd_dev, which);
	return snap_name ? snap_name : ERR_PTR(-ENOMEM);
}
}


static const char *rbd_snap_name(struct rbd_device *rbd_dev, u64 snap_id)
static const char *rbd_snap_name(struct rbd_device *rbd_dev, u64 snap_id)
@@ -2812,7 +2814,7 @@ static void rbd_img_parent_read(struct rbd_obj_request *obj_request)
	obj_request_done_set(obj_request);
	obj_request_done_set(obj_request);
}
}


static int rbd_obj_notify_ack(struct rbd_device *rbd_dev, u64 notify_id)
static int rbd_obj_notify_ack_sync(struct rbd_device *rbd_dev, u64 notify_id)
{
{
	struct rbd_obj_request *obj_request;
	struct rbd_obj_request *obj_request;
	struct ceph_osd_client *osdc = &rbd_dev->rbd_client->client->osdc;
	struct ceph_osd_client *osdc = &rbd_dev->rbd_client->client->osdc;
@@ -2827,15 +2829,16 @@ static int rbd_obj_notify_ack(struct rbd_device *rbd_dev, u64 notify_id)
	obj_request->osd_req = rbd_osd_req_create(rbd_dev, false, obj_request);
	obj_request->osd_req = rbd_osd_req_create(rbd_dev, false, obj_request);
	if (!obj_request->osd_req)
	if (!obj_request->osd_req)
		goto out;
		goto out;
	obj_request->callback = rbd_obj_request_put;


	osd_req_op_watch_init(obj_request->osd_req, 0, CEPH_OSD_OP_NOTIFY_ACK,
	osd_req_op_watch_init(obj_request->osd_req, 0, CEPH_OSD_OP_NOTIFY_ACK,
					notify_id, 0, 0);
					notify_id, 0, 0);
	rbd_osd_req_format_read(obj_request);
	rbd_osd_req_format_read(obj_request);


	ret = rbd_obj_request_submit(osdc, obj_request);
	ret = rbd_obj_request_submit(osdc, obj_request);
out:
	if (ret)
	if (ret)
		goto out;
	ret = rbd_obj_request_wait(obj_request);
out:
	rbd_obj_request_put(obj_request);
	rbd_obj_request_put(obj_request);


	return ret;
	return ret;
@@ -2856,7 +2859,7 @@ static void rbd_watch_cb(u64 ver, u64 notify_id, u8 opcode, void *data)
	if (ret)
	if (ret)
		rbd_warn(rbd_dev, "header refresh error (%d)\n", ret);
		rbd_warn(rbd_dev, "header refresh error (%d)\n", ret);


	rbd_obj_notify_ack(rbd_dev, notify_id);
	rbd_obj_notify_ack_sync(rbd_dev, notify_id);
}
}


/*
/*
@@ -3328,6 +3331,31 @@ static void rbd_exists_validate(struct rbd_device *rbd_dev)
		clear_bit(RBD_DEV_FLAG_EXISTS, &rbd_dev->flags);
		clear_bit(RBD_DEV_FLAG_EXISTS, &rbd_dev->flags);
}
}


static void rbd_dev_update_size(struct rbd_device *rbd_dev)
{
	sector_t size;
	bool removing;

	/*
	 * Don't hold the lock while doing disk operations,
	 * or lock ordering will conflict with the bdev mutex via:
	 * rbd_add() -> blkdev_get() -> rbd_open()
	 */
	spin_lock_irq(&rbd_dev->lock);
	removing = test_bit(RBD_DEV_FLAG_REMOVING, &rbd_dev->flags);
	spin_unlock_irq(&rbd_dev->lock);
	/*
	 * If the device is being removed, rbd_dev->disk has
	 * been destroyed, so don't try to update its size
	 */
	if (!removing) {
		size = (sector_t)rbd_dev->mapping.size / SECTOR_SIZE;
		dout("setting size to %llu sectors", (unsigned long long)size);
		set_capacity(rbd_dev->disk, size);
		revalidate_disk(rbd_dev->disk);
	}
}

static int rbd_dev_refresh(struct rbd_device *rbd_dev)
static int rbd_dev_refresh(struct rbd_device *rbd_dev)
{
{
	u64 mapping_size;
	u64 mapping_size;
@@ -3347,12 +3375,7 @@ static int rbd_dev_refresh(struct rbd_device *rbd_dev)
	up_write(&rbd_dev->header_rwsem);
	up_write(&rbd_dev->header_rwsem);


	if (mapping_size != rbd_dev->mapping.size) {
	if (mapping_size != rbd_dev->mapping.size) {
		sector_t size;
		rbd_dev_update_size(rbd_dev);

		size = (sector_t)rbd_dev->mapping.size / SECTOR_SIZE;
		dout("setting size to %llu sectors", (unsigned long long)size);
		set_capacity(rbd_dev->disk, size);
		revalidate_disk(rbd_dev->disk);
	}
	}


	return ret;
	return ret;
@@ -4061,8 +4084,13 @@ static u64 rbd_v2_snap_id_by_name(struct rbd_device *rbd_dev, const char *name)


		snap_id = snapc->snaps[which];
		snap_id = snapc->snaps[which];
		snap_name = rbd_dev_v2_snap_name(rbd_dev, snap_id);
		snap_name = rbd_dev_v2_snap_name(rbd_dev, snap_id);
		if (IS_ERR(snap_name))
		if (IS_ERR(snap_name)) {
			/* ignore no-longer existing snapshots */
			if (PTR_ERR(snap_name) == -ENOENT)
				continue;
			else
				break;
				break;
		}
		found = !strcmp(name, snap_name);
		found = !strcmp(name, snap_name);
		kfree(snap_name);
		kfree(snap_name);
	}
	}
@@ -4141,8 +4169,8 @@ static int rbd_dev_spec_update(struct rbd_device *rbd_dev)
	/* Look up the snapshot name, and make a copy */
	/* Look up the snapshot name, and make a copy */


	snap_name = rbd_snap_name(rbd_dev, spec->snap_id);
	snap_name = rbd_snap_name(rbd_dev, spec->snap_id);
	if (!snap_name) {
	if (IS_ERR(snap_name)) {
		ret = -ENOMEM;
		ret = PTR_ERR(snap_name);
		goto out_err;
		goto out_err;
	}
	}


@@ -5163,10 +5191,23 @@ static ssize_t rbd_remove(struct bus_type *bus,
	if (ret < 0 || already)
	if (ret < 0 || already)
		return ret;
		return ret;


	rbd_bus_del_dev(rbd_dev);
	ret = rbd_dev_header_watch_sync(rbd_dev, false);
	ret = rbd_dev_header_watch_sync(rbd_dev, false);
	if (ret)
	if (ret)
		rbd_warn(rbd_dev, "failed to cancel watch event (%d)\n", ret);
		rbd_warn(rbd_dev, "failed to cancel watch event (%d)\n", ret);

	/*
	 * flush remaining watch callbacks - these must be complete
	 * before the osd_client is shutdown
	 */
	dout("%s: flushing notifies", __func__);
	ceph_osdc_flush_notifies(&rbd_dev->rbd_client->client->osdc);
	/*
	 * Don't free anything from rbd_dev->disk until after all
	 * notifies are completely processed. Otherwise
	 * rbd_bus_del_dev() will race with rbd_watch_cb(), resulting
	 * in a potential use after free of rbd_dev->disk or rbd_dev.
	 */
	rbd_bus_del_dev(rbd_dev);
	rbd_dev_image_release(rbd_dev);
	rbd_dev_image_release(rbd_dev);
	module_put(THIS_MODULE);
	module_put(THIS_MODULE);


+2 −1
Original line number Original line Diff line number Diff line
@@ -586,7 +586,8 @@ int __fscache_check_consistency(struct fscache_cookie *cookie)


	fscache_operation_init(op, NULL, NULL);
	fscache_operation_init(op, NULL, NULL);
	op->flags = FSCACHE_OP_MYTHREAD |
	op->flags = FSCACHE_OP_MYTHREAD |
		(1 << FSCACHE_OP_WAITING);
		(1 << FSCACHE_OP_WAITING) |
		(1 << FSCACHE_OP_UNUSE_COOKIE);


	spin_lock(&cookie->lock);
	spin_lock(&cookie->lock);


+2 −0
Original line number Original line Diff line number Diff line
@@ -335,6 +335,8 @@ extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc,
				  struct ceph_osd_request *req);
				  struct ceph_osd_request *req);
extern void ceph_osdc_sync(struct ceph_osd_client *osdc);
extern void ceph_osdc_sync(struct ceph_osd_client *osdc);


extern void ceph_osdc_flush_notifies(struct ceph_osd_client *osdc);

extern int ceph_osdc_readpages(struct ceph_osd_client *osdc,
extern int ceph_osdc_readpages(struct ceph_osd_client *osdc,
			       struct ceph_vino vino,
			       struct ceph_vino vino,
			       struct ceph_file_layout *layout,
			       struct ceph_file_layout *layout,
+11 −0
Original line number Original line Diff line number Diff line
@@ -2215,6 +2215,17 @@ void ceph_osdc_sync(struct ceph_osd_client *osdc)
}
}
EXPORT_SYMBOL(ceph_osdc_sync);
EXPORT_SYMBOL(ceph_osdc_sync);


/*
 * Call all pending notify callbacks - for use after a watch is
 * unregistered, to make sure no more callbacks for it will be invoked
 */
extern void ceph_osdc_flush_notifies(struct ceph_osd_client *osdc)
{
	flush_workqueue(osdc->notify_wq);
}
EXPORT_SYMBOL(ceph_osdc_flush_notifies);


/*
/*
 * init, shutdown
 * init, shutdown
 */
 */