drbd: fix error path during resize

In case the lower level device size changed, but some other internal
details of the resize did not work out, drbd_determine_dev_size() would
try to restore the previous settings, trusting
drbd_md_set_sector_offsets() to "do the right thing", but overlooked
that this internally may set the meta data base offset based on device size.

This could end up with incomplete on-disk meta data layout change, and
ultimately lead to data corruption (if the failure was not noticed or
ignored by the operator, and other things go wrong as well).

Just remember all meta data related offsets/sizes,
and on error restore them all.

Signed-off-by: Philipp Reisner <philipp.reisner@linbit.com>
Signed-off-by: Lars Ellenberg <lars.ellenberg@linbit.com>
Signed-off-by: Jens Axboe <axboe@fb.com>
This commit is contained in:
Lars Ellenberg 2015-06-08 14:48:38 +02:00 committed by Jens Axboe
parent 5f7c01249b
commit 8011e24909

View File

@ -891,12 +891,18 @@ void drbd_resume_io(struct drbd_device *device)
enum determine_dev_size enum determine_dev_size
drbd_determine_dev_size(struct drbd_device *device, enum dds_flags flags, struct resize_parms *rs) __must_hold(local) drbd_determine_dev_size(struct drbd_device *device, enum dds_flags flags, struct resize_parms *rs) __must_hold(local)
{ {
sector_t prev_first_sect, prev_size; /* previous meta location */ struct md_offsets_and_sizes {
sector_t la_size_sect, u_size; u64 last_agreed_sect;
u64 md_offset;
s32 al_offset;
s32 bm_offset;
u32 md_size_sect;
u32 al_stripes;
u32 al_stripe_size_4k;
} prev;
sector_t u_size, size;
struct drbd_md *md = &device->ldev->md; struct drbd_md *md = &device->ldev->md;
u32 prev_al_stripe_size_4k;
u32 prev_al_stripes;
sector_t size;
char ppb[10]; char ppb[10];
void *buffer; void *buffer;
@ -918,16 +924,17 @@ drbd_determine_dev_size(struct drbd_device *device, enum dds_flags flags, struct
return DS_ERROR; return DS_ERROR;
} }
prev_first_sect = drbd_md_first_sector(device->ldev); /* remember current offset and sizes */
prev_size = device->ldev->md.md_size_sect; prev.last_agreed_sect = md->la_size_sect;
la_size_sect = device->ldev->md.la_size_sect; prev.md_offset = md->md_offset;
prev.al_offset = md->al_offset;
prev.bm_offset = md->bm_offset;
prev.md_size_sect = md->md_size_sect;
prev.al_stripes = md->al_stripes;
prev.al_stripe_size_4k = md->al_stripe_size_4k;
if (rs) { if (rs) {
/* rs is non NULL if we should change the AL layout only */ /* rs is non NULL if we should change the AL layout only */
prev_al_stripes = md->al_stripes;
prev_al_stripe_size_4k = md->al_stripe_size_4k;
md->al_stripes = rs->al_stripes; md->al_stripes = rs->al_stripes;
md->al_stripe_size_4k = rs->al_stripe_size / 4; md->al_stripe_size_4k = rs->al_stripe_size / 4;
md->al_size_4k = (u64)rs->al_stripes * rs->al_stripe_size / 4; md->al_size_4k = (u64)rs->al_stripes * rs->al_stripe_size / 4;
@ -940,7 +947,7 @@ drbd_determine_dev_size(struct drbd_device *device, enum dds_flags flags, struct
rcu_read_unlock(); rcu_read_unlock();
size = drbd_new_dev_size(device, device->ldev, u_size, flags & DDSF_FORCED); size = drbd_new_dev_size(device, device->ldev, u_size, flags & DDSF_FORCED);
if (size < la_size_sect) { if (size < prev.last_agreed_sect) {
if (rs && u_size == 0) { if (rs && u_size == 0) {
/* Remove "rs &&" later. This check should always be active, but /* Remove "rs &&" later. This check should always be active, but
right now the receiver expects the permissive behavior */ right now the receiver expects the permissive behavior */
@ -961,30 +968,29 @@ drbd_determine_dev_size(struct drbd_device *device, enum dds_flags flags, struct
err = drbd_bm_resize(device, size, !(flags & DDSF_NO_RESYNC)); err = drbd_bm_resize(device, size, !(flags & DDSF_NO_RESYNC));
if (unlikely(err)) { if (unlikely(err)) {
/* currently there is only one error: ENOMEM! */ /* currently there is only one error: ENOMEM! */
size = drbd_bm_capacity(device)>>1; size = drbd_bm_capacity(device);
if (size == 0) { if (size == 0) {
drbd_err(device, "OUT OF MEMORY! " drbd_err(device, "OUT OF MEMORY! "
"Could not allocate bitmap!\n"); "Could not allocate bitmap!\n");
} else { } else {
drbd_err(device, "BM resizing failed. " drbd_err(device, "BM resizing failed. "
"Leaving size unchanged at size = %lu KB\n", "Leaving size unchanged\n");
(unsigned long)size);
} }
rv = DS_ERROR; rv = DS_ERROR;
} }
/* racy, see comments above. */ /* racy, see comments above. */
drbd_set_my_capacity(device, size); drbd_set_my_capacity(device, size);
device->ldev->md.la_size_sect = size; md->la_size_sect = size;
drbd_info(device, "size = %s (%llu KB)\n", ppsize(ppb, size>>1), drbd_info(device, "size = %s (%llu KB)\n", ppsize(ppb, size>>1),
(unsigned long long)size>>1); (unsigned long long)size>>1);
} }
if (rv <= DS_ERROR) if (rv <= DS_ERROR)
goto err_out; goto err_out;
la_size_changed = (la_size_sect != device->ldev->md.la_size_sect); la_size_changed = (prev.last_agreed_sect != md->la_size_sect);
md_moved = prev_first_sect != drbd_md_first_sector(device->ldev) md_moved = prev.md_offset != md->md_offset
|| prev_size != device->ldev->md.md_size_sect; || prev.md_size_sect != md->md_size_sect;
if (la_size_changed || md_moved || rs) { if (la_size_changed || md_moved || rs) {
u32 prev_flags; u32 prev_flags;
@ -1024,20 +1030,22 @@ drbd_determine_dev_size(struct drbd_device *device, enum dds_flags flags, struct
md->al_stripes, md->al_stripe_size_4k * 4); md->al_stripes, md->al_stripe_size_4k * 4);
} }
if (size > la_size_sect) if (size > prev.last_agreed_sect)
rv = la_size_sect ? DS_GREW : DS_GREW_FROM_ZERO; rv = prev.last_agreed_sect ? DS_GREW : DS_GREW_FROM_ZERO;
if (size < la_size_sect) if (size < prev.last_agreed_sect)
rv = DS_SHRUNK; rv = DS_SHRUNK;
if (0) { if (0) {
err_out: err_out:
if (rs) { /* restore previous offset and sizes */
md->al_stripes = prev_al_stripes; md->la_size_sect = prev.last_agreed_sect;
md->al_stripe_size_4k = prev_al_stripe_size_4k; md->md_offset = prev.md_offset;
md->al_size_4k = (u64)prev_al_stripes * prev_al_stripe_size_4k; md->al_offset = prev.al_offset;
md->bm_offset = prev.bm_offset;
drbd_md_set_sector_offsets(device, device->ldev); md->md_size_sect = prev.md_size_sect;
} md->al_stripes = prev.al_stripes;
md->al_stripe_size_4k = prev.al_stripe_size_4k;
md->al_size_4k = (u64)prev.al_stripes * prev.al_stripe_size_4k;
} }
lc_unlock(device->act_log); lc_unlock(device->act_log);
wake_up(&device->al_wait); wake_up(&device->al_wait);