sourceware.org Git - lvm2.git/commitdiff
Finish fix for bug 607347: failing both redundant mirror log legs...
author: Jonathan Earl Brassow <jbrassow@redhat.com>
Fri, 9 Jul 2010 15:08:12 +0000 (15:08 +0000)
committer: Jonathan Earl Brassow <jbrassow@redhat.com>
Fri, 9 Jul 2010 15:08:12 +0000 (15:08 +0000)
A previous check-in added logic to handle the case where both images
of a mirrored log failed.  It solved the problem by simply removing
the log entirely - leaving the parent mirror with a 'core' log.  This
worked for most cases.  However, if there was a small delay between
the failures of the two mirrored log devices, the mirror would hang,
LVM would hang, and no additional LVM commands could be issued.

When the first leg of the log fails, it signals the need for repair.
Before 'lvconvert --repair' is run by dmeventd, the second leg fails.
'lvconvert' would see both devices as failed and try to remove the
log entirely.  When it came time to suspend the parent mirror to
update the configuration, the suspend would hang because it couldn't
get any I/O through the mirrored log, which was plugged waiting for
corrective action.  The solution is to replace the log with an error
target to clear any pending writes before removing it.  This allows
the parent mirror to suspend and make the proper changes.

WHATS_NEW
lib/metadata/mirror.c

index 2a9fe62e8472d9ee552dfe925d922080fadc6974..8bbe3a1e6e3802ddbed9d1ac180667b62938446a 100644 (file)
--- a/WHATS_NEW
+++ b/WHATS_NEW
@@ -1,5 +1,6 @@
 Version 2.02.71 -
 ===============================
+  Fix possible hang when all mirror images of a mirrored log fail.
   Do not log backtrace in valid _lv_resume() code path.
   Cleanup help strings in configure.in.
   Prompt if metadataignore with vgextend or pvchange would adjust vg_mda_copies.
index 80436f93f46e5b9c3aa28c390040eca7a8c5bbec..d84b0766eab5b6b4600a49e0ad3102aefd472e14 100644 (file)
--- a/lib/metadata/mirror.c
+++ b/lib/metadata/mirror.c
@@ -864,9 +864,72 @@ static int _remove_mirror_images(struct logical_volume *lv,
                lv->status &= ~MIRROR_NOTSYNCED;
                if (!replace_lv_with_error_segment(lv))
                        return_0;
-       } else if (remove_log)
+       } else if (remove_log) {
                detached_log_lv = detach_mirror_log(mirrored_seg);
 
+               /*
+                * The log may be removed due to repair.  If the log
+                * happens to be a mirrored log, then there is a special
+                * case we need to consider.  One of the images of a
+                * mirrored log can fail followed shortly afterwards by
+                * a failure of the second.  This means that the top-level
+                * mirror is waiting for writes to the log to finish, but
+                * they never will unless the mirrored log can be repaired
+                * or replaced with an error target.  Since both the devices
+                * have failed, we must replace with error target - it is
+                * the only way to release the pending writes.
+                */
+               if (lv_is_mirrored(detached_log_lv) &&
+                   (detached_log_lv->status & PARTIAL_LV)) {
+                       struct lv_segment *seg = first_seg(detached_log_lv);
+
+                       log_very_verbose("%s being removed due to failures",
+                                        detached_log_lv->name);
+
+                       /*
+                        * We are going to replace the mirror with an
+                        * error segment, but before we do, we must remember
+                        * all of the LVs that must be deleted later (i.e.
+                        * the sub-lv's)
+                        */
+                       for (m = 0; m < seg->area_count; m++) {
+                               seg_lv(seg, m)->status &= ~MIRROR_IMAGE;
+                               lv_set_visible(seg_lv(seg, m));
+                               if (!(lvl = dm_pool_alloc(lv->vg->cmd->mem,
+                                                         sizeof(*lvl))))
+                                       return 0;
+                               lvl->lv = seg_lv(seg, m);
+                               dm_list_add(&tmp_orphan_lvs, &lvl->list);
+                       }
+
+                       if (!replace_lv_with_error_segment(detached_log_lv)) {
+                               log_error("Failed error target substitution for %s",
+                                         detached_log_lv->name);
+                               return_0;
+                       }
+
+                       if (!vg_write(detached_log_lv->vg)) {
+                               log_error("intermediate VG write fail.");
+                               return 0;
+                       }
+
+                       if (!suspend_lv(detached_log_lv->vg->cmd,
+                                       detached_log_lv)) {
+                               log_error("Failed to suspend %s",
+                                         detached_log_lv->name);
+                               vg_revert(detached_log_lv->vg);
+                               return 0;
+                       }
+
+                       if (!vg_commit(detached_log_lv->vg))
+                               return_0;
+
+                       if (!resume_lv(detached_log_lv->vg->cmd,
+                                      detached_log_lv))
+                                       return 0;
+               }
+       }
+
        /*
         * To successfully remove these unwanted LVs we need to
         * remove the LVs from the mirror set, commit that metadata
This page took 0.043935 seconds and 5 git commands to generate.