git.ipfire.org Git - thirdparty/mdadm.git/blobdiff - Grow.c
Grow: Allow for component_size not being set for RAID0 arrays.
[thirdparty/mdadm.git] / Grow.c
diff --git a/Grow.c b/Grow.c
index 49831ad7ca16a4be7e65faf2390385b8033fbbb8..812c1da9e997c3c0f3dda704f98e55e7e5f8ecdf 100644 (file)
--- a/Grow.c
+++ b/Grow.c
@@ -893,6 +893,10 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
         * when assembling an array that is undergoing reshape.
         */
        int new_disks;
+       /* delta_parity records change in number of devices
+        * caused by level change
+        */
+       int delta_parity = 0;
 
        /* If a new level not explicitly given, we assume no-change */
        if (info->new_level == UnSet)
@@ -925,6 +929,10 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                 * raid0 with 1 disk
                 */
                if (info->new_level == 0) {
+                       if (info->delta_disks != UnSet &&
+                           info->delta_disks != 0)
+                               return "Cannot change number of disks "
+                                       "with RAID1->RAID0 conversion";
                        re->level = 0;
                        re->before.data_disks = 1;
                        re->after.data_disks = 1;
@@ -944,9 +952,17 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                }
                if (info->array.raid_disks == 2 &&
                    info->new_level == 5) {
+
                        re->level = 5;
                        re->before.data_disks = 1;
-                       re->after.data_disks = 1;
+                       if (info->delta_disks != UnSet &&
+                           info->delta_disks != 0)
+                               re->after.data_disks = 1 + info->delta_disks;
+                       else
+                               re->after.data_disks = 1;
+                       if (re->after.data_disks < 1)
+                               return "Number of disks too small for RAID5";
+
                        re->before.layout = ALGORITHM_LEFT_SYMMETRIC;
                        info->array.chunk_size = 65536;
                        break;
@@ -970,10 +986,10 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                        return "RAID10 can only be changed to RAID0";
                new_disks = (info->array.raid_disks
                             / (info->array.layout & 0xff));
-               if (info->delta_disks == UnSet) {
+               if (info->delta_disks == UnSet)
                        info->delta_disks = (new_disks
                                             - info->array.raid_disks);
-               }
+
                if (info->delta_disks != new_disks - info->array.raid_disks)
                        return "New number of raid-devices impossible for RAID10";
                if (info->new_chunk &&
@@ -1032,16 +1048,19 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                 * a raid4 style layout of the final level.
                 */
                switch (info->new_level) {
-               case 0:
                case 4:
+                       delta_parity = 1;
+               case 0:
                        re->level = 4;
                        re->before.layout = 0;
                        break;
                case 5:
+                       delta_parity = 1;
                        re->level = 5;
                        re->before.layout = ALGORITHM_PARITY_N;
                        break;
                case 6:
+                       delta_parity = 2;
                        re->level = 6;
                        re->before.layout = ALGORITHM_PARITY_N;
                        break;
@@ -1057,6 +1076,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
        case 5:
                switch (info->new_level) {
                case 0:
+                       delta_parity = -1;
                case 4:
                        re->level = info->array.level;
                        re->before.data_disks = info->array.raid_disks - 1;
@@ -1068,6 +1088,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                        re->before.layout = info->array.layout;
                        break;
                case 6:
+                       delta_parity = 1;
                        re->level = 6;
                        re->before.data_disks = info->array.raid_disks - 1;
                        switch (info->array.layout) {
@@ -1096,6 +1117,10 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                case 1:
                        if (info->array.raid_disks != 2)
                                return "Can only convert a 2-device array to RAID1";
+                       if (info->delta_disks != UnSet &&
+                           info->delta_disks != 0)
+                               return "Cannot set raid_disk when "
+                                       "converting RAID5->RAID1";
                        re->level = 1;
                        break;
                default:
@@ -1106,6 +1131,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                switch (info->new_level) {
                case 4:
                case 5:
+                       delta_parity = -1;
                case 6:
                        re->level = 6;
                        re->before.data_disks = info->array.raid_disks - 2;
@@ -1131,11 +1157,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                 */
                if (re->level != 4 && re->level != 5)
                        return "Cannot covert to RAID0 from this level";
-               if (info->delta_disks == UnSet)
-                       re->after.data_disks = re->before.data_disks;
-               else
-                       re->after.data_disks =
-                               info->array.raid_disks + info->delta_disks;
+
                switch (re->level) {
                case 4:
                        re->after.layout = 0 ; break;
@@ -1148,11 +1170,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                /* We can only get to RAID4 from RAID5 */
                if (re->level != 4 && re->level != 5)
                        return "Cannot convert to RAID4 from this level";
-               if (info->delta_disks == UnSet)
-                       re->after.data_disks = re->before.data_disks;
-               else
-                       re->after.data_disks =
-                               re->before.data_disks + info->delta_disks;
+
                switch (re->level) {
                case 4:
                        re->after.layout = 0 ; break;
@@ -1165,14 +1183,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                /* We get to RAID5 for RAID5 or RAID6 */
                if (re->level != 5 && re->level != 6)
                        return "Cannot convert to RAID5 from this level";
-               if (info->delta_disks == UnSet)
-                       re->after.data_disks = re->before.data_disks;
-               else if (re->level == 5)
-                       re->after.data_disks =
-                               re->before.data_disks + info->delta_disks;
-               else
-                       re->after.data_disks =
-                               info->array.raid_disks + info->delta_disks - 1;
+
                switch (re->level) {
                case 5:
                        if (info->new_layout == UnSet)
@@ -1205,11 +1216,6 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                /* We must already be at level 6 */
                if (re->level != 6)
                        return "Impossible level change";
-               if (info->delta_disks == UnSet)
-                       re->after.data_disks = re->before.data_disks;
-               else
-                       re->after.data_disks = (info->array.raid_disks +
-                                               info->delta_disks) - 2;
                if (info->new_layout == UnSet)
                        re->after.layout = info->array.layout;
                else
@@ -1218,6 +1224,12 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
        default:
                return "Impossible level change requested";
        }
+       if (info->delta_disks == UnSet)
+               info->delta_disks = delta_parity;
+
+       re->after.data_disks = (re->before.data_disks
+                               + info->delta_disks
+                               - delta_parity);
        switch (re->level) {
        case 6: re->parity = 2; break;
        case 4:
@@ -1263,12 +1275,12 @@ static int reshape_array(char *container, int fd, char *devname,
                         struct supertype *st, struct mdinfo *info,
                         int force, char *backup_file, int quiet, int forked,
                         int restart);
-static int reshape_container(char *container, int cfd, char *devname,
+static int reshape_container(char *container, char *devname,
                             struct supertype *st, 
                             struct mdinfo *info,
                             int force,
                             char *backup_file,
-                            int quiet);
+                            int quiet, int restart);
 
 int Grow_reshape(char *devname, int fd, int quiet, char *backup_file,
                 long long size,
@@ -1494,7 +1506,10 @@ int Grow_reshape(char *devname, int fd, int quiet, char *backup_file,
        info.component_size = size*2;
        info.new_level = level;
        info.new_chunk = chunksize * 1024;
-       if (raid_disks)
+       if (info.array.level == LEVEL_CONTAINER) {
+               info.delta_disks = UnSet;
+               info.array.raid_disks = raid_disks;
+       } else if (raid_disks)
                info.delta_disks = raid_disks - info.array.raid_disks;
        else
                info.delta_disks = UnSet;
@@ -1570,8 +1585,8 @@ int Grow_reshape(char *devname, int fd, int quiet, char *backup_file,
                 * number of devices (On-Line Capacity Expansion) must be
                 * performed at the level of the container
                 */
-               rv = reshape_container(container, fd, devname, st, &info,
-                                      force, backup_file, quiet);
+               rv = reshape_container(container, devname, st, &info,
+                                      force, backup_file, quiet, 0);
                frozen = 0;
        } else {
                /* get spare devices from external metadata
@@ -1634,13 +1649,38 @@ static int reshape_array(char *container, int fd, char *devname,
        int done;
        struct mdinfo *sra = NULL;
 
-       msg = analyse_change(info, &reshape);
+       /* when reshaping a RAID0, the component_size might be zero.
+        * So try to fix that up.
+        */
+       if (ioctl(fd, GET_ARRAY_INFO, &array) != 0) {
+               dprintf("Cannot get array information.\n");
+               goto release;
+       }
+       if (array.level == 0 && info->component_size == 0) {
+               get_dev_size(fd, NULL, &array_size);
+               info->component_size = array_size / array.raid_disks;
+       }
+
+       if (info->reshape_active) {
+               int new_level = info->new_level;
+               info->new_level = UnSet;
+               msg = analyse_change(info, &reshape);
+               info->new_level = new_level;
+               if (!restart)
+                       /* Make sure the array isn't read-only */
+                       ioctl(fd, RESTART_ARRAY_RW, 0);
+       } else
+               msg = analyse_change(info, &reshape);
        if (msg) {
                fprintf(stderr, Name ": %s\n", msg);
                goto release;
        }
-       if (ioctl(fd, GET_ARRAY_INFO, &array) != 0) {
-               dprintf("Canot get array information.\n");
+       if (restart &&
+           (reshape.level != info->array.level ||
+            reshape.before.layout != info->array.layout ||
+            reshape.before.data_disks + reshape.parity != info->array.raid_disks)) {
+               fprintf(stderr, Name ": reshape info is not in native format -"
+                       " cannot continue.\n");
                goto release;
        }
 
@@ -1656,6 +1696,7 @@ static int reshape_array(char *container, int fd, char *devname,
         * freeze_array and freeze_container.
         */
        sysfs_freeze_array(info);
+       /* Check we have enough spares to not be degraded */
        spares_needed = max(reshape.before.data_disks,
                            reshape.after.data_disks)
                + reshape.parity - array.raid_disks;
@@ -1672,8 +1713,22 @@ static int reshape_array(char *container, int fd, char *devname,
                        info->array.spare_disks);
                goto release;
        }
+       /* Check we have enough spares to not fail */
+       spares_needed = max(reshape.before.data_disks,
+                           reshape.after.data_disks)
+               - array.raid_disks;
+       if ((info->new_level > 1 || info->new_level == 0) &&
+           spares_needed > info->array.spare_disks) {
+               fprintf(stderr,
+                       Name ": Need %d spare%s to create working array,"
+                       " and only have %d.\n",
+                       spares_needed,
+                       spares_needed == 1 ? "" : "s", 
+                       info->array.spare_disks);
+               goto release;
+       }
 
-       if (reshape.level != info->array.level) {
+       if (reshape.level != array.level) {
                char *c = map_num(pers, reshape.level);
                int err;
                if (c == NULL)
@@ -1693,7 +1748,7 @@ static int reshape_array(char *container, int fd, char *devname,
                if (!quiet)
                        fprintf(stderr, Name ": level of %s changed to %s\n",
                                devname, c);    
-               orig_level = info->array.level;
+               orig_level = array.level;
                sysfs_freeze_array(info);
 
                if (reshape.level > 0 && st->ss->external) {
@@ -1735,7 +1790,7 @@ static int reshape_array(char *container, int fd, char *devname,
                 */
                /* read current array info */
                if (ioctl(fd, GET_ARRAY_INFO, &array) != 0) {
-                       dprintf("Canot get array information.\n");
+                       dprintf("Cannot get array information.\n");
                        goto release;
                }
                /* compare current array info with new values and if
@@ -1920,7 +1975,7 @@ started:
 
        sra->new_chunk = info->new_chunk;
 
-       if (info->reshape_active)
+       if (restart)
                sra->reshape_progress = info->reshape_progress;
        else {
                sra->reshape_progress = 0;
@@ -1936,7 +1991,7 @@ started:
                /* use SET_ARRAY_INFO but only if reshape hasn't started */
                ioctl(fd, GET_ARRAY_INFO, &array);
                array.raid_disks = reshape.after.data_disks + reshape.parity;
-               if (!info->reshape_active &&
+               if (!restart &&
                    ioctl(fd, SET_ARRAY_INFO, &array) != 0) {
                        int err = errno;
 
@@ -1952,17 +2007,9 @@ started:
 
                        goto release;
                }
-       } else if (info->reshape_active && !st->ss->external) {
-               /* We don't need to set anything here for internal
-                * metadata, and for kernels before 2.6.38 we can
-                * fail if we try.
-                */
-       } else {
+       } else if (!restart) {
                /* set them all just in case some old 'new_*' value
                 * persists from some earlier problem.
-                * We even set them when restarting in the middle.  They will
-                * already be set in that case so this will be a no-op,
-                * but it is hard to tell the difference.
                 */
                int err = 0;
                if (sysfs_set_num(sra, NULL, "chunk_size", info->new_chunk) < 0)
@@ -1987,9 +2034,11 @@ started:
                }
        }
 
-       err = start_reshape(sra, (info->reshape_active && !st->ss->external));
+       err = start_reshape(sra, restart);
        if (err) {
-               fprintf(stderr, Name ": Cannot start reshape for %s\n",
+               fprintf(stderr, 
+                       Name ": Cannot %s reshape for %s\n",
+                       restart ? "continue" : "start",
                        devname);
                goto release;
        }
@@ -2126,19 +2175,20 @@ release:
        return 1;
 }
 
-int reshape_container(char *container, int cfd, char *devname,
+int reshape_container(char *container, char *devname,
                      struct supertype *st, 
                      struct mdinfo *info,
                      int force,
                      char *backup_file,
-                     int quiet)
+                     int quiet, int restart)
 {
        struct mdinfo *cc = NULL;
 
        /* component_size is not meaningful for a container,
         * so pass '-1' meaning 'no change'
         */
-       if (reshape_super(st, -1, info->new_level,
+       if (!restart &&
+           reshape_super(st, -1, info->new_level,
                          info->new_layout, info->new_chunk,
                          info->array.raid_disks, info->delta_disks,
                          backup_file, devname, quiet)) {
@@ -2171,6 +2221,10 @@ int reshape_container(char *container, int cfd, char *devname,
                 * reshape it.  reshape_array() will re-read the metadata
                 * so the next time through a different array should be
                 * ready for reshape.
+                * It is possible that the 'different' array will not
+                * be assembled yet.  In that case we simply exit.
+                * When it is assembled, the mdadm which assembles it
+                * will take over the reshape.
                 */
                struct mdinfo *content;
                int rv;
@@ -2210,8 +2264,9 @@ int reshape_container(char *container, int cfd, char *devname,
 
                rv = reshape_array(container, fd, adev, st,
                                   content, force,
-                                  backup_file, quiet, 1, 0);
+                                  backup_file, quiet, 1, restart);
                close(fd);
+               restart = 0;
                if (rv)
                        break;
        }
@@ -2293,8 +2348,8 @@ int progress_reshape(struct mdinfo *info, struct reshape *reshape,
         *   1 if more data from backup_point - but only as far as suspend_point,
         *     should be backed up
         *   0 if things are progressing smoothly
-        *  -1 if the reshape is finished, either because it is all done,
-        *     or due to an error.
+        *  -1 if the reshape is finished because it is all done,
+        *  -2 if the reshape is finished due to an error.
         */
 
        int advancing = (reshape->after.data_disks
@@ -3315,10 +3370,34 @@ int Grow_restart(struct supertype *st, struct mdinfo *info, int *fdlist, int cnt
 int Grow_continue(int mdfd, struct supertype *st, struct mdinfo *info,
                  char *backup_file)
 {
-       int err = sysfs_set_str(info, NULL, "array_state", "readonly");
+       char buf[40];
+       char *container = NULL;
+       int err;
+
+       err = sysfs_set_str(info, NULL, "array_state", "readonly");
        if (err)
                return err;
-       return reshape_array(NULL, mdfd, "array", st, info, 1, backup_file, 0, 0, 1);
-}
+       if (st->ss->external) {
+               fmt_devname(buf, st->container_dev);
+               container = buf;
+               freeze(st);
 
+               if (!mdmon_running(st->container_dev))
+                       start_mdmon(st->container_dev);
+               ping_monitor(devnum2devname(st->container_dev));
 
+
+               if (info->reshape_active == 2) {
+                       int cfd = open_dev(st->container_dev);
+                       if (cfd < 0)
+                               return 1;
+                       st->ss->load_container(st, cfd, container);
+                       close(cfd);
+                       return reshape_container(container, NULL,
+                                                st, info, 0, backup_file,
+                                                0, 1);
+               }
+       }
+       return reshape_array(container, mdfd, "array", st, info, 1,
+                            backup_file, 0, 0, 1);
+}