git.ipfire.org Git - thirdparty/mdadm.git/blobdiff - Grow.c
imsm: do not publish OROM/EFI unsupported arrays
[thirdparty/mdadm.git] / Grow.c
diff --git a/Grow.c b/Grow.c
index 402da5eea772face397b34d992e2dfaa06938e2a..d596c2de7a7df6bd9ebe0eafdb3e55c365f66f9b 100644 (file)
--- a/Grow.c
+++ b/Grow.c
@@ -565,7 +565,8 @@ static void wait_reshape(struct mdinfo *sra)
 
 static int reshape_super(struct supertype *st, long long size, int level,
                         int layout, int chunksize, int raid_disks,
-                        char *backup_file, char *dev, int verbose)
+                        int delta_disks, char *backup_file, char *dev,
+                        int verbose)
 {
        /* nothing extra to check in the native case */
        if (!st->ss->external)
@@ -578,7 +579,8 @@ static int reshape_super(struct supertype *st, long long size, int level,
        }
 
        return st->ss->reshape_super(st, size, level, layout, chunksize,
-                                    raid_disks, backup_file, dev, verbose);
+                                    raid_disks, delta_disks, backup_file, dev,
+                                    verbose);
 }
 
 static void sync_metadata(struct supertype *st)
@@ -891,6 +893,10 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
         * when assembling an array that is undergoing reshape.
         */
        int new_disks;
+       /* delta_parity records change in number of devices
+        * caused by level change
+        */
+       int delta_parity = 0;
 
        /* If a new level not explicitly given, we assume no-change */
        if (info->new_level == UnSet)
@@ -923,6 +929,10 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                 * raid0 with 1 disk
                 */
                if (info->new_level == 0) {
+                       if (info->delta_disks != UnSet &&
+                           info->delta_disks != 0)
+                               return "Cannot change number of disks "
+                                       "with RAID1->RAID0 conversion";
                        re->level = 0;
                        re->before.data_disks = 1;
                        re->after.data_disks = 1;
@@ -942,9 +952,17 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                }
                if (info->array.raid_disks == 2 &&
                    info->new_level == 5) {
+
                        re->level = 5;
                        re->before.data_disks = 1;
-                       re->after.data_disks = 1;
+                       if (info->delta_disks != UnSet &&
+                           info->delta_disks != 0)
+                               re->after.data_disks = 1 + info->delta_disks;
+                       else
+                               re->after.data_disks = 1;
+                       if (re->after.data_disks < 1)
+                               return "Number of disks too small for RAID5";
+
                        re->before.layout = ALGORITHM_LEFT_SYMMETRIC;
                        info->array.chunk_size = 65536;
                        break;
@@ -968,10 +986,10 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                        return "RAID10 can only be changed to RAID0";
                new_disks = (info->array.raid_disks
                             / (info->array.layout & 0xff));
-               if (info->delta_disks == UnSet) {
+               if (info->delta_disks == UnSet)
                        info->delta_disks = (new_disks
                                             - info->array.raid_disks);
-               }
+
                if (info->delta_disks != new_disks - info->array.raid_disks)
                        return "New number of raid-devices impossible for RAID10";
                if (info->new_chunk &&
@@ -1030,16 +1048,19 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                 * a raid4 style layout of the final level.
                 */
                switch (info->new_level) {
-               case 0:
                case 4:
+                       delta_parity = 1;
+               case 0:
                        re->level = 4;
                        re->before.layout = 0;
                        break;
                case 5:
+                       delta_parity = 1;
                        re->level = 5;
                        re->before.layout = ALGORITHM_PARITY_N;
                        break;
                case 6:
+                       delta_parity = 2;
                        re->level = 6;
                        re->before.layout = ALGORITHM_PARITY_N;
                        break;
@@ -1054,6 +1075,8 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                info->array.layout = ALGORITHM_PARITY_N;
        case 5:
                switch (info->new_level) {
+               case 0:
+                       delta_parity = -1;
                case 4:
                        re->level = info->array.level;
                        re->before.data_disks = info->array.raid_disks - 1;
@@ -1065,6 +1088,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                        re->before.layout = info->array.layout;
                        break;
                case 6:
+                       delta_parity = 1;
                        re->level = 6;
                        re->before.data_disks = info->array.raid_disks - 1;
                        switch (info->array.layout) {
@@ -1093,6 +1117,10 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                case 1:
                        if (info->array.raid_disks != 2)
                                return "Can only convert a 2-device array to RAID1";
+                       if (info->delta_disks != UnSet &&
+                           info->delta_disks != 0)
+                               return "Cannot set raid_disk when "
+                                       "converting RAID5->RAID1";
                        re->level = 1;
                        break;
                default:
@@ -1103,6 +1131,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                switch (info->new_level) {
                case 4:
                case 5:
+                       delta_parity = -1;
                case 6:
                        re->level = 6;
                        re->before.data_disks = info->array.raid_disks - 2;
@@ -1128,11 +1157,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                 */
                if (re->level != 4 && re->level != 5)
                        return "Cannot covert to RAID0 from this level";
-               if (info->delta_disks == UnSet)
-                       re->after.data_disks = re->before.data_disks;
-               else
-                       re->after.data_disks =
-                               info->array.raid_disks + info->delta_disks;
+
                switch (re->level) {
                case 4:
                        re->after.layout = 0 ; break;
@@ -1145,11 +1170,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                /* We can only get to RAID4 from RAID5 */
                if (re->level != 4 && re->level != 5)
                        return "Cannot convert to RAID4 from this level";
-               if (info->delta_disks == UnSet)
-                       re->after.data_disks = re->before.data_disks;
-               else
-                       re->after.data_disks =
-                               re->before.data_disks + info->delta_disks;
+
                switch (re->level) {
                case 4:
                        re->after.layout = 0 ; break;
@@ -1162,14 +1183,7 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                /* We get to RAID5 for RAID5 or RAID6 */
                if (re->level != 5 && re->level != 6)
                        return "Cannot convert to RAID5 from this level";
-               if (info->delta_disks == UnSet)
-                       re->after.data_disks = re->before.data_disks;
-               else if (re->level == 5)
-                       re->after.data_disks =
-                               re->before.data_disks + info->delta_disks;
-               else
-                       re->after.data_disks =
-                               info->array.raid_disks + info->delta_disks - 1;
+
                switch (re->level) {
                case 5:
                        if (info->new_layout == UnSet)
@@ -1202,11 +1216,6 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
                /* We must already be at level 6 */
                if (re->level != 6)
                        return "Impossible level change";
-               if (info->delta_disks == UnSet)
-                       re->after.data_disks = re->before.data_disks;
-               else
-                       re->after.data_disks = (info->array.raid_disks +
-                                               info->delta_disks) - 2;
                if (info->new_layout == UnSet)
                        re->after.layout = info->array.layout;
                else
@@ -1215,6 +1224,12 @@ char *analyse_change(struct mdinfo *info, struct reshape *re)
        default:
                return "Impossible level change requested";
        }
+       if (info->delta_disks == UnSet)
+               info->delta_disks = delta_parity;
+
+       re->after.data_disks = (re->before.data_disks
+                               + info->delta_disks
+                               - delta_parity);
        switch (re->level) {
        case 6: re->parity = 2; break;
        case 4:
@@ -1260,12 +1275,12 @@ static int reshape_array(char *container, int fd, char *devname,
                         struct supertype *st, struct mdinfo *info,
                         int force, char *backup_file, int quiet, int forked,
                         int restart);
-static int reshape_container(char *container, int cfd, char *devname,
+static int reshape_container(char *container, char *devname,
                             struct supertype *st, 
                             struct mdinfo *info,
                             int force,
                             char *backup_file,
-                            int quiet);
+                            int quiet, int restart);
 
 int Grow_reshape(char *devname, int fd, int quiet, char *backup_file,
                 long long size,
@@ -1416,7 +1431,8 @@ int Grow_reshape(char *devname, int fd, int quiet, char *backup_file,
        if (size >= 0 && (size == 0 || size != array.size)) {
                long long orig_size = array.size;
 
-               if (reshape_super(st, size, UnSet, UnSet, 0, 0, NULL, devname, !quiet)) {
+               if (reshape_super(st, size, UnSet, UnSet, 0, 0, UnSet, NULL,
+                                 devname, !quiet)) {
                        rv = 1;
                        goto release;
                }
@@ -1438,7 +1454,7 @@ int Grow_reshape(char *devname, int fd, int quiet, char *backup_file,
 
                        /* restore metadata */
                        if (reshape_super(st, orig_size, UnSet, UnSet, 0, 0,
-                                         NULL, devname, !quiet) == 0)
+                                         UnSet, NULL, devname, !quiet) == 0)
                                sync_metadata(st);
                        fprintf(stderr, Name ": Cannot set device size for %s: %s\n",
                                devname, strerror(err));
@@ -1490,7 +1506,10 @@ int Grow_reshape(char *devname, int fd, int quiet, char *backup_file,
        info.component_size = size*2;
        info.new_level = level;
        info.new_chunk = chunksize * 1024;
-       if (raid_disks)
+       if (info.array.level == LEVEL_CONTAINER) {
+               info.delta_disks = UnSet;
+               info.array.raid_disks = raid_disks;
+       } else if (raid_disks)
                info.delta_disks = raid_disks - info.array.raid_disks;
        else
                info.delta_disks = UnSet;
@@ -1566,16 +1585,29 @@ int Grow_reshape(char *devname, int fd, int quiet, char *backup_file,
                 * number of devices (On-Line Capacity Expansion) must be
                 * performed at the level of the container
                 */
-               rv = reshape_container(container, fd, devname, st, &info,
-                                      force, backup_file, quiet);
+               rv = reshape_container(container, devname, st, &info,
+                                      force, backup_file, quiet, 0);
                frozen = 0;
        } else {
+               /* get spare devices from external metadata
+                */
+               if (st->ss->external) {
+                       struct mdinfo *info2;
+
+                       info2 = st->ss->container_content(st, subarray);
+                       if (info2) {
+                               info.array.spare_disks =
+                                       info2->array.spare_disks;
+                               sysfs_free(info2);
+                       }
+               }
+
                /* Impose these changes on a single array.  First
                 * check that the metadata is OK with the change. */
 
                if (reshape_super(st, info.component_size, info.new_level,
                                  info.new_layout, info.new_chunk,
-                                 info.array.raid_disks + info.delta_disks,
+                                 info.array.raid_disks, info.delta_disks,
                                  backup_file, devname, quiet)) {
                        rv = 1;
                        goto release;
@@ -1617,13 +1649,30 @@ static int reshape_array(char *container, int fd, char *devname,
        int done;
        struct mdinfo *sra = NULL;
 
-       msg = analyse_change(info, &reshape);
+       if (info->reshape_active) {
+               int new_level = info->new_level;
+               info->new_level = UnSet;
+               msg = analyse_change(info, &reshape);
+               info->new_level = new_level;
+               if (!restart)
+                       /* Make sure the array isn't read-only */
+                       ioctl(fd, RESTART_ARRAY_RW, 0);
+       } else
+               msg = analyse_change(info, &reshape);
        if (msg) {
                fprintf(stderr, Name ": %s\n", msg);
                goto release;
        }
+       if (restart &&
+           (reshape.level != info->array.level ||
+            reshape.before.layout != info->array.layout ||
+            reshape.before.data_disks + reshape.parity != info->array.raid_disks)) {
+               fprintf(stderr, Name ": reshape info is not in native format -"
+                       " cannot continue.\n");
+               goto release;
+       }
        if (ioctl(fd, GET_ARRAY_INFO, &array) != 0) {
-               dprintf("Canot get array information.\n");
+               dprintf("Cannot get array information.\n");
                goto release;
        }
 
@@ -1639,6 +1688,7 @@ static int reshape_array(char *container, int fd, char *devname,
         * freeze_array and freeze_container.
         */
        sysfs_freeze_array(info);
+       /* Check we have enough spares to not be degraded */
        spares_needed = max(reshape.before.data_disks,
                            reshape.after.data_disks)
                + reshape.parity - array.raid_disks;
@@ -1655,8 +1705,22 @@ static int reshape_array(char *container, int fd, char *devname,
                        info->array.spare_disks);
                goto release;
        }
+       /* Check we have enough spares to not fail */
+       spares_needed = max(reshape.before.data_disks,
+                           reshape.after.data_disks)
+               - array.raid_disks;
+       if ((info->new_level > 1 || info->new_level == 0) &&
+           spares_needed > info->array.spare_disks) {
+               fprintf(stderr,
+                       Name ": Need %d spare%s to create working array,"
+                       " and only have %d.\n",
+                       spares_needed,
+                       spares_needed == 1 ? "" : "s", 
+                       info->array.spare_disks);
+               goto release;
+       }
 
-       if (reshape.level != info->array.level) {
+       if (reshape.level != array.level) {
                char *c = map_num(pers, reshape.level);
                int err;
                if (c == NULL)
@@ -1676,7 +1740,7 @@ static int reshape_array(char *container, int fd, char *devname,
                if (!quiet)
                        fprintf(stderr, Name ": level of %s changed to %s\n",
                                devname, c);    
-               orig_level = info->array.level;
+               orig_level = array.level;
                sysfs_freeze_array(info);
 
                if (reshape.level > 0 && st->ss->external) {
@@ -1718,7 +1782,7 @@ static int reshape_array(char *container, int fd, char *devname,
                 */
                /* read current array info */
                if (ioctl(fd, GET_ARRAY_INFO, &array) != 0) {
-                       dprintf("Canot get array information.\n");
+                       dprintf("Cannot get array information.\n");
                        goto release;
                }
                /* compare current array info with new values and if
@@ -1903,7 +1967,7 @@ started:
 
        sra->new_chunk = info->new_chunk;
 
-       if (info->reshape_active)
+       if (restart)
                sra->reshape_progress = info->reshape_progress;
        else {
                sra->reshape_progress = 0;
@@ -1919,7 +1983,7 @@ started:
                /* use SET_ARRAY_INFO but only if reshape hasn't started */
                ioctl(fd, GET_ARRAY_INFO, &array);
                array.raid_disks = reshape.after.data_disks + reshape.parity;
-               if (!info->reshape_active &&
+               if (!restart &&
                    ioctl(fd, SET_ARRAY_INFO, &array) != 0) {
                        int err = errno;
 
@@ -1935,17 +1999,9 @@ started:
 
                        goto release;
                }
-       } else if (info->reshape_active && !st->ss->external) {
-               /* We don't need to set anything here for internal
-                * metadata, and for kernels before 2.6.38 we can
-                * fail if we try.
-                */
-       } else {
+       } else if (!restart) {
                /* set them all just in case some old 'new_*' value
                 * persists from some earlier problem.
-                * We even set them when restarting in the middle.  They will
-                * already be set in that case so this will be a no-op,
-                * but it is hard to tell the difference.
                 */
                int err = 0;
                if (sysfs_set_num(sra, NULL, "chunk_size", info->new_chunk) < 0)
@@ -1970,9 +2026,11 @@ started:
                }
        }
 
-       err = start_reshape(sra, (info->reshape_active && !st->ss->external));
+       err = start_reshape(sra, restart);
        if (err) {
-               fprintf(stderr, Name ": Cannot start reshape for %s\n",
+               fprintf(stderr, 
+                       Name ": Cannot %s reshape for %s\n",
+                       restart ? "continue" : "start",
                        devname);
                goto release;
        }
@@ -2109,21 +2167,22 @@ release:
        return 1;
 }
 
-int reshape_container(char *container, int cfd, char *devname,
+int reshape_container(char *container, char *devname,
                      struct supertype *st, 
                      struct mdinfo *info,
                      int force,
                      char *backup_file,
-                     int quiet)
+                     int quiet, int restart)
 {
        struct mdinfo *cc = NULL;
 
        /* component_size is not meaningful for a container,
         * so pass '-1' meaning 'no change'
         */
-       if (reshape_super(st, -1, info->new_level,
+       if (!restart &&
+           reshape_super(st, -1, info->new_level,
                          info->new_layout, info->new_chunk,
-                         info->array.raid_disks + info->delta_disks,
+                         info->array.raid_disks, info->delta_disks,
                          backup_file, devname, quiet)) {
                unfreeze(st);
                return 1;
@@ -2154,6 +2213,10 @@ int reshape_container(char *container, int cfd, char *devname,
                 * reshape it.  reshape_array() will re-read the metadata
                 * so the next time through a different array should be
                 * ready for reshape.
+                * It is possible that the 'different' array will not
+                * be assembled yet.  In that case we simply exit.
+                * When it is assembled, the mdadm which assembles it
+                * will take over the reshape.
                 */
                struct mdinfo *content;
                int rv;
@@ -2193,8 +2256,9 @@ int reshape_container(char *container, int cfd, char *devname,
 
                rv = reshape_array(container, fd, adev, st,
                                   content, force,
-                                  backup_file, quiet, 1, 0);
+                                  backup_file, quiet, 1, restart);
                close(fd);
+               restart = 0;
                if (rv)
                        break;
        }
@@ -2276,8 +2340,8 @@ int progress_reshape(struct mdinfo *info, struct reshape *reshape,
         *   1 if more data from backup_point - but only as far as suspend_point,
         *     should be backed up
         *   0 if things are progressing smoothly
-        *  -1 if the reshape is finished, either because it is all done,
-        *     or due to an error.
+        *  -1 if the reshape is finished because it is all done,
+        *  -2 if the reshape is finished due to an error.
         */
 
        int advancing = (reshape->after.data_disks
@@ -3298,10 +3362,34 @@ int Grow_restart(struct supertype *st, struct mdinfo *info, int *fdlist, int cnt
 int Grow_continue(int mdfd, struct supertype *st, struct mdinfo *info,
                  char *backup_file)
 {
-       int err = sysfs_set_str(info, NULL, "array_state", "readonly");
+       char buf[40];
+       char *container = NULL;
+       int err;
+
+       err = sysfs_set_str(info, NULL, "array_state", "readonly");
        if (err)
                return err;
-       return reshape_array(NULL, mdfd, "array", st, info, 1, backup_file, 0, 0, 1);
-}
+       if (st->ss->external) {
+               fmt_devname(buf, st->container_dev);
+               container = buf;
+               freeze(st);
 
+               if (!mdmon_running(st->container_dev))
+                       start_mdmon(st->container_dev);
+               ping_monitor(devnum2devname(st->container_dev));
 
+
+               if (info->reshape_active == 2) {
+                       int cfd = open_dev(st->container_dev);
+                       if (cfd < 0)
+                               return 1;
+                       st->ss->load_container(st, cfd, container);
+                       close(cfd);
+                       return reshape_container(container, NULL,
+                                                st, info, 0, backup_file,
+                                                0, 1);
+               }
+       }
+       return reshape_array(container, mdfd, "array", st, info, 1,
+                            backup_file, 0, 0, 1);
+}