super-intel: enable loading metadata from non-IMSM compliant disks

[thirdparty/mdadm.git] / super-intel.c
diff --git a/super-intel.c b/super-intel.c

index 9a99d609b4a83079c1064222be483eb4791e2fe8..2b41e086bf19d73c4d240160ff106cb3ce47b501 100644 (file)
--- a/super-intel.c
+++ b/super-intel.c
@@ -230,9 +230,20 @@ static unsigned int mpb_sectors(struct imsm_super *mpb)
  struct intel_dev {
         struct imsm_dev *dev;
         struct intel_dev *next;
-       int index;
+       unsigned index;
  };
  
+struct intel_hba {
+       enum sys_dev_type type;
+       char *path;
+       char *pci_id;
+       struct intel_hba *next;
+};
+
+enum action {
+       DISK_REMOVE = 1,
+       DISK_ADD
+};
  /* internal representation of IMSM metadata */
  struct intel_super {
         union {
@@ -243,7 +254,6 @@ struct intel_super {
         void *next_buf; /* for realloc'ing buf from the manager */
         size_t next_len;
         int updates_pending; /* count of pending updates for mdmon */
-       int creating_imsm; /* flag to indicate container creation */
         int current_vol; /* index of raid device undergoing creation */
         __u32 create_offset; /* common start for 'current_vol' */
         __u32 random; /* random data for seeding new family numbers */
@@ -259,11 +269,13 @@ struct intel_super {
                 int extent_cnt;
                 struct extent *e; /* for determining freespace @ create */
                 int raiddisk; /* slot to fill in autolayout */
+               enum action action;
         } *disks;
-       struct dl *add; /* list of disks to add while mdmon active */
+       struct dl *disk_mgmt_list; /* list of disks to add/remove while mdmon
+                                     active */
         struct dl *missing; /* disks removed while we weren't looking */
         struct bbm_log *bbm_log;
-       const char *hba; /* device path of the raid controller for this metadata */
+       struct intel_hba *hba; /* device path of the raid controller for this metadata */
         const struct imsm_orom *orom; /* platform firmware support */
         struct intel_super *next; /* (temp) list for disambiguating family_num */
  };
@@ -279,11 +291,21 @@ struct extent {
         unsigned long long start, size;
  };
  
+/* definitions of reshape process types */
+enum imsm_reshape_type {
+       CH_TAKEOVER,
+       CH_MIGRATION,
+};
+
  /* definition of messages passed to imsm_process_update */
  enum imsm_update_type {
         update_activate_spare,
         update_create_array,
-       update_add_disk,
+       update_kill_array,
+       update_rename_array,
+       update_add_remove_disk,
+       update_reshape_container_disks,
+       update_takeover
  };
  
  struct imsm_update_activate_spare {
@@ -294,6 +316,33 @@ struct imsm_update_activate_spare {
         struct imsm_update_activate_spare *next;
  };
  
+struct geo_params {
+       int dev_id;
+       char *dev_name;
+       long long size;
+       int level;
+       int layout;
+       int chunksize;
+       int raid_disks;
+};
+
+enum takeover_direction {
+       R10_TO_R0,
+       R0_TO_R10
+};
+struct imsm_update_takeover {
+       enum imsm_update_type type;
+       int subarray;
+       enum takeover_direction direction;
+};
+
+struct imsm_update_reshape {
+       enum imsm_update_type type;
+       int old_raid_disks;
+       int new_raid_disks;
+       int new_disks[1]; /* new_raid_disks - old_raid_disks makedev number */
+};
+
  struct disk_info {
         __u8 serial[MAX_RAID_SERIAL_LEN];
  };
@@ -304,10 +353,132 @@ struct imsm_update_create_array {
         struct imsm_dev dev;
  };
  
-struct imsm_update_add_disk {
+struct imsm_update_kill_array {
+       enum imsm_update_type type;
+       int dev_idx;
+};
+
+struct imsm_update_rename_array {
+       enum imsm_update_type type;
+       __u8 name[MAX_RAID_SERIAL_LEN];
+       int dev_idx;
+};
+
+struct imsm_update_add_remove_disk {
         enum imsm_update_type type;
  };
  
+
+static const char *_sys_dev_type[] = {
+       [SYS_DEV_UNKNOWN] = "Unknown",
+       [SYS_DEV_SAS] = "SAS",
+       [SYS_DEV_SATA] = "SATA"
+};
+
+const char *get_sys_dev_type(enum sys_dev_type type)
+{
+       if (type >= SYS_DEV_MAX)
+               type = SYS_DEV_UNKNOWN;
+
+       return _sys_dev_type[type];
+}
+
+#ifndef MDASSEMBLE
+static struct intel_hba * alloc_intel_hba(struct sys_dev *device)
+{
+       struct intel_hba *result = malloc(sizeof(*result));
+       if (result) {
+               result->type = device->type;
+               result->path = strdup(device->path);
+               result->next = NULL;
+               if (result->path && (result->pci_id = strrchr(result->path, '/')) != NULL)
+                       result->pci_id++;
+       }
+       return result;
+}
+
+static struct intel_hba * find_intel_hba(struct intel_hba *hba, struct sys_dev *device)
+{
+       struct intel_hba *result=NULL;
+       for (result = hba; result; result = result->next) {
+               if (result->type == device->type && strcmp(result->path, device->path) == 0)
+                       break;
+       }
+       return result;
+}
+
+
+static int attach_hba_to_super(struct intel_super *super, struct sys_dev *device)
+{
+       struct intel_hba *hba;
+
+       /* check if disk attached to Intel HBA */
+       hba = find_intel_hba(super->hba, device);
+       if (hba != NULL)
+               return 1;
+       /* Check if HBA is already attached to super */
+       if (super->hba == NULL) {
+               super->hba = alloc_intel_hba(device);
+               return 1;
+       }
+
+       hba = super->hba;
+       /* Intel metadata allows for all disks attached to the same type HBA.
+        * Do not sypport odf HBA types mixing
+        */
+       if (device->type != hba->type)
+               return 2;
+
+       while (hba->next)
+               hba = hba->next;
+
+       hba->next = alloc_intel_hba(device);
+       return 1;
+}
+
+static struct sys_dev* find_disk_attached_hba(int fd, const char *devname)
+{
+       struct sys_dev *list, *elem, *prev;
+       char *disk_path;
+
+       if ((list = find_intel_devices()) == NULL)
+               return 0;
+
+       if (fd < 0)
+               disk_path  = (char *) devname;
+       else
+               disk_path = diskfd_to_devpath(fd);
+
+       if (!disk_path) {
+               free_sys_dev(&list);
+               return 0;
+       }
+
+       for (prev = NULL, elem = list; elem; prev = elem, elem = elem->next) {
+               if (path_attached_to_hba(disk_path, elem->path)) {
+                       if (prev == NULL)
+                               list = list->next;
+                       else
+                               prev->next = elem->next;
+                       elem->next = NULL;
+                       if (disk_path != devname)
+                               free(disk_path);
+                       free_sys_dev(&list);
+                       return elem;
+               }
+       }
+       if (disk_path != devname)
+               free(disk_path);
+       free_sys_dev(&list);
+
+       return NULL;
+}
+#endif /* MDASSEMBLE */
+
+
+static int find_intel_hba_capability(int fd, struct intel_super *super,
+                                    char *devname);
+
  static struct supertype *match_metadata_desc_imsm(char *arg)
  {
         struct supertype *st;
@@ -318,7 +489,10 @@ static struct supertype *match_metadata_desc_imsm(char *arg)
                 return NULL;
  
         st = malloc(sizeof(*st));
+       if (!st)
+               return NULL;
         memset(st, 0, sizeof(*st));
+       st->container_dev = NoMdDev;
         st->ss = &super_imsm;
         st->max_devs = IMSM_MAX_DEVICES;
         st->minor_version = 0;
@@ -343,19 +517,30 @@ static struct imsm_disk *__get_imsm_disk(struct imsm_super *mpb, __u8 index)
         return &mpb->disk[index];
  }
  
-#ifndef MDASSEMBLE
-/* retrieve a disk from the parsed metadata */
-static struct imsm_disk *get_imsm_disk(struct intel_super *super, __u8 index)
+/* retrieve the disk description based on a index of the disk
+ * in the sub-array
+ */
+static struct dl *get_imsm_dl_disk(struct intel_super *super, __u8 index)
  {
         struct dl *d;
  
         for (d = super->disks; d; d = d->next)
                 if (d->index == index)
-                       return &d->disk;
-       
+                       return d;
+
+       return NULL;
+}
+/* retrieve a disk from the parsed metadata */
+static struct imsm_disk *get_imsm_disk(struct intel_super *super, __u8 index)
+{
+       struct dl *dl;
+
+       dl = get_imsm_dl_disk(super, index);
+       if (dl)
+               return &dl->disk;
+
         return NULL;
  }
-#endif
  
  /* generate a checksum directly from the anchor when the anchor is known to be
   * up-to-date, currently only at load or write_super after coalescing
@@ -381,17 +566,24 @@ static size_t sizeof_imsm_map(struct imsm_map *map)
  
  struct imsm_map *get_imsm_map(struct imsm_dev *dev, int second_map)
  {
+       /* A device can have 2 maps if it is in the middle of a migration.
+        * If second_map is:
+        *    0   - we return the first map
+        *    1   - we return the second map if it exists, else NULL
+        *   -1   - we return the second map if it exists, else the first
+        */
         struct imsm_map *map = &dev->vol.map[0];
  
-       if (second_map && !dev->vol.migr_state)
+       if (second_map == 1 && !dev->vol.migr_state)
                 return NULL;
-       else if (second_map) {
+       else if (second_map == 1 ||
+                (second_map < 0 && dev->vol.migr_state)) {
                 void *ptr = map;
  
                 return ptr + sizeof_imsm_map(map);
         } else
                 return map;
-               
+
  }
  
  /* return the size of the device.
@@ -458,23 +650,28 @@ static struct imsm_dev *get_imsm_dev(struct intel_super *super, __u8 index)
         return NULL;
  }
  
-static __u32 get_imsm_ord_tbl_ent(struct imsm_dev *dev, int slot)
+/*
+ * for second_map:
+ *  == 0 get first map
+ *  == 1 get second map
+ *  == -1 than get map according to the current migr_state
+ */
+static __u32 get_imsm_ord_tbl_ent(struct imsm_dev *dev,
+                                 int slot,
+                                 int second_map)
  {
         struct imsm_map *map;
  
-       if (dev->vol.migr_state)
-               map = get_imsm_map(dev, 1);
-       else
-               map = get_imsm_map(dev, 0);
+       map = get_imsm_map(dev, second_map);
  
         /* top byte identifies disk under rebuild */
         return __le32_to_cpu(map->disk_ord_tbl[slot]);
  }
  
  #define ord_to_idx(ord) (((ord) << 8) >> 8)
-static __u32 get_imsm_disk_idx(struct imsm_dev *dev, int slot)
+static __u32 get_imsm_disk_idx(struct imsm_dev *dev, int slot, int second_map)
  {
-       __u32 ord = get_imsm_ord_tbl_ent(dev, slot);
+       __u32 ord = get_imsm_ord_tbl_ent(dev, slot, second_map);
  
         return ord_to_idx(ord);
  }
@@ -484,7 +681,7 @@ static void set_imsm_ord_tbl_ent(struct imsm_map *map, int slot, __u32 ord)
         map->disk_ord_tbl[slot] = __cpu_to_le32(ord);
  }
  
-static int get_imsm_disk_slot(struct imsm_map *map, int idx)
+static int get_imsm_disk_slot(struct imsm_map *map, unsigned idx)
  {
         int slot;
         __u32 ord;
@@ -578,7 +775,7 @@ static struct extent *get_extents(struct intel_super *super, struct dl *dl)
                  */
                 remainder &= ~1UL;
                 /* make sure remainder is still sane */
-               if (remainder < ROUND_UP(super->len, 512) >> 9)
+               if (remainder < (unsigned)ROUND_UP(super->len, 512) >> 9)
                         remainder = ROUND_UP(super->len, 512) >> 9;
                 if (reservation > remainder)
                         reservation = remainder;
@@ -634,22 +831,83 @@ static int is_failed(struct imsm_disk *disk)
         return (disk->status & FAILED_DISK) == FAILED_DISK;
  }
  
+/* Return minimum size of a spare that can be used in this array*/
+static unsigned long long min_acceptable_spare_size_imsm(struct supertype *st)
+{
+       struct intel_super *super = st->sb;
+       struct dl *dl;
+       struct extent *e;
+       int i;
+       unsigned long long rv = 0;
+
+       if (!super)
+               return rv;
+       /* find first active disk in array */
+       dl = super->disks;
+       while (dl && (is_failed(&dl->disk) || dl->index == -1))
+               dl = dl->next;
+       if (!dl)
+               return rv;
+       /* find last lba used by subarrays */
+       e = get_extents(super, dl);
+       if (!e)
+               return rv;
+       for (i = 0; e[i].size; i++)
+               continue;
+       if (i > 0)
+               rv = e[i-1].start + e[i-1].size;
+       free(e);
+       /* add the amount of space needed for metadata */
+       rv = rv + MPB_SECTOR_CNT + IMSM_RESERVED_SECTORS;
+       return rv * 512;
+}
+
  #ifndef MDASSEMBLE
+static __u64 blocks_per_migr_unit(struct imsm_dev *dev);
+
  static void print_imsm_dev(struct imsm_dev *dev, char *uuid, int disk_idx)
  {
         __u64 sz;
-       int slot;
+       int slot, i;
         struct imsm_map *map = get_imsm_map(dev, 0);
+       struct imsm_map *map2 = get_imsm_map(dev, 1);
         __u32 ord;
  
         printf("\n");
         printf("[%.16s]:\n", dev->volume);
         printf("           UUID : %s\n", uuid);
-       printf("     RAID Level : %d\n", get_imsm_raid_level(map));
-       printf("        Members : %d\n", map->num_members);
+       printf("     RAID Level : %d", get_imsm_raid_level(map));
+       if (map2)
+               printf(" <-- %d", get_imsm_raid_level(map2));
+       printf("\n");
+       printf("        Members : %d", map->num_members);
+       if (map2)
+               printf(" <-- %d", map2->num_members);
+       printf("\n");
+       printf("          Slots : [");
+       for (i = 0; i < map->num_members; i++) {
+               ord = get_imsm_ord_tbl_ent(dev, i, 0);
+               printf("%s", ord & IMSM_ORD_REBUILD ? "_" : "U");
+       }
+       printf("]");
+       if (map2) {
+               printf(" <-- [");
+               for (i = 0; i < map2->num_members; i++) {
+                       ord = get_imsm_ord_tbl_ent(dev, i, 1);
+                       printf("%s", ord & IMSM_ORD_REBUILD ? "_" : "U");
+               }
+               printf("]");
+       }
+       printf("\n");
+       printf("    Failed disk : ");
+       if (map->failed_disk_num == 0xff)
+               printf("none");
+       else
+               printf("%i", map->failed_disk_num);
+       printf("\n");
         slot = get_imsm_disk_slot(map, disk_idx);
         if (slot >= 0) {
-               ord = get_imsm_ord_tbl_ent(dev, slot);
+               ord = get_imsm_ord_tbl_ent(dev, slot, -1);
                 printf("      This Slot : %d%s\n", slot,
                        ord & IMSM_ORD_REBUILD ? " (out-of-sync)" : "");
         } else
@@ -666,30 +924,39 @@ static void print_imsm_dev(struct imsm_dev *dev, char *uuid, int disk_idx)
                 __le32_to_cpu(map->pba_of_lba0));
         printf("    Num Stripes : %u\n",
                 __le32_to_cpu(map->num_data_stripes));
-       printf("     Chunk Size : %u KiB\n",
+       printf("     Chunk Size : %u KiB",
                 __le16_to_cpu(map->blocks_per_strip) / 2);
+       if (map2)
+               printf(" <-- %u KiB",
+                       __le16_to_cpu(map2->blocks_per_strip) / 2);
+       printf("\n");
         printf("       Reserved : %d\n", __le32_to_cpu(dev->reserved_blocks));
-       printf("  Migrate State : %s", dev->vol.migr_state ? "migrating" : "idle\n");
+       printf("  Migrate State : ");
         if (dev->vol.migr_state) {
                 if (migr_type(dev) == MIGR_INIT)
-                       printf(": initializing\n");
+                       printf("initialize\n");
                 else if (migr_type(dev) == MIGR_REBUILD)
-                       printf(": rebuilding\n");
+                       printf("rebuild\n");
                 else if (migr_type(dev) == MIGR_VERIFY)
-                       printf(": check\n");
+                       printf("check\n");
                 else if (migr_type(dev) == MIGR_GEN_MIGR)
-                       printf(": general migration\n");
+                       printf("general migration\n");
                 else if (migr_type(dev) == MIGR_STATE_CHANGE)
-                       printf(": state change\n");
+                       printf("state change\n");
                 else if (migr_type(dev) == MIGR_REPAIR)
-                       printf(": repair\n");
+                       printf("repair\n");
                 else
-                       printf(": <unknown:%d>\n", migr_type(dev));
-       }
+                       printf("<unknown:%d>\n", migr_type(dev));
+       } else
+               printf("idle\n");
         printf("      Map State : %s", map_state_str[map->map_state]);
         if (dev->vol.migr_state) {
                 struct imsm_map *map = get_imsm_map(dev, 1);
+
                 printf(" <-- %s", map_state_str[map->map_state]);
+               printf("\n     Checkpoint : %u (%llu)",
+                      __le32_to_cpu(dev->vol.curr_migr_unit),
+                      (unsigned long long)blocks_per_migr_unit(dev));
         }
         printf("\n");
         printf("    Dirty State : %s\n", dev->vol.dirty ? "dirty" : "clean");
@@ -701,7 +968,7 @@ static void print_imsm_disk(struct imsm_super *mpb, int index, __u32 reserved)
         char str[MAX_RAID_SERIAL_LEN + 1];
         __u64 sz;
  
-       if (index < 0)
+       if (index < 0 || !disk)
                 return;
  
         printf("\n");
@@ -716,7 +983,7 @@ static void print_imsm_disk(struct imsm_super *mpb, int index, __u32 reserved)
                human_size(sz * 512));
  }
  
-static void getinfo_super_imsm(struct supertype *st, struct mdinfo *info);
+static void getinfo_super_imsm(struct supertype *st, struct mdinfo *info, char *map);
  
  static void examine_super_imsm(struct supertype *st, char *homehost)
  {
@@ -728,7 +995,7 @@ static void examine_super_imsm(struct supertype *st, char *homehost)
         char nbuf[64];
         __u32 sum;
         __u32 reserved = imsm_reserved_sectors(super, super->disks);
-
+       struct dl *dl;
  
         snprintf(str, MPB_SIG_LEN, "%s", mpb->sig);
         printf("          Magic : %s\n", str);
@@ -737,7 +1004,7 @@ static void examine_super_imsm(struct supertype *st, char *homehost)
         printf("    Orig Family : %08x\n", __le32_to_cpu(mpb->orig_family_num));
         printf("         Family : %08x\n", __le32_to_cpu(mpb->family_num));
         printf("     Generation : %08x\n", __le32_to_cpu(mpb->generation_num));
-       getinfo_super_imsm(st, &info);
+       getinfo_super_imsm(st, &info, NULL);
         fname_from_uuid(st, &info, nbuf, ':');
         printf("           UUID : %s\n", nbuf + 5);
         sum = __le32_to_cpu(mpb->check_sum);
@@ -764,7 +1031,7 @@ static void examine_super_imsm(struct supertype *st, char *homehost)
                 struct imsm_dev *dev = __get_imsm_dev(mpb, i);
  
                 super->current_vol = i;
-               getinfo_super_imsm(st, &info);
+               getinfo_super_imsm(st, &info, NULL);
                 fname_from_uuid(st, &info, nbuf, ':');
                 print_imsm_dev(dev, nbuf + 5, super->disks->index);
         }
@@ -773,6 +1040,26 @@ static void examine_super_imsm(struct supertype *st, char *homehost)
                         continue;
                 print_imsm_disk(mpb, i, reserved);
         }
+       for (dl = super->disks ; dl; dl = dl->next) {
+               struct imsm_disk *disk;
+               char str[MAX_RAID_SERIAL_LEN + 1];
+               __u64 sz;
+
+               if (dl->index >= 0)
+                       continue;
+
+               disk = &dl->disk;
+               printf("\n");
+               snprintf(str, MAX_RAID_SERIAL_LEN + 1, "%s", disk->serial);
+               printf("    Disk Serial : %s\n", str);
+               printf("          State :%s%s%s\n", is_spare(disk) ? " spare" : "",
+                      is_configured(disk) ? " active" : "",
+                      is_failed(disk) ? " failed" : "");
+               printf("             Id : %08x\n", __le32_to_cpu(disk->scsi_id));
+               sz = __le32_to_cpu(disk->total_blocks) - reserved;
+               printf("    Usable Size : %llu%s\n", (unsigned long long)sz,
+                      human_size(sz * 512));
+       }
  }
  
  static void brief_examine_super_imsm(struct supertype *st, int verbose)
@@ -787,7 +1074,7 @@ static void brief_examine_super_imsm(struct supertype *st, int verbose)
                 return;
         }
  
-       getinfo_super_imsm(st, &info);
+       getinfo_super_imsm(st, &info, NULL);
         fname_from_uuid(st, &info, nbuf, ':');
         printf("ARRAY metadata=imsm UUID=%s\n", nbuf + 5);
  }
@@ -804,13 +1091,13 @@ static void brief_examine_subarrays_imsm(struct supertype *st, int verbose)
         if (!super->anchor->num_raid_devs)
                 return;
  
-       getinfo_super_imsm(st, &info);
+       getinfo_super_imsm(st, &info, NULL);
         fname_from_uuid(st, &info, nbuf, ':');
         for (i = 0; i < super->anchor->num_raid_devs; i++) {
                 struct imsm_dev *dev = get_imsm_dev(super, i);
  
                 super->current_vol = i;
-               getinfo_super_imsm(st, &info);
+               getinfo_super_imsm(st, &info, NULL);
                 fname_from_uuid(st, &info, nbuf1, ':');
                 printf("ARRAY /dev/md/%.16s container=%s member=%d UUID=%s\n",
                        dev->volume, nbuf + 5, i, nbuf1 + 5);
@@ -824,7 +1111,7 @@ static void export_examine_super_imsm(struct supertype *st)
         struct mdinfo info;
         char nbuf[64];
  
-       getinfo_super_imsm(st, &info);
+       getinfo_super_imsm(st, &info, NULL);
         fname_from_uuid(st, &info, nbuf, ':');
         printf("MD_METADATA=imsm\n");
         printf("MD_LEVEL=container\n");
@@ -837,7 +1124,7 @@ static void detail_super_imsm(struct supertype *st, char *homehost)
         struct mdinfo info;
         char nbuf[64];
  
-       getinfo_super_imsm(st, &info);
+       getinfo_super_imsm(st, &info, NULL);
         fname_from_uuid(st, &info, nbuf, ':');
         printf("\n           UUID : %s\n", nbuf + 5);
  }
@@ -846,7 +1133,7 @@ static void brief_detail_super_imsm(struct supertype *st)
  {
         struct mdinfo info;
         char nbuf[64];
-       getinfo_super_imsm(st, &info);
+       getinfo_super_imsm(st, &info, NULL);
         fname_from_uuid(st, &info, nbuf, ':');
         printf(" UUID=%s", nbuf + 5);
  }
@@ -854,10 +1141,10 @@ static void brief_detail_super_imsm(struct supertype *st)
  static int imsm_read_serial(int fd, char *devname, __u8 *serial);
  static void fd2devname(int fd, char *name);
  
-static int imsm_enumerate_ports(const char *hba_path, int port_count, int host_base, int verbose)
+static int ahci_enumerate_ports(const char *hba_path, int port_count, int host_base, int verbose)
  {
-       /* dump an unsorted list of devices attached to ahci, as well as
-        * non-connected ports
+       /* dump an unsorted list of devices attached to AHCI Intel storage
+        * controller, as well as non-connected ports
          */
         int hba_len = strlen(hba_path) + 1;
         struct dirent *ent;
@@ -866,7 +1153,7 @@ static int imsm_enumerate_ports(const char *hba_path, int port_count, int host_b
         int err = 0;
         unsigned long port_mask = (1 << port_count) - 1;
  
-       if (port_count > sizeof(port_mask) * 8) {
+       if (port_count > (int)sizeof(port_mask) * 8) {
                 if (verbose)
                         fprintf(stderr, Name ": port_count %d out of range\n", port_count);
                 return 2;
@@ -959,6 +1246,12 @@ static int imsm_enumerate_ports(const char *hba_path, int port_count, int host_b
  
                 /* chop device path to 'host%d' and calculate the port number */
                 c = strchr(&path[hba_len], '/');
+               if (!c) {
+                       if (verbose)
+                               fprintf(stderr, Name ": %s - invalid path name\n", path + hba_len);
+                       err = 2;
+                       break;
+               }
                 *c = '\0';
                 if (sscanf(&path[hba_len], "host%d", &port) == 1)
                         port -= host_base;
@@ -1011,56 +1304,53 @@ static int imsm_enumerate_ports(const char *hba_path, int port_count, int host_b
         return err;
  }
  
-static int detail_platform_imsm(int verbose, int enumerate_only)
+
+
+static void print_found_intel_controllers(struct sys_dev *elem)
+{
+       for (; elem; elem = elem->next) {
+               fprintf(stderr, Name ": found Intel(R) ");
+               if (elem->type == SYS_DEV_SATA)
+                       fprintf(stderr, "SATA ");
+               else if (elem->type == SYS_DEV_SAS)
+                       fprintf(stderr, "SAS ");
+               fprintf(stderr, "RAID controller");
+               if (elem->pci_id)
+                       fprintf(stderr, " at %s", elem->pci_id);
+               fprintf(stderr, ".\n");
+       }
+       fflush(stderr);
+}
+
+static int ahci_get_port_count(const char *hba_path, int *port_count)
  {
-       /* There are two components to imsm platform support, the ahci SATA
-        * controller and the option-rom.  To find the SATA controller we
-        * simply look in /sys/bus/pci/drivers/ahci to see if an ahci
-        * controller with the Intel vendor id is present.  This approach
-        * allows mdadm to leverage the kernel's ahci detection logic, with the
-        * caveat that if ahci.ko is not loaded mdadm will not be able to
-        * detect platform raid capabilities.  The option-rom resides in a
-        * platform "Adapter ROM".  We scan for its signature to retrieve the
-        * platform capabilities.  If raid support is disabled in the BIOS the
-        * option-rom capability structure will not be available.
-        */
-       const struct imsm_orom *orom;
-       struct sys_dev *list, *hba;
-       DIR *dir;
         struct dirent *ent;
-       const char *hba_path;
-       int host_base = 0;
-       int port_count = 0;
+       DIR *dir;
+       int host_base = -1;
  
-       if (enumerate_only) {
-               if (check_env("IMSM_NO_PLATFORM") || find_imsm_orom())
-                       return 0;
-               return 2;
-       }
+       *port_count = 0;
+       if ((dir = opendir(hba_path)) == NULL)
+               return -1;
  
-       list = find_driver_devices("pci", "ahci");
-       for (hba = list; hba; hba = hba->next)
-               if (devpath_to_vendor(hba->path) == 0x8086)
-                       break;
+       for (ent = readdir(dir); ent; ent = readdir(dir)) {
+               int host;
  
-       if (!hba) {
-               if (verbose)
-                       fprintf(stderr, Name ": unable to find active ahci controller\n");
-               free_sys_dev(&list);
-               return 2;
-       } else if (verbose)
-               fprintf(stderr, Name ": found Intel SATA AHCI Controller\n");
-       hba_path = hba->path;
-       hba->path = NULL;
-       free_sys_dev(&list);
+               if (sscanf(ent->d_name, "host%d", &host) != 1)
+                       continue;
+               if (*port_count == 0)
+                       host_base = host;
+               else if (host < host_base)
+                       host_base = host;
  
-       orom = find_imsm_orom();
-       if (!orom) {
-               if (verbose)
-                       fprintf(stderr, Name ": imsm option-rom not found\n");
-               return 2;
+               if (host + 1 > *port_count + host_base)
+                       *port_count = host + 1 - host_base;
         }
+       closedir(dir);
+       return host_base;
+}
  
+static void print_imsm_capability(const struct imsm_orom *orom)
+{
         printf("       Platform : Intel(R) Matrix Storage Manager\n");
         printf("        Version : %d.%d.%d.%d\n", orom->major_ver, orom->minor_ver,
                orom->hotfix_ver, orom->build);
@@ -1089,35 +1379,81 @@ static int detail_platform_imsm(int verbose, int enumerate_only)
                imsm_orom_has_chunk(orom, 1024*64) ? " 64M" : "");
         printf("      Max Disks : %d\n", orom->tds);
         printf("    Max Volumes : %d\n", orom->vpa);
-       printf(" I/O Controller : %s\n", hba_path);
-
-       /* find the smallest scsi host number to determine a port number base */
-       dir = opendir(hba_path);
-       for (ent = dir ? readdir(dir) : NULL; ent; ent = readdir(dir)) {
-               int host;
-
-               if (sscanf(ent->d_name, "host%d", &host) != 1)
-                       continue;
-               if (port_count == 0)
-                       host_base = host;
-               else if (host < host_base)
-                       host_base = host;
+       return;
+}
  
-               if (host + 1 > port_count + host_base)
-                       port_count = host + 1 - host_base;
+static int detail_platform_imsm(int verbose, int enumerate_only)
+{
+       /* There are two components to imsm platform support, the ahci SATA
+        * controller and the option-rom.  To find the SATA controller we
+        * simply look in /sys/bus/pci/drivers/ahci to see if an ahci
+        * controller with the Intel vendor id is present.  This approach
+        * allows mdadm to leverage the kernel's ahci detection logic, with the
+        * caveat that if ahci.ko is not loaded mdadm will not be able to
+        * detect platform raid capabilities.  The option-rom resides in a
+        * platform "Adapter ROM".  We scan for its signature to retrieve the
+        * platform capabilities.  If raid support is disabled in the BIOS the
+        * option-rom capability structure will not be available.
+        */
+       const struct imsm_orom *orom;
+       struct sys_dev *list, *hba;
+       int host_base = 0;
+       int port_count = 0;
+       int result=0;
  
+       if (enumerate_only) {
+               if (check_env("IMSM_NO_PLATFORM"))
+                       return 0;
+               list = find_intel_devices();
+               if (!list)
+                       return 2;
+               for (hba = list; hba; hba = hba->next) {
+                       orom = find_imsm_capability(hba->type);
+                       if (!orom) {
+                               result = 2;
+                               break;
+                       }
+               }
+               free_sys_dev(&list);
+               return result;
         }
-       if (dir)
-               closedir(dir);
  
-       if (!port_count || imsm_enumerate_ports(hba_path, port_count,
-                                               host_base, verbose) != 0) {
+       list = find_intel_devices();
+       if (!list) {
                 if (verbose)
-                       fprintf(stderr, Name ": failed to enumerate ports\n");
+                       fprintf(stderr, Name ": no active Intel(R) RAID "
+                               "controller found.\n");
+               free_sys_dev(&list);
                 return 2;
+       } else if (verbose)
+               print_found_intel_controllers(list);
+
+       for (hba = list; hba; hba = hba->next) {
+               orom = find_imsm_capability(hba->type);
+               if (!orom)
+                       fprintf(stderr, Name ": imsm capabilities not found for controller: %s (type %s)\n",
+                               hba->path, get_sys_dev_type(hba->type));
+               else
+                       print_imsm_capability(orom);
         }
  
-       return 0;
+       for (hba = list; hba; hba = hba->next) {
+               printf(" I/O Controller : %s (%s)\n",
+                       hba->path, get_sys_dev_type(hba->type));
+
+               if (hba->type == SYS_DEV_SATA) {
+                       host_base = ahci_get_port_count(hba->path, &port_count);
+                       if (ahci_enumerate_ports(hba->path, port_count, host_base, verbose)) {
+                               if (verbose)
+                                       fprintf(stderr, Name ": failed to enumerate "
+                                               "ports on SATA controller at %s.", hba->pci_id);
+                               result |= 2;
+                       }
+               }
+       }
+
+       free_sys_dev(&list);
+       return result;
  }
  #endif
  
@@ -1215,44 +1551,272 @@ get_imsm_numerical_version(struct imsm_super *mpb, int *m, int *p)
  }
  #endif
  
-static int imsm_level_to_layout(int level)
+static __u32 migr_strip_blocks_resync(struct imsm_dev *dev)
  {
-       switch (level) {
-       case 0:
-       case 1:
-               return 0;
+       /* migr_strip_size when repairing or initializing parity */
+       struct imsm_map *map = get_imsm_map(dev, 0);
+       __u32 chunk = __le32_to_cpu(map->blocks_per_strip);
+
+       switch (get_imsm_raid_level(map)) {
         case 5:
-       case 6:
-               return ALGORITHM_LEFT_ASYMMETRIC;
         case 10:
-               return 0x102;
+               return chunk;
+       default:
+               return 128*1024 >> 9;
         }
-       return UnSet;
  }
  
-static void getinfo_super_imsm_volume(struct supertype *st, struct mdinfo *info)
+static __u32 migr_strip_blocks_rebuild(struct imsm_dev *dev)
  {
-       struct intel_super *super = st->sb;
-       struct imsm_dev *dev = get_imsm_dev(super, super->current_vol);
-       struct imsm_map *map = get_imsm_map(dev, 0);
-       struct dl *dl;
+       /* migr_strip_size when rebuilding a degraded disk, no idea why
+        * this is different than migr_strip_size_resync(), but it's good
+        * to be compatible
+        */
+       struct imsm_map *map = get_imsm_map(dev, 1);
+       __u32 chunk = __le32_to_cpu(map->blocks_per_strip);
  
-       for (dl = super->disks; dl; dl = dl->next)
-               if (dl->raiddisk == info->disk.raid_disk)
+       switch (get_imsm_raid_level(map)) {
+       case 1:
+       case 10:
+               if (map->num_members % map->num_domains == 0)
+                       return 128*1024 >> 9;
+               else
+                       return chunk;
+       case 5:
+               return max((__u32) 64*1024 >> 9, chunk);
+       default:
+               return 128*1024 >> 9;
+       }
+}
+
+static __u32 num_stripes_per_unit_resync(struct imsm_dev *dev)
+{
+       struct imsm_map *lo = get_imsm_map(dev, 0);
+       struct imsm_map *hi = get_imsm_map(dev, 1);
+       __u32 lo_chunk = __le32_to_cpu(lo->blocks_per_strip);
+       __u32 hi_chunk = __le32_to_cpu(hi->blocks_per_strip);
+
+       return max((__u32) 1, hi_chunk / lo_chunk);
+}
+
+static __u32 num_stripes_per_unit_rebuild(struct imsm_dev *dev)
+{
+       struct imsm_map *lo = get_imsm_map(dev, 0);
+       int level = get_imsm_raid_level(lo);
+
+       if (level == 1 || level == 10) {
+               struct imsm_map *hi = get_imsm_map(dev, 1);
+
+               return hi->num_domains;
+       } else
+               return num_stripes_per_unit_resync(dev);
+}
+
+static __u8 imsm_num_data_members(struct imsm_dev *dev, int second_map)
+{
+       /* named 'imsm_' because raid0, raid1 and raid10
+        * counter-intuitively have the same number of data disks
+        */
+       struct imsm_map *map = get_imsm_map(dev, second_map);
+
+       switch (get_imsm_raid_level(map)) {
+       case 0:
+       case 1:
+       case 10:
+               return map->num_members;
+       case 5:
+               return map->num_members - 1;
+       default:
+               dprintf("%s: unsupported raid level\n", __func__);
+               return 0;
+       }
+}
+
+static __u32 parity_segment_depth(struct imsm_dev *dev)
+{
+       struct imsm_map *map = get_imsm_map(dev, 0);
+       __u32 chunk =  __le32_to_cpu(map->blocks_per_strip);
+
+       switch(get_imsm_raid_level(map)) {
+       case 1:
+       case 10:
+               return chunk * map->num_domains;
+       case 5:
+               return chunk * map->num_members;
+       default:
+               return chunk;
+       }
+}
+
+static __u32 map_migr_block(struct imsm_dev *dev, __u32 block)
+{
+       struct imsm_map *map = get_imsm_map(dev, 1);
+       __u32 chunk = __le32_to_cpu(map->blocks_per_strip);
+       __u32 strip = block / chunk;
+
+       switch (get_imsm_raid_level(map)) {
+       case 1:
+       case 10: {
+               __u32 vol_strip = (strip * map->num_domains) + 1;
+               __u32 vol_stripe = vol_strip / map->num_members;
+
+               return vol_stripe * chunk + block % chunk;
+       } case 5: {
+               __u32 stripe = strip / (map->num_members - 1);
+
+               return stripe * chunk + block % chunk;
+       }
+       default:
+               return 0;
+       }
+}
+
+static __u64 blocks_per_migr_unit(struct imsm_dev *dev)
+{
+       /* calculate the conversion factor between per member 'blocks'
+        * (md/{resync,rebuild}_start) and imsm migration units, return
+        * 0 for the 'not migrating' and 'unsupported migration' cases
+        */
+       if (!dev->vol.migr_state)
+               return 0;
+
+       switch (migr_type(dev)) {
+       case MIGR_GEN_MIGR:
+       case MIGR_VERIFY:
+       case MIGR_REPAIR:
+       case MIGR_INIT: {
+               struct imsm_map *map = get_imsm_map(dev, 0);
+               __u32 stripes_per_unit;
+               __u32 blocks_per_unit;
+               __u32 parity_depth;
+               __u32 migr_chunk;
+               __u32 block_map;
+               __u32 block_rel;
+               __u32 segment;
+               __u32 stripe;
+               __u8  disks;
+
+               /* yes, this is really the translation of migr_units to
+                * per-member blocks in the 'resync' case
+                */
+               stripes_per_unit = num_stripes_per_unit_resync(dev);
+               migr_chunk = migr_strip_blocks_resync(dev);
+               disks = imsm_num_data_members(dev, 0);
+               blocks_per_unit = stripes_per_unit * migr_chunk * disks;
+               stripe = __le32_to_cpu(map->blocks_per_strip) * disks;
+               segment = blocks_per_unit / stripe;
+               block_rel = blocks_per_unit - segment * stripe;
+               parity_depth = parity_segment_depth(dev);
+               block_map = map_migr_block(dev, block_rel);
+               return block_map + parity_depth * segment;
+       }
+       case MIGR_REBUILD: {
+               __u32 stripes_per_unit;
+               __u32 migr_chunk;
+
+               stripes_per_unit = num_stripes_per_unit_rebuild(dev);
+               migr_chunk = migr_strip_blocks_rebuild(dev);
+               return migr_chunk * stripes_per_unit;
+       }
+       case MIGR_STATE_CHANGE:
+       default:
+               return 0;
+       }
+}
+
+static int imsm_level_to_layout(int level)
+{
+       switch (level) {
+       case 0:
+       case 1:
+               return 0;
+       case 5:
+       case 6:
+               return ALGORITHM_LEFT_ASYMMETRIC;
+       case 10:
+               return 0x102;
+       }
+       return UnSet;
+}
+
+static void getinfo_super_imsm_volume(struct supertype *st, struct mdinfo *info, char *dmap)
+{
+       struct intel_super *super = st->sb;
+       struct imsm_dev *dev = get_imsm_dev(super, super->current_vol);
+       struct imsm_map *map = get_imsm_map(dev, 0);
+       struct imsm_map *prev_map = get_imsm_map(dev, 1);
+       struct imsm_map *map_to_analyse = map;
+       struct dl *dl;
+       char *devname;
+       int map_disks = info->array.raid_disks;
+
+       if (prev_map)
+               map_to_analyse = prev_map;
+
+       for (dl = super->disks; dl; dl = dl->next)
+               if (dl->raiddisk == info->disk.raid_disk)
                         break;
         info->container_member    = super->current_vol;
-       info->array.raid_disks    = map->num_members;
-       info->array.level         = get_imsm_raid_level(map);
+       info->array.raid_disks    = map_to_analyse->num_members;
+       info->array.level         = get_imsm_raid_level(map_to_analyse);
         info->array.layout        = imsm_level_to_layout(info->array.level);
         info->array.md_minor      = -1;
         info->array.ctime         = 0;
         info->array.utime         = 0;
-       info->array.chunk_size    = __le16_to_cpu(map->blocks_per_strip) << 9;
+       info->array.chunk_size    =
+               __le16_to_cpu(map_to_analyse->blocks_per_strip) << 9;
         info->array.state         = !dev->vol.dirty;
         info->custom_array_size   = __le32_to_cpu(dev->size_high);
         info->custom_array_size   <<= 32;
         info->custom_array_size   |= __le32_to_cpu(dev->size_low);
-
+       if (prev_map && map->map_state == prev_map->map_state) {
+               info->reshape_active = 1;
+               info->new_level = get_imsm_raid_level(map);
+               info->new_layout = imsm_level_to_layout(info->new_level);
+               info->new_chunk = __le16_to_cpu(map->blocks_per_strip) << 9;
+               info->delta_disks = map->num_members - prev_map->num_members;
+               if (info->delta_disks) {
+                       /* this needs to be applied to every array
+                        * in the container.
+                        */
+                       info->reshape_active = 2;
+               }
+               /* We shape information that we give to md might have to be
+                * modify to cope with md's requirement for reshaping arrays.
+                * For example, when reshaping a RAID0, md requires it to be
+                * presented as a degraded RAID4.
+                * Also if a RAID0 is migrating to a RAID5 we need to specify
+                * the array as already being RAID5, but the 'before' layout
+                * is a RAID4-like layout.
+                */
+               switch (info->array.level) {
+               case 0:
+                       switch(info->new_level) {
+                       case 0:
+                               /* conversion is happening as RAID4 */
+                               info->array.level = 4;
+                               info->array.raid_disks += 1;
+                               break;
+                       case 5:
+                               /* conversion is happening as RAID5 */
+                               info->array.level = 5;
+                               info->array.layout = ALGORITHM_PARITY_N;
+                               info->array.raid_disks += 1;
+                               info->delta_disks -= 1;
+                               break;
+                       default:
+                               /* FIXME error message */
+                               info->array.level = UnSet;
+                               break;
+                       }
+                       break;
+               }
+       } else {
+               info->new_level = UnSet;
+               info->new_layout = UnSet;
+               info->new_chunk = info->array.chunk_size;
+               info->delta_disks = 0;
+       }
         info->disk.major = 0;
         info->disk.minor = 0;
         if (dl) {
@@ -1260,68 +1824,123 @@ static void getinfo_super_imsm_volume(struct supertype *st, struct mdinfo *info)
                 info->disk.minor = dl->minor;
         }
  
-       info->data_offset         = __le32_to_cpu(map->pba_of_lba0);
-       info->component_size      = __le32_to_cpu(map->blocks_per_member);
+       info->data_offset         = __le32_to_cpu(map_to_analyse->pba_of_lba0);
+       info->component_size      =
+               __le32_to_cpu(map_to_analyse->blocks_per_member);
         memset(info->uuid, 0, sizeof(info->uuid));
+       info->recovery_start = MaxSector;
  
-       if (map->map_state == IMSM_T_STATE_UNINITIALIZED || dev->vol.dirty)
-               info->resync_start = 0;
-       else if (dev->vol.migr_state)
-               /* FIXME add curr_migr_unit to resync_start conversion */
+       info->reshape_progress = 0;
+       info->resync_start = MaxSector;
+       if (map_to_analyse->map_state == IMSM_T_STATE_UNINITIALIZED ||
+           dev->vol.dirty) {
                 info->resync_start = 0;
-       else
-               info->resync_start = ~0ULL;
+       }
+       if (dev->vol.migr_state) {
+               switch (migr_type(dev)) {
+               case MIGR_REPAIR:
+               case MIGR_INIT: {
+                       __u64 blocks_per_unit = blocks_per_migr_unit(dev);
+                       __u64 units = __le32_to_cpu(dev->vol.curr_migr_unit);
+
+                       info->resync_start = blocks_per_unit * units;
+                       break;
+               }
+               case MIGR_GEN_MIGR: {
+                       __u64 blocks_per_unit = blocks_per_migr_unit(dev);
+                       __u64 units = __le32_to_cpu(dev->vol.curr_migr_unit);
+                       unsigned long long array_blocks;
+                       int used_disks;
+
+                       info->reshape_progress = blocks_per_unit * units;
+
+                       /* checkpoint is written per disks unit
+                        * recalculate it to reshape position
+                        */
+                       used_disks = imsm_num_data_members(dev, 0);
+                       info->reshape_progress *= used_disks;
+                       dprintf("IMSM: General Migration checkpoint : %llu "
+                              "(%llu) -> read reshape progress : %llu\n",
+                               units, blocks_per_unit, info->reshape_progress);
+
+                       used_disks = imsm_num_data_members(dev, 1);
+                       if (used_disks > 0) {
+                               array_blocks = map->blocks_per_member *
+                                       used_disks;
+                               /* round array size down to closest MB
+                                */
+                               info->custom_array_size = (array_blocks
+                                               >> SECT_PER_MB_SHIFT)
+                                               << SECT_PER_MB_SHIFT;
+                       }
+               }
+               case MIGR_VERIFY:
+                       /* we could emulate the checkpointing of
+                        * 'sync_action=check' migrations, but for now
+                        * we just immediately complete them
+                        */
+               case MIGR_REBUILD:
+                       /* this is handled by container_content_imsm() */
+               case MIGR_STATE_CHANGE:
+                       /* FIXME handle other migrations */
+               default:
+                       /* we are not dirty, so... */
+                       info->resync_start = MaxSector;
+               }
+       }
  
         strncpy(info->name, (char *) dev->volume, MAX_RAID_SERIAL_LEN);
         info->name[MAX_RAID_SERIAL_LEN] = 0;
  
         info->array.major_version = -1;
         info->array.minor_version = -2;
-       sprintf(info->text_version, "/%s/%d",
-               devnum2devname(st->container_dev),
-               info->container_member);
+       devname = devnum2devname(st->container_dev);
+       *info->text_version = '\0';
+       if (devname)
+               sprintf(info->text_version, "/%s/%d", devname, info->container_member);
+       free(devname);
         info->safe_mode_delay = 4000;  /* 4 secs like the Matrix driver */
         uuid_from_super_imsm(st, info->uuid);
-}
-
-/* check the config file to see if we can return a real uuid for this spare */
-static void fixup_container_spare_uuid(struct mdinfo *inf)
-{
-       struct mddev_ident_s *array_list;
-
-       if (inf->array.level != LEVEL_CONTAINER ||
-           memcmp(inf->uuid, uuid_match_any, sizeof(int[4])) != 0)
-               return;
-
-       array_list = conf_get_ident(NULL);
-
-       for (; array_list; array_list = array_list->next) {
-               if (array_list->uuid_set) {
-                       struct supertype *_sst; /* spare supertype */
-                       struct supertype *_cst; /* container supertype */
  
-                       _cst = array_list->st;
-                       if (_cst)
-                               _sst = _cst->ss->match_metadata_desc(inf->text_version);
-                       else
-                               _sst = NULL;
-
-                       if (_sst) {
-                               memcpy(inf->uuid, array_list->uuid, sizeof(int[4]));
-                               free(_sst);
-                               break;
+       if (dmap) {
+               int i, j;
+               for (i=0; i<map_disks; i++) {
+                       dmap[i] = 0;
+                       if (i < info->array.raid_disks) {
+                               struct imsm_disk *dsk;
+                               j = get_imsm_disk_idx(dev, i, -1);
+                               dsk = get_imsm_disk(super, j);
+                               if (dsk && (dsk->status & CONFIGURED_DISK))
+                                       dmap[i] = 1;
                         }
                 }
         }
  }
  
-static void getinfo_super_imsm(struct supertype *st, struct mdinfo *info)
+static __u8 imsm_check_degraded(struct intel_super *super, struct imsm_dev *dev, int failed);
+static int imsm_count_failed(struct intel_super *super, struct imsm_dev *dev);
+
+static struct imsm_disk *get_imsm_missing(struct intel_super *super, __u8 index)
+{
+       struct dl *d;
+
+       for (d = super->missing; d; d = d->next)
+               if (d->index == index)
+                       return &d->disk;
+       return NULL;
+}
+
+static void getinfo_super_imsm(struct supertype *st, struct mdinfo *info, char *map)
  {
         struct intel_super *super = st->sb;
         struct imsm_disk *disk;
+       int map_disks = info->array.raid_disks;
+       int max_enough = -1;
+       int i;
+       struct imsm_super *mpb;
  
         if (super->current_vol >= 0) {
-               getinfo_super_imsm_volume(st, info);
+               getinfo_super_imsm_volume(st, info, map);
                 return;
         }
  
@@ -1347,6 +1966,50 @@ static void getinfo_super_imsm(struct supertype *st, struct mdinfo *info)
         info->disk.number = -1;
         info->disk.state = 0;
         info->name[0] = 0;
+       info->recovery_start = MaxSector;
+
+       /* do we have the all the insync disks that we expect? */
+       mpb = super->anchor;
+
+       for (i = 0; i < mpb->num_raid_devs; i++) {
+               struct imsm_dev *dev = get_imsm_dev(super, i);
+               int failed, enough, j, missing = 0;
+               struct imsm_map *map;
+               __u8 state;
+
+               failed = imsm_count_failed(super, dev);
+               state = imsm_check_degraded(super, dev, failed);
+               map = get_imsm_map(dev, dev->vol.migr_state);
+
+               /* any newly missing disks?
+                * (catches single-degraded vs double-degraded)
+                */
+               for (j = 0; j < map->num_members; j++) {
+                       __u32 ord = get_imsm_ord_tbl_ent(dev, i, -1);
+                       __u32 idx = ord_to_idx(ord);
+
+                       if (!(ord & IMSM_ORD_REBUILD) &&
+                           get_imsm_missing(super, idx)) {
+                               missing = 1;
+                               break;
+                       }
+               }
+
+               if (state == IMSM_T_STATE_FAILED)
+                       enough = -1;
+               else if (state == IMSM_T_STATE_DEGRADED &&
+                        (state != map->map_state || missing))
+                       enough = 0;
+               else /* we're normal, or already degraded */
+                       enough = 1;
+
+               /* in the missing/failed disk case check to see
+                * if at least one array is runnable
+                */
+               max_enough = max(max_enough, enough);
+       }
+       dprintf("%s: enough: %d\n", __func__, max_enough);
+       info->container_enough = max_enough;
  
         if (super->disks) {
                 __u32 reserved = imsm_reserved_sectors(super, super->disks);
@@ -1368,10 +2031,61 @@ static void getinfo_super_imsm(struct supertype *st, struct mdinfo *info)
          */
         if (info->disk.state & (1 << MD_DISK_SYNC) || super->anchor->num_raid_devs)
                 uuid_from_super_imsm(st, info->uuid);
-       else {
-               memcpy(info->uuid, uuid_match_any, sizeof(int[4]));
-               fixup_container_spare_uuid(info);
+       else
+               memcpy(info->uuid, uuid_zero, sizeof(uuid_zero));
+
+       /* I don't know how to compute 'map' on imsm, so use safe default */
+       if (map) {
+               int i;
+               for (i = 0; i < map_disks; i++)
+                       map[i] = 1;
+       }
+
+}
+
+/* allocates memory and fills disk in mdinfo structure
+ * for each disk in array */
+struct mdinfo *getinfo_super_disks_imsm(struct supertype *st)
+{
+       struct mdinfo *mddev = NULL;
+       struct intel_super *super = st->sb;
+       struct imsm_disk *disk;
+       int count = 0;
+       struct dl *dl;
+       if (!super || !super->disks)
+               return NULL;
+       dl = super->disks;
+       mddev = malloc(sizeof(*mddev));
+       if (!mddev) {
+               fprintf(stderr, Name ": Failed to allocate memory.\n");
+               return NULL;
         }
+       memset(mddev, 0, sizeof(*mddev));
+       while (dl) {
+               struct mdinfo *tmp;
+               disk = &dl->disk;
+               tmp = malloc(sizeof(*tmp));
+               if (!tmp) {
+                       fprintf(stderr, Name ": Failed to allocate memory.\n");
+                       if (mddev)
+                               sysfs_free(mddev);
+                       return NULL;
+               }
+               memset(tmp, 0, sizeof(*tmp));
+               if (mddev->devs)
+                       tmp->next = mddev->devs;
+               mddev->devs = tmp;
+               tmp->disk.number = count++;
+               tmp->disk.major = dl->major;
+               tmp->disk.minor = dl->minor;
+               tmp->disk.state = is_configured(disk) ?
+                                 (1 << MD_DISK_ACTIVE) : 0;
+               tmp->disk.state |= is_failed(disk) ? (1 << MD_DISK_FAULTY) : 0;
+               tmp->disk.state |= is_spare(disk) ? 0 : (1 << MD_DISK_SYNC);
+               tmp->disk.raid_disk = -1;
+               dl = dl->next;
+       }
+       return mddev;
  }
  
  static int update_super_imsm(struct supertype *st, struct mdinfo *info,
@@ -1413,8 +2127,7 @@ static int update_super_imsm(struct supertype *st, struct mdinfo *info,
         mpb = super->anchor;
  
         if (strcmp(update, "uuid") == 0 && uuid_set && !info->update_private)
-               fprintf(stderr,
-                       Name ": '--uuid' not supported for imsm metadata\n");
+               rv = -1;
         else if (strcmp(update, "uuid") == 0 && uuid_set && info->update_private) {
                 mpb->orig_family_num = *((__u32 *) info->update_private);
                 rv = 0;
@@ -1435,9 +2148,7 @@ static int update_super_imsm(struct supertype *st, struct mdinfo *info,
         } else if (strcmp(update, "assemble") == 0)
                 rv = 0;
         else
-               fprintf(stderr,
-                       Name ": '--update=%s' not supported for imsm metadata\n",
-                       update);
+               rv = -1;
  
         /* successful update? recompute checksum */
         if (rv == 0)
@@ -1503,6 +2214,19 @@ static int compare_super_imsm(struct supertype *st, struct supertype *tst)
                  tst->sb = NULL;
                  return 0;
          }
+       /* in platform dependent environment test if the disks
+        * use the same Intel hba
+        */
+       if (!check_env("IMSM_NO_PLATFORM")) {
+               if (!first->hba || !sec->hba ||
+                   (first->hba->type != sec->hba->type))  {
+                       fprintf(stderr,
+                               "HBAs of devices does not match %s != %s\n",
+                               first->hba ? get_sys_dev_type(first->hba->type) : NULL,
+                               sec->hba ? get_sys_dev_type(sec->hba->type) : NULL);
+                       return 3;
+               }
+       }
  
         /* if an anchor does not have num_raid_devs set then it is a free
          * floating spare
@@ -1566,6 +2290,7 @@ static int compare_super_imsm(struct supertype *st, struct supertype *tst)
                 first->anchor->num_raid_devs = sec->anchor->num_raid_devs;
                 first->anchor->orig_family_num = sec->anchor->orig_family_num;
                 first->anchor->family_num = sec->anchor->family_num;
+               memcpy(first->anchor->sig, sec->anchor->sig, MAX_SIGNATURE_LENGTH);
                 for (i = 0; i < sec->anchor->num_raid_devs; i++)
                         imsm_copy_dev(get_imsm_dev(first, i), get_imsm_dev(sec, i));
         }
@@ -1577,7 +2302,7 @@ static void fd2devname(int fd, char *name)
  {
         struct stat st;
         char path[256];
-       char dname[100];
+       char dname[PATH_MAX];
         char *nm;
         int rv;
  
@@ -1793,7 +2518,8 @@ static void migrate(struct imsm_dev *dev, __u8 to_state, int migr_type)
  
         /* duplicate and then set the target end state in map[0] */
         memcpy(dest, src, sizeof_imsm_map(src));
-       if (migr_type == MIGR_REBUILD) {
+       if ((migr_type == MIGR_REBUILD) ||
+           (migr_type ==  MIGR_GEN_MIGR)) {
                 __u32 ord;
                 int i;
  
@@ -1810,18 +2536,26 @@ static void end_migration(struct imsm_dev *dev, __u8 map_state)
  {
         struct imsm_map *map = get_imsm_map(dev, 0);
         struct imsm_map *prev = get_imsm_map(dev, dev->vol.migr_state);
-       int i;
+       int i, j;
  
         /* merge any IMSM_ORD_REBUILD bits that were not successfully
          * completed in the last migration.
          *
-        * FIXME add support for online capacity expansion and
-        * raid-level-migration
+        * FIXME add support for raid-level-migration
          */
         for (i = 0; i < prev->num_members; i++)
-               map->disk_ord_tbl[i] |= prev->disk_ord_tbl[i];
+               for (j = 0; j < map->num_members; j++)
+                       /* during online capacity expansion
+                        * disks position can be changed if takeover is used
+                        */
+                       if (ord_to_idx(map->disk_ord_tbl[j]) ==
+                           ord_to_idx(prev->disk_ord_tbl[i])) {
+                               map->disk_ord_tbl[j] |= prev->disk_ord_tbl[i];
+                               break;
+                       }
  
         dev->vol.migr_state = 0;
+       dev->vol.migr_type = 0;
         dev->vol.curr_migr_unit = 0;
         map->map_state = map_state;
  }
@@ -1832,6 +2566,7 @@ static int parse_raid_devices(struct intel_super *super)
         int i;
         struct imsm_dev *dev_new;
         size_t len, len_migr;
+       size_t max_len = 0;
         size_t space_needed = 0;
         struct imsm_super *mpb = super->anchor;
  
@@ -1847,7 +2582,11 @@ static int parse_raid_devices(struct intel_super *super)
                 dv = malloc(sizeof(*dv));
                 if (!dv)
                         return 1;
-               dev_new = malloc(len_migr);
+               if (max_len < len_migr)
+                       max_len = len_migr;
+               if (max_len > len_migr)
+                       space_needed += max_len - len_migr;
+               dev_new = malloc(max_len);
                 if (!dev_new) {
                         free(dv);
                         return 1;
@@ -1895,7 +2634,7 @@ struct bbm_log *__get_imsm_bbm_log(struct imsm_super *mpb)
  static void __free_imsm(struct intel_super *super, int free_disks);
  
  /* load_imsm_mpb - read matrix metadata
- * allocates super->mpb to be freed by free_super
+ * allocates super->mpb to be freed by free_imsm
   */
  static int load_imsm_mpb(int fd, struct intel_super *super, char *devname)
  {
@@ -1906,6 +2645,13 @@ static int load_imsm_mpb(int fd, struct intel_super *super, char *devname)
         __u32 check_sum;
  
         get_dev_size(fd, NULL, &dsize);
+       if (dsize < 1024) {
+               if (devname)
+                       fprintf(stderr,
+                               Name ": %s: device to small for imsm\n",
+                               devname);
+               return 1;
+       }
  
         if (lseek64(fd, dsize - (512 * 2), SEEK_SET) < 0) {
                 if (devname)
@@ -1940,6 +2686,10 @@ static int load_imsm_mpb(int fd, struct intel_super *super, char *devname)
         }
  
         __free_imsm(super, 0);
+       /*  reload capability and hba */
+
+       /* capability and hba must be updated with new super allocation */
+       find_intel_hba_capability(fd, super, devname);
         super->len = ROUND_UP(anchor->mpb_size, 512);
         if (posix_memalign(&super->buf, 512, super->len) != 0) {
                 if (devname)
@@ -1977,7 +2727,7 @@ static int load_imsm_mpb(int fd, struct intel_super *super, char *devname)
                 return 1;
         }
  
-       if (read(fd, super->buf + 512, super->len - 512) != super->len - 512) {
+       if ((unsigned)read(fd, super->buf + 512, super->len - 512) != super->len - 512) {
                 if (devname)
                         fprintf(stderr,
                                 Name ": Cannot read extended mpb on %s: %s\n",
@@ -2031,6 +2781,7 @@ static void __free_imsm_disk(struct dl *d)
         free(d);
  
  }
+
  static void free_imsm_disks(struct intel_super *super)
  {
         struct dl *d;
@@ -2040,6 +2791,11 @@ static void free_imsm_disks(struct intel_super *super)
                 super->disks = d->next;
                 __free_imsm_disk(d);
         }
+       while (super->disk_mgmt_list) {
+               d = super->disk_mgmt_list;
+               super->disk_mgmt_list = d->next;
+               __free_imsm_disk(d);
+       }
         while (super->missing) {
                 d = super->missing;
                 super->missing = d->next;
@@ -2051,17 +2807,26 @@ static void free_imsm_disks(struct intel_super *super)
  /* free all the pieces hanging off of a super pointer */
  static void __free_imsm(struct intel_super *super, int free_disks)
  {
+       struct intel_hba *elem, *next;
+
         if (super->buf) {
                 free(super->buf);
                 super->buf = NULL;
         }
+       /* unlink capability description */
+       super->orom = NULL;
         if (free_disks)
                 free_imsm_disks(super);
         free_devlist(super);
-       if (super->hba) {
-               free((void *) super->hba);
-               super->hba = NULL;
-       }
+       elem = super->hba;
+       while (elem) {
+               if (elem->path)
+                       free((void *)elem->path);
+               next = elem->next;
+               free(elem);
+               elem = next;
+       }
+       super->hba = NULL;
  }
  
  static void free_imsm(struct intel_super *super)
@@ -2081,34 +2846,72 @@ static void free_super_imsm(struct supertype *st)
         st->sb = NULL;
  }
  
-static struct intel_super *alloc_super(int creating_imsm)
+static struct intel_super *alloc_super(void)
  {
         struct intel_super *super = malloc(sizeof(*super));
  
         if (super) {
                 memset(super, 0, sizeof(*super));
-               super->creating_imsm = creating_imsm;
                 super->current_vol = -1;
                 super->create_offset = ~((__u32 ) 0);
-               if (!check_env("IMSM_NO_PLATFORM"))
-                       super->orom = find_imsm_orom();
-               if (super->orom && !check_env("IMSM_TEST_OROM")) {
-                       struct sys_dev *list, *ent;
-
-                       /* find the first intel ahci controller */
-                       list = find_driver_devices("pci", "ahci");
-                       for (ent = list; ent; ent = ent->next)
-                               if (devpath_to_vendor(ent->path) == 0x8086)
-                                       break;
-                       if (ent) {
-                               super->hba = ent->path;
-                               ent->path = NULL;
+       }
+       return super;
+}
+
+/*
+ * find and allocate hba and OROM/EFI based on valid fd of RAID component device
+ */
+static int find_intel_hba_capability(int fd, struct intel_super *super, char *devname)
+{
+       struct sys_dev *hba_name;
+       int rv = 0;
+
+       if ((fd < 0) || check_env("IMSM_NO_PLATFORM")) {
+               super->orom = NULL;
+               super->hba = NULL;
+               return 0;
+       }
+       hba_name = find_disk_attached_hba(fd, NULL);
+       if (!hba_name) {
+               if (devname)
+                       fprintf(stderr,
+                               Name ": %s is not attached to Intel(R) RAID controller.\n",
+                               devname);
+               return 1;
+       }
+       rv = attach_hba_to_super(super, hba_name);
+       if (rv == 2) {
+               if (devname) {
+                       struct intel_hba *hba = super->hba;
+
+                       fprintf(stderr, Name ": %s is attached to Intel(R) %s RAID "
+                               "controller (%s),\n"
+                               "    but the container is assigned to Intel(R) "
+                               "%s RAID controller (",
+                               devname,
+                               hba_name->path,
+                               hba_name->pci_id ? : "Err!",
+                               get_sys_dev_type(hba_name->type));
+
+                       while (hba) {
+                               fprintf(stderr, "%s", hba->pci_id ? : "Err!");
+                               if (hba->next)
+                                       fprintf(stderr, ", ");
+                               hba = hba->next;
                         }
-                       free_sys_dev(&list);
+
+                       fprintf(stderr, ").\n"
+                               "    Mixing devices attached to different controllers "
+                               "is not allowed.\n");
                 }
+               free_sys_dev(&hba_name);
+               return 2;
         }
-
-       return super;
+       super->orom = find_imsm_capability(hba_name->type);
+       free_sys_dev(&hba_name);
+       if (!super->orom)
+               return 3;
+       return 0;
  }
  
  #ifndef MDASSEMBLE
@@ -2428,7 +3231,7 @@ imsm_thunderdome(struct intel_super **super_list, int len)
                         struct intel_disk *idisk;
  
                         idisk = disk_list_get(dl->serial, disk_list);
-                       if (is_spare(&idisk->disk) &&
+                       if (idisk && is_spare(&idisk->disk) &&
                             !is_failed(&idisk->disk) && !is_configured(&idisk->disk))
                                 dl->index = -1;
                         else {
@@ -2464,7 +3267,7 @@ imsm_thunderdome(struct intel_super **super_list, int len)
  }
  
  static int load_super_imsm_all(struct supertype *st, int fd, void **sbp,
-                              char *devname, int keep_fd)
+                              char *devname)
  {
         struct mdinfo *sra;
         struct intel_super *super_list = NULL;
@@ -2474,27 +3277,24 @@ static int load_super_imsm_all(struct supertype *st, int fd, void **sbp,
         int retry;
         int err = 0;
         int i;
-       enum sysfs_read_flags flags;
-
-       flags = GET_LEVEL|GET_VERSION|GET_DEVS|GET_STATE;
-       if (mdmon_running(devnum))
-               flags |= SKIP_GONE_DEVS;
  
         /* check if 'fd' an opened container */
-       sra = sysfs_read(fd, 0, flags);
+       sra = sysfs_read(fd, 0, GET_LEVEL|GET_VERSION|GET_DEVS|GET_STATE);
         if (!sra)
                 return 1;
  
         if (sra->array.major_version != -1 ||
             sra->array.minor_version != -2 ||
-           strcmp(sra->text_version, "imsm") != 0)
-               return 1;
-
+           strcmp(sra->text_version, "imsm") != 0) {
+               err = 1;
+               goto error;
+       }
         /* load all mpbs */
         for (sd = sra->devs, i = 0; sd; sd = sd->next, i++) {
-               struct intel_super *s = alloc_super(0);
-               char nm[20];
+               struct intel_super *s = alloc_super();
+               char nm[32];
                 int dfd;
+               int rv;
  
                 err = 1;
                 if (!s)
@@ -2504,22 +3304,25 @@ static int load_super_imsm_all(struct supertype *st, int fd, void **sbp,
  
                 err = 2;
                 sprintf(nm, "%d:%d", sd->disk.major, sd->disk.minor);
-               dfd = dev_open(nm, keep_fd ? O_RDWR : O_RDONLY);
+               dfd = dev_open(nm, O_RDWR);
                 if (dfd < 0)
                         goto error;
  
-               err = load_and_parse_mpb(dfd, s, NULL, keep_fd);
+               rv = find_intel_hba_capability(dfd, s, devname);
+               /* no orom/efi or non-intel hba of the disk */
+               if (rv != 0)
+                       goto error;
+
+               err = load_and_parse_mpb(dfd, s, NULL, 1);
  
                 /* retry the load if we might have raced against mdmon */
                 if (err == 3 && mdmon_running(devnum))
                         for (retry = 0; retry < 3; retry++) {
                                 usleep(3000);
-                               err = load_and_parse_mpb(dfd, s, NULL, keep_fd);
+                               err = load_and_parse_mpb(dfd, s, NULL, 1);
                                 if (err != 3)
                                         break;
                         }
-               if (!keep_fd)
-                       close(dfd);
                 if (err)
                         goto error;
         }
@@ -2536,16 +3339,6 @@ static int load_super_imsm_all(struct supertype *st, int fd, void **sbp,
                 err = 2;
                 goto error;
         }
-
-       if (st->subarray[0]) {
-               if (atoi(st->subarray) <= super->anchor->num_raid_devs)
-                       super->current_vol = atoi(st->subarray);
-               else {
-                       free_imsm(super);
-                       err = 1;
-                       goto error;
-               }
-       }
         err = 0;
  
   error:
@@ -2555,6 +3348,7 @@ static int load_super_imsm_all(struct supertype *st, int fd, void **sbp,
                 super_list = super_list->next;
                 free_imsm(s);
         }
+       sysfs_free(sra);
  
         if (err)
                 return err;
@@ -2566,10 +3360,13 @@ static int load_super_imsm_all(struct supertype *st, int fd, void **sbp,
                 st->minor_version = 0;
                 st->max_devs = IMSM_MAX_DEVICES;
         }
-       st->loaded_container = 1;
-
         return 0;
  }
+
+static int load_container_imsm(struct supertype *st, int fd, char *devname)
+{
+       return load_super_imsm_all(st, fd, &st->sb, devname);
+}
  #endif
  
  static int load_super_imsm(struct supertype *st, int fd, char *devname)
@@ -2577,21 +3374,32 @@ static int load_super_imsm(struct supertype *st, int fd, char *devname)
         struct intel_super *super;
         int rv;
  
-#ifndef MDASSEMBLE
-       if (load_super_imsm_all(st, fd, &st->sb, devname, 1) == 0)
-               return 0;
-#endif
+       if (test_partition(fd))
+               /* IMSM not allowed on partitions */
+               return 1;
  
         free_super_imsm(st);
  
-       super = alloc_super(0);
+       super = alloc_super();
         if (!super) {
                 fprintf(stderr,
                         Name ": malloc of %zu failed.\n",
                         sizeof(*super));
                 return 1;
         }
-
+       /* Load hba and capabilities if they exist.
+        * But do not preclude loading metadata in case capabilities or hba are
+        * non-compliant and ignore_hw_compat is set.
+        */
+       rv = find_intel_hba_capability(fd, super, devname);
+       /* no orom/efi or non-intel hba of the disk */
+       if ((rv != 0) && (st->ignore_hw_compat == 0)) {
+               if (devname)
+                       fprintf(stderr,
+                               Name ": No OROM/EFI properties for %s\n", devname);
+               free_imsm(super);
+               return 2;
+       }
         rv = load_and_parse_mpb(fd, super, devname, 0);
  
         if (rv) {
@@ -2603,23 +3411,12 @@ static int load_super_imsm(struct supertype *st, int fd, char *devname)
                 return rv;
         }
  
-       if (st->subarray[0]) {
-               if (atoi(st->subarray) <= super->anchor->num_raid_devs)
-                       super->current_vol = atoi(st->subarray);
-               else {
-                       free_imsm(super);
-                       return 1;
-               }
-       }
-
         st->sb = super;
         if (st->ss == NULL) {
                 st->ss = &super_imsm;
                 st->minor_version = 0;
                 st->max_devs = IMSM_MAX_DEVICES;
         }
-       st->loaded_container = 0;
-
         return 0;
  }
  
@@ -2695,6 +3492,30 @@ static void imsm_update_version_info(struct intel_super *super)
         }
  }
  
+static int check_name(struct intel_super *super, char *name, int quiet)
+{
+       struct imsm_super *mpb = super->anchor;
+       char *reason = NULL;
+       int i;
+
+       if (strlen(name) > MAX_RAID_SERIAL_LEN)
+               reason = "must be 16 characters or less";
+
+       for (i = 0; i < mpb->num_raid_devs; i++) {
+               struct imsm_dev *dev = get_imsm_dev(super, i);
+
+               if (strncmp((char *) dev->volume, name, MAX_RAID_SERIAL_LEN) == 0) {
+                       reason = "already exists";
+                       break;
+               }
+       }
+
+       if (reason && !quiet)
+               fprintf(stderr, Name ": imsm volume name %s\n", reason);
+
+       return !reason;
+}
+
  static int init_super_imsm_volume(struct supertype *st, mdu_array_info_t *info,
                                   unsigned long long size, char *name,
                                   char *homehost, int *uuid)
@@ -2746,28 +3567,20 @@ static int init_super_imsm_volume(struct supertype *st, mdu_array_info_t *info,
         if (super->current_vol == 0)
                 mpb->num_disks = 0;
  
-       for (i = 0; i < super->current_vol; i++) {
-               dev = get_imsm_dev(super, i);
-               if (strncmp((char *) dev->volume, name,
-                            MAX_RAID_SERIAL_LEN) == 0) {
-                       fprintf(stderr, Name": '%s' is already defined for this container\n",
-                               name);
-                       return 0;
-               }
-       }
-
-       sprintf(st->subarray, "%d", idx);
+       if (!check_name(super, name, 0))
+               return 0;
         dv = malloc(sizeof(*dv));
         if (!dv) {
                 fprintf(stderr, Name ": failed to allocate device list entry\n");
                 return 0;
         }
-       dev = malloc(sizeof(*dev) + sizeof(__u32) * (info->raid_disks - 1));
+       dev = calloc(1, sizeof(*dev) + sizeof(__u32) * (info->raid_disks - 1));
         if (!dev) {
                 free(dv);
                 fprintf(stderr, Name": could not allocate raid device\n");
                 return 0;
         }
+
         strncpy((char *) dev->volume, name, MAX_RAID_SERIAL_LEN);
         if (info->level == 1)
                 array_blocks = info_to_blocks_per_member(info);
@@ -2780,8 +3593,7 @@ static int init_super_imsm_volume(struct supertype *st, mdu_array_info_t *info,
  
         dev->size_low = __cpu_to_le32((__u32) array_blocks);
         dev->size_high = __cpu_to_le32((__u32) (array_blocks >> 32));
-       dev->status = __cpu_to_le32(0);
-       dev->reserved_blocks = __cpu_to_le32(0);
+       dev->status = (DEV_READ_COALESCING | DEV_WRITE_COALESCING);
         vol = &dev->vol;
         vol->migr_state = 0;
         set_migr_type(dev, MIGR_INIT);
@@ -2797,6 +3609,8 @@ static int init_super_imsm_volume(struct supertype *st, mdu_array_info_t *info,
         map->ddf = 1;
  
         if (info->level == 1 && info->raid_disks > 2) {
+               free(dev);
+               free(dv);
                 fprintf(stderr, Name": imsm does not support more than 2 disks"
                                 "in a raid1 volume\n");
                 return 0;
@@ -2817,7 +3631,7 @@ static int init_super_imsm_volume(struct supertype *st, mdu_array_info_t *info,
         map->num_members = info->raid_disks;
         for (i = 0; i < map->num_members; i++) {
                 /* initialized in add_to_super */
-               set_imsm_ord_tbl_ent(map, i, 0);
+               set_imsm_ord_tbl_ent(map, i, IMSM_ORD_REBUILD);
         }
         mpb->num_raid_devs++;
  
@@ -2856,7 +3670,7 @@ static int init_super_imsm(struct supertype *st, mdu_array_info_t *info,
         else
                 mpb_size = 512;
  
-       super = alloc_super(1);
+       super = alloc_super();
         if (super && posix_memalign(&super->buf, 512, mpb_size) != 0) {
                 free(super);
                 super = NULL;
@@ -2895,6 +3709,7 @@ static int add_to_super_imsm_volume(struct supertype *st, mdu_disk_info_t *dk,
         struct dl *dl;
         struct imsm_dev *dev;
         struct imsm_map *map;
+       int slot;
  
         dev = get_imsm_dev(super, super->current_vol);
         map = get_imsm_map(dev, 0);
@@ -2929,6 +3744,14 @@ static int add_to_super_imsm_volume(struct supertype *st, mdu_disk_info_t *dk,
                 dl->index = super->anchor->num_disks;
                 super->anchor->num_disks++;
         }
+       /* Check the device has not already been added */
+       slot = get_imsm_disk_slot(map, dl->index);
+       if (slot >= 0 &&
+           (get_imsm_ord_tbl_ent(dev, slot, -1) & IMSM_ORD_REBUILD) == 0) {
+               fprintf(stderr, Name ": %s has been included in this array twice\n",
+                       devname);
+               return 1;
+       }
         set_imsm_ord_tbl_ent(map, dk->number, dl->index);
         dl->disk.status = CONFIGURED_DISK;
  
@@ -2938,6 +3761,10 @@ static int add_to_super_imsm_volume(struct supertype *st, mdu_disk_info_t *dk,
                 struct imsm_dev *_dev = __get_imsm_dev(mpb, 0);
                 struct imsm_disk *_disk = __get_imsm_disk(mpb, dl->index);
  
+               if (!_dev || !_disk) {
+                       fprintf(stderr, Name ": BUG mpb setup error\n");
+                       return 1;
+               }
                 *_dev = *dev;
                 *_disk = dl->disk;
                 sum = random32();
@@ -2949,8 +3776,9 @@ static int add_to_super_imsm_volume(struct supertype *st, mdu_disk_info_t *dk,
         return 0;
  }
  
+
  static int add_to_super_imsm(struct supertype *st, mdu_disk_info_t *dk,
-                             int fd, char *devname)
+                            int fd, char *devname)
  {
         struct intel_super *super = st->sb;
         struct dl *dd;
@@ -2959,13 +3787,16 @@ static int add_to_super_imsm(struct supertype *st, mdu_disk_info_t *dk,
         int rv;
         struct stat stb;
  
-       /* if we are on an RAID enabled platform check that the disk is
-        * attached to the raid controller
+       /* If we are on an RAID enabled platform check that the disk is
+        * attached to the raid controller.
+        * We do not need to test disks attachment for container based additions,
+        * they shall be already tested when container was created/assembled.
          */
-       if (super->hba && !disk_attached_to_hba(fd, super->hba)) {
-               fprintf(stderr,
-                       Name ": %s is not attached to the raid controller: %s\n",
-                       devname ? : "disk", super->hba);
+       rv = find_intel_hba_capability(fd, super, devname);
+       /* no orom/efi or non-intel hba of the disk */
+       if (rv != 0) {
+               dprintf("capability: %p fd: %d ret: %d\n",
+                       super->orom, fd, rv);
                 return 1;
         }
  
@@ -2986,6 +3817,7 @@ static int add_to_super_imsm(struct supertype *st, mdu_disk_info_t *dk,
         dd->devname = devname ? strdup(devname) : NULL;
         dd->fd = fd;
         dd->e = NULL;
+       dd->action = DISK_ADD;
         rv = imsm_read_serial(fd, devname, dd->serial);
         if (rv) {
                 fprintf(stderr,
@@ -3005,12 +3837,50 @@ static int add_to_super_imsm(struct supertype *st, mdu_disk_info_t *dk,
                 dd->disk.scsi_id = __cpu_to_le32(0);
  
         if (st->update_tail) {
-               dd->next = super->add;
-               super->add = dd;
+               dd->next = super->disk_mgmt_list;
+               super->disk_mgmt_list = dd;
         } else {
                 dd->next = super->disks;
                 super->disks = dd;
+               super->updates_pending++;
+       }
+
+       return 0;
+}
+
+
+static int remove_from_super_imsm(struct supertype *st, mdu_disk_info_t *dk)
+{
+       struct intel_super *super = st->sb;
+       struct dl *dd;
+
+       /* remove from super works only in mdmon - for communication
+        * manager - monitor. Check if communication memory buffer
+        * is prepared.
+        */
+       if (!st->update_tail) {
+               fprintf(stderr,
+                       Name ": %s shall be used in mdmon context only"
+                       "(line %d).\n", __func__, __LINE__);
+               return 1;
+       }
+       dd = malloc(sizeof(*dd));
+       if (!dd) {
+               fprintf(stderr,
+                       Name ": malloc failed %s:%d.\n", __func__, __LINE__);
+               return 1;
         }
+       memset(dd, 0, sizeof(*dd));
+       dd->major = dk->major;
+       dd->minor = dk->minor;
+       dd->index = -1;
+       dd->fd = -1;
+       dd->disk.status = SPARE_DISK;
+       dd->action = DISK_REMOVE;
+
+       dd->next = super->disk_mgmt_list;
+       super->disk_mgmt_list = dd;
+
  
         return 0;
  }
@@ -3068,8 +3938,9 @@ static int write_super_imsm_spares(struct intel_super *super, int doclose)
         return 0;
  }
  
-static int write_super_imsm(struct intel_super *super, int doclose)
+static int write_super_imsm(struct supertype *st, int doclose)
  {
+       struct intel_super *super = st->sb;
         struct imsm_super *mpb = super->anchor;
         struct dl *d;
         __u32 generation;
@@ -3077,6 +3948,7 @@ static int write_super_imsm(struct intel_super *super, int doclose)
         int spares = 0;
         int i;
         __u32 mpb_size = sizeof(struct imsm_super) - sizeof(struct imsm_disk);
+       int num_disks = 0;
  
         /* 'generation' is incremented everytime the metadata is written */
         generation = __le32_to_cpu(mpb->generation_num);
@@ -3089,21 +3961,28 @@ static int write_super_imsm(struct intel_super *super, int doclose)
         if (mpb->orig_family_num == 0)
                 mpb->orig_family_num = mpb->family_num;
  
-       mpb_size += sizeof(struct imsm_disk) * mpb->num_disks;
         for (d = super->disks; d; d = d->next) {
                 if (d->index == -1)
                         spares++;
-               else
+               else {
                         mpb->disk[d->index] = d->disk;
+                       num_disks++;
+               }
         }
-       for (d = super->missing; d; d = d->next)
+       for (d = super->missing; d; d = d->next) {
                 mpb->disk[d->index] = d->disk;
+               num_disks++;
+       }
+       mpb->num_disks = num_disks;
+       mpb_size += sizeof(struct imsm_disk) * mpb->num_disks;
  
         for (i = 0; i < mpb->num_raid_devs; i++) {
                 struct imsm_dev *dev = __get_imsm_dev(mpb, i);
-
-               imsm_copy_dev(dev, get_imsm_dev(super, i));
-               mpb_size += sizeof_imsm_dev(dev, 0);
+               struct imsm_dev *dev2 = get_imsm_dev(super, i);
+               if (dev && dev2) {
+                       imsm_copy_dev(dev, dev2);
+                       mpb_size += sizeof_imsm_dev(dev, 0);
+               }
         }
         mpb_size += __le32_to_cpu(mpb->bbm_log_size);
         mpb->mpb_size = __cpu_to_le32(mpb_size);
@@ -3157,7 +4036,7 @@ static int create_array(struct supertype *st, int dev_idx)
         imsm_copy_dev(&u->dev, dev);
         inf = get_disk_info(u);
         for (i = 0; i < map->num_members; i++) {
-               int idx = get_imsm_disk_idx(dev, i);
+               int idx = get_imsm_disk_idx(dev, i, -1);
  
                 disk = get_imsm_disk(super, idx);
                 serialcpy(inf[i].serial, disk->serial);
@@ -3167,13 +4046,13 @@ static int create_array(struct supertype *st, int dev_idx)
         return 0;
  }
  
-static int _add_disk(struct supertype *st)
+static int mgmt_disk(struct supertype *st)
  {
         struct intel_super *super = st->sb;
         size_t len;
-       struct imsm_update_add_disk *u;
+       struct imsm_update_add_remove_disk *u;
  
-       if (!super->add)
+       if (!super->disk_mgmt_list)
                 return 0;
  
         len = sizeof(*u);
@@ -3184,7 +4063,7 @@ static int _add_disk(struct supertype *st)
                 return 1;
         }
  
-       u->type = update_add_disk;
+       u->type = update_add_remove_disk;
         append_metadata_update(st, u, len);
  
         return 0;
@@ -3201,26 +4080,24 @@ static int write_init_super_imsm(struct supertype *st)
         if (st->update_tail) {
                 /* queue the recently created array / added disk
                  * as a metadata update */
-               struct dl *d;
                 int rv;
  
                 /* determine if we are creating a volume or adding a disk */
                 if (current_vol < 0) {
-                       /* in the add disk case we are running in mdmon
-                        * context, so don't close fd's
+                       /* in the mgmt (add/remove) disk case we are running
+                        * in mdmon context, so don't close fd's
                          */
-                       return _add_disk(st);
+                       return mgmt_disk(st);
                 } else
                         rv = create_array(st, current_vol);
  
-               for (d = super->disks; d ; d = d->next) {
-                       close(d->fd);
-                       d->fd = -1;
-               }
-
                 return rv;
-       } else
-               return write_super_imsm(st->sb, 1);
+       } else {
+               struct dl *d;
+               for (d = super->disks; d; d = d->next)
+                       Kill(d->devname, NULL, 0, 1, 1);
+               return write_super_imsm(st, 1);
+       }
  }
  #endif
  
@@ -3253,25 +4130,14 @@ static int validate_geometry_imsm_container(struct supertype *st, int level,
  {
         int fd;
         unsigned long long ldsize;
-       const struct imsm_orom *orom;
+       struct intel_super *super=NULL;
+       int rv = 0;
  
         if (level != LEVEL_CONTAINER)
                 return 0;
         if (!dev)
                 return 1;
  
-       if (check_env("IMSM_NO_PLATFORM"))
-               orom = NULL;
-       else
-               orom = find_imsm_orom();
-       if (orom && raiddisks > orom->tds) {
-               if (verbose)
-                       fprintf(stderr, Name ": %d exceeds maximum number of"
-                               " platform supported disks: %d\n",
-                               raiddisks, orom->tds);
-               return 0;
-       }
-
         fd = open(dev, O_RDONLY|O_EXCL, 0);
         if (fd < 0) {
                 if (verbose)
@@ -3283,9 +4149,45 @@ static int validate_geometry_imsm_container(struct supertype *st, int level,
                 close(fd);
                 return 0;
         }
+
+       /* capabilities retrieve could be possible
+        * note that there is no fd for the disks in array.
+        */
+       super = alloc_super();
+       if (!super) {
+               fprintf(stderr,
+                       Name ": malloc of %zu failed.\n",
+                       sizeof(*super));
+               close(fd);
+               return 0;
+       }
+
+       rv = find_intel_hba_capability(fd, super, verbose ? dev : NULL);
+       if (rv != 0) {
+#if DEBUG
+               char str[256];
+               fd2devname(fd, str);
+               dprintf("validate_geometry_imsm_container: fd: %d %s orom: %p rv: %d raiddisk: %d\n",
+                       fd, str, super->orom, rv, raiddisks);
+#endif
+               /* no orom/efi or non-intel hba of the disk */
+               close(fd);
+               free_imsm(super);
+               return 0;
+       }
         close(fd);
+       if (super->orom && raiddisks > super->orom->tds) {
+               if (verbose)
+                       fprintf(stderr, Name ": %d exceeds maximum number of"
+                               " platform supported disks: %d\n",
+                               raiddisks, super->orom->tds);
+
+               free_imsm(super);
+               return 0;
+       }
  
         *freesize = avail_size_imsm(st, ldsize >> 9);
+       free_imsm(super);
  
         return 1;
  }
@@ -3333,7 +4235,7 @@ static unsigned long long merge_extents(struct intel_super *super, int sum_exten
         unsigned long reserve;
  
         if (!e)
-               return ~0ULL; /* error */
+               return 0;
  
         /* coalesce and sort all extents. also, check to see if we need to
          * reserve space between member arrays
@@ -3376,17 +4278,23 @@ static unsigned long long merge_extents(struct intel_super *super, int sum_exten
         } while (e[i-1].size);
         free(e);
  
+       if (maxsize == 0)
+               return 0;
+
+       /* FIXME assumes volume at offset 0 is the first volume in a
+        * container
+        */
         if (start_extent > 0)
                 reserve = IMSM_RESERVED_SECTORS; /* gap between raid regions */
         else
                 reserve = 0;
  
         if (maxsize < reserve)
-               return ~0ULL;
+               return 0;
  
         super->create_offset = ~((__u32) 0);
         if (start + reserve > super->create_offset)
-               return ~0ULL; /* start overflows create_offset */
+               return 0; /* start overflows create_offset */
         super->create_offset = start + reserve;
  
         return maxsize - reserve;
@@ -3414,12 +4322,61 @@ static int is_raid_level_supported(const struct imsm_orom *orom, int level, int
         return 0;
  }
  
+
  #define pr_vrb(fmt, arg...) (void) (verbose && fprintf(stderr, Name fmt, ##arg))
+/*
+ * validate volume parameters with OROM/EFI capabilities
+ */
+static int
+validate_geometry_imsm_orom(struct intel_super *super, int level, int layout,
+                           int raiddisks, int *chunk, int verbose)
+{
+#if DEBUG
+       verbose = 1;
+#endif
+       /* validate container capabilities */
+       if (super->orom && raiddisks > super->orom->tds) {
+               if (verbose)
+                       fprintf(stderr, Name ": %d exceeds maximum number of"
+                               " platform supported disks: %d\n",
+                               raiddisks, super->orom->tds);
+               return 0;
+       }
+
+        /* capabilities of OROM tested - copied from validate_geometry_imsm_volume */
+       if (super->orom && (!is_raid_level_supported(super->orom, level,
+                                                    raiddisks))) {
+               pr_vrb(": platform does not support raid%d with %d disk%s\n",
+                       level, raiddisks, raiddisks > 1 ? "s" : "");
+               return 0;
+       }
+       if (super->orom && level != 1) {
+               if (chunk && (*chunk == 0 || *chunk == UnSet))
+                       *chunk = imsm_orom_default_chunk(super->orom);
+               else if (chunk && !imsm_orom_has_chunk(super->orom, *chunk)) {
+                       pr_vrb(": platform does not support a chunk size of: "
+                              "%d\n", *chunk);
+                       return 0;
+               }
+       }
+       if (layout != imsm_level_to_layout(level)) {
+               if (level == 5)
+                       pr_vrb(": imsm raid 5 only supports the left-asymmetric layout\n");
+               else if (level == 10)
+                       pr_vrb(": imsm raid 10 only supports the n2 layout\n");
+               else
+                       pr_vrb(": imsm unknown layout %#x for this raid level %d\n",
+                               layout, level);
+               return 0;
+       }
+       return 1;
+}
+
  /* validate_geometry_imsm_volume - lifted from validate_geometry_ddf_bvd 
   * FIX ME add ahci details
   */
  static int validate_geometry_imsm_volume(struct supertype *st, int level,
-                                        int layout, int raiddisks, int chunk,
+                                        int layout, int raiddisks, int *chunk,
                                          unsigned long long size, char *dev,
                                          unsigned long long *freesize,
                                          int verbose)
@@ -3437,34 +4394,18 @@ static int validate_geometry_imsm_volume(struct supertype *st, int level,
         if (!super)
                 return 0;
  
-       if (!is_raid_level_supported(super->orom, level, raiddisks)) {
-               pr_vrb(": platform does not support raid%d with %d disk%s\n",
-                       level, raiddisks, raiddisks > 1 ? "s" : "");
-               return 0;
-       }
-       if (super->orom && level != 1 &&
-           !imsm_orom_has_chunk(super->orom, chunk)) {
-               pr_vrb(": platform does not support a chunk size of: %d\n", chunk);
-               return 0;
-       }
-       if (layout != imsm_level_to_layout(level)) {
-               if (level == 5)
-                       pr_vrb(": imsm raid 5 only supports the left-asymmetric layout\n");
-               else if (level == 10)
-                       pr_vrb(": imsm raid 10 only supports the n2 layout\n");
-               else
-                       pr_vrb(": imsm unknown layout %#x for this raid level %d\n",
-                               layout, level);
+       if (!validate_geometry_imsm_orom(super, level, layout, raiddisks, chunk, verbose)) {
+               fprintf(stderr, Name ": RAID gemetry validation failed. "
+                       "Cannot proceed with the action(s).\n");
                 return 0;
         }
-
         if (!dev) {
                 /* General test:  make sure there is space for
                  * 'raiddisks' device extents of size 'size' at a given
                  * offset
                  */
                 unsigned long long minsize = size;
-               unsigned long long start_offset = ~0ULL;
+               unsigned long long start_offset = MaxSector;
                 int dcnt = 0;
                 if (minsize == 0)
                         minsize = MPB_SECTOR_CNT + IMSM_RESERVED_SECTORS;
@@ -3480,7 +4421,7 @@ static int validate_geometry_imsm_volume(struct supertype *st, int level,
                                 esize = e[i].start - pos;
                                 if (esize >= minsize)
                                         found = 1;
-                               if (found && start_offset == ~0ULL) {
+                               if (found && start_offset == MaxSector) {
                                         start_offset = pos;
                                         break;
                                 } else if (found && pos != start_offset) {
@@ -3511,8 +4452,8 @@ static int validate_geometry_imsm_volume(struct supertype *st, int level,
         if ((S_IFMT & stb.st_mode) != S_IFBLK)
                 return 0;
         for (dl = super->disks ; dl ; dl = dl->next) {
-               if (dl->major == major(stb.st_rdev) &&
-                   dl->minor == minor(stb.st_rdev))
+               if (dl->major == (int)major(stb.st_rdev) &&
+                   dl->minor == (int)minor(stb.st_rdev))
                         break;
         }
         if (!dl) {
@@ -3569,15 +4510,11 @@ static int validate_geometry_imsm_volume(struct supertype *st, int level,
                         i += dl->extent_cnt;
  
         maxsize = merge_extents(super, i);
-       if (maxsize < size) {
+       if (maxsize < size || maxsize == 0) {
                 if (verbose)
                         fprintf(stderr, Name ": not enough space after merge (%llu < %llu)\n",
                                 maxsize, size);
                 return 0;
-       } else if (maxsize == ~0ULL) {
-               if (verbose)
-                       fprintf(stderr, Name ": failed to merge %d extents\n", i);
-               return 0;
         }
  
         *freesize = maxsize;
@@ -3630,11 +4567,13 @@ static int reserve_space(struct supertype *st, int raiddisks,
         maxsize = merge_extents(super, extent_cnt);
         minsize = size;
         if (size == 0)
-               minsize = chunk;
+               /* chunk is in K */
+               minsize = chunk * 2;
  
         if (cnt < raiddisks ||
             (super->orom && used && used != raiddisks) ||
-           maxsize < minsize) {
+           maxsize < minsize ||
+           maxsize == 0) {
                 fprintf(stderr, Name ": not enough devices with space to create array.\n");
                 return 0; /* No enough free spaces large enough */
         }
@@ -3642,8 +4581,8 @@ static int reserve_space(struct supertype *st, int raiddisks,
         if (size == 0) {
                 size = maxsize;
                 if (chunk) {
-                       size /= chunk;
-                       size *= chunk;
+                       size /= 2 * chunk;
+                       size *= 2 * chunk;
                 }
         }
  
@@ -3658,20 +4597,23 @@ static int reserve_space(struct supertype *st, int raiddisks,
  }
  
  static int validate_geometry_imsm(struct supertype *st, int level, int layout,
-                                 int raiddisks, int chunk, unsigned long long size,
+                                 int raiddisks, int *chunk, unsigned long long size,
                                   char *dev, unsigned long long *freesize,
                                   int verbose)
  {
         int fd, cfd;
         struct mdinfo *sra;
+       int is_member = 0;
  
-       /* if given unused devices create a container 
+       /* load capability
+        * if given unused devices create a container
          * if given given devices in a container create a member volume
          */
         if (level == LEVEL_CONTAINER) {
                 /* Must be a fresh device to add to a container */
                 return validate_geometry_imsm_container(st, level, layout,
-                                                       raiddisks, chunk, size,
+                                                       raiddisks,
+                                                       chunk?*chunk:0, size,
                                                         dev, freesize,
                                                         verbose);
         }
@@ -3686,7 +4628,12 @@ static int validate_geometry_imsm(struct supertype *st, int level, int layout,
                          * created.  add_to_super and getinfo_super
                          * detect when autolayout is in progress.
                          */
-                       return reserve_space(st, raiddisks, size, chunk, freesize);
+                       if (!validate_geometry_imsm_orom(st->sb, level, layout,
+                                                        raiddisks, chunk,
+                                                        verbose))
+                               return 0;
+                       return reserve_space(st, raiddisks, size,
+                                            chunk?*chunk:0, freesize);
                 }
                 return 1;
         }
@@ -3697,18 +4644,6 @@ static int validate_geometry_imsm(struct supertype *st, int level, int layout,
                                                      dev, freesize, verbose);
         }
  
-       /* limit creation to the following levels */
-       if (!dev)
-               switch (level) {
-               case 0:
-               case 1:
-               case 10:
-               case 5:
-                       break;
-               default:
-                       return 1;
-               }
-
         /* This device needs to be a device in an 'imsm' container */
         fd = open(dev, O_RDONLY|O_EXCL, 0);
         if (fd >= 0) {
@@ -3727,23 +4662,25 @@ static int validate_geometry_imsm(struct supertype *st, int level, int layout,
         }
         /* Well, it is in use by someone, maybe an 'imsm' container. */
         cfd = open_container(fd);
+       close(fd);
         if (cfd < 0) {
-               close(fd);
                 if (verbose)
                         fprintf(stderr, Name ": Cannot use %s: It is busy\n",
                                 dev);
                 return 0;
         }
         sra = sysfs_read(cfd, 0, GET_VERSION);
-       close(fd);
         if (sra && sra->array.major_version == -1 &&
-           strcmp(sra->text_version, "imsm") == 0) {
+           strcmp(sra->text_version, "imsm") == 0)
+               is_member = 1;
+       sysfs_free(sra);
+       if (is_member) {
                 /* This is a member of a imsm container.  Load the container
                  * and try to create a volume
                  */
                 struct intel_super *super;
  
-               if (load_super_imsm_all(st, cfd, (void **) &super, NULL, 1) == 0) {
+               if (load_super_imsm_all(st, cfd, (void **) &super, NULL) == 0) {
                         st->sb = super;
                         st->container_dev = fd2devnum(cfd);
                         close(cfd);
@@ -3752,101 +4689,350 @@ static int validate_geometry_imsm(struct supertype *st, int level, int layout,
                                                              size, dev,
                                                              freesize, verbose);
                 }
-               close(cfd);
-       } else /* may belong to another container */
-               return 0;
+       }
  
-       return 1;
+       if (verbose)
+               fprintf(stderr, Name ": failed container membership check\n");
+
+       close(cfd);
+       return 0;
  }
-#endif /* MDASSEMBLE */
  
-static struct mdinfo *container_content_imsm(struct supertype *st)
+static void default_geometry_imsm(struct supertype *st, int *level, int *layout, int *chunk)
  {
-       /* Given a container loaded by load_super_imsm_all,
-        * extract information about all the arrays into
-        * an mdinfo tree.
-        *
-        * For each imsm_dev create an mdinfo, fill it in,
-        *  then look for matching devices in super->disks
-        *  and create appropriate device mdinfo.
-        */
         struct intel_super *super = st->sb;
+
+       if (level && *level == UnSet)
+               *level = LEVEL_CONTAINER;
+
+       if (level && layout && *layout == UnSet)
+               *layout = imsm_level_to_layout(*level);
+
+       if (chunk && (*chunk == UnSet || *chunk == 0) && 
+           super && super->orom)
+               *chunk = imsm_orom_default_chunk(super->orom);
+}
+
+static void handle_missing(struct intel_super *super, struct imsm_dev *dev);
+
+static int kill_subarray_imsm(struct supertype *st)
+{
+       /* remove the subarray currently referenced by ->current_vol */
+       __u8 i;
+       struct intel_dev **dp;
+       struct intel_super *super = st->sb;
+       __u8 current_vol = super->current_vol;
         struct imsm_super *mpb = super->anchor;
-       struct mdinfo *rest = NULL;
-       int i;
  
-       /* do not assemble arrays that might have bad blocks */
-       if (imsm_bbm_log_size(super->anchor)) {
-               fprintf(stderr, Name ": BBM log found in metadata. "
-                               "Cannot activate array(s).\n");
-               return NULL;
-       }
+       if (super->current_vol < 0)
+               return 2;
+       super->current_vol = -1; /* invalidate subarray cursor */
  
+       /* block deletions that would change the uuid of active subarrays
+        *
+        * FIXME when immutable ids are available, but note that we'll
+        * also need to fixup the invalidated/active subarray indexes in
+        * mdstat
+        */
         for (i = 0; i < mpb->num_raid_devs; i++) {
-               struct imsm_dev *dev = get_imsm_dev(super, i);
-               struct imsm_map *map = get_imsm_map(dev, 0);
-               struct mdinfo *this;
-               int slot;
+               char subarray[4];
  
-               /* do not publish arrays that are in the middle of an
-                * unsupported migration
-                */
-               if (dev->vol.migr_state &&
-                   (migr_type(dev) == MIGR_GEN_MIGR ||
-                    migr_type(dev) == MIGR_STATE_CHANGE)) {
-                       fprintf(stderr, Name ": cannot assemble volume '%.16s':"
-                               " unsupported migration in progress\n",
-                               dev->volume);
+               if (i < current_vol)
                         continue;
+               sprintf(subarray, "%u", i);
+               if (is_subarray_active(subarray, st->devname)) {
+                       fprintf(stderr,
+                               Name ": deleting subarray-%d would change the UUID of active subarray-%d, aborting\n",
+                               current_vol, i);
+
+                       return 2;
                 }
+       }
  
-               this = malloc(sizeof(*this));
-               memset(this, 0, sizeof(*this));
-               this->next = rest;
+       if (st->update_tail) {
+               struct imsm_update_kill_array *u = malloc(sizeof(*u));
  
-               super->current_vol = i;
-               getinfo_super_imsm_volume(st, this);
-               for (slot = 0 ; slot <  map->num_members; slot++) {
-                       struct mdinfo *info_d;
-                       struct dl *d;
-                       int idx;
-                       int skip;
-                       __u32 ord;
+               if (!u)
+                       return 2;
+               u->type = update_kill_array;
+               u->dev_idx = current_vol;
+               append_metadata_update(st, u, sizeof(*u));
  
-                       skip = 0;
-                       idx = get_imsm_disk_idx(dev, slot);
-                       ord = get_imsm_ord_tbl_ent(dev, slot); 
-                       for (d = super->disks; d ; d = d->next)
-                               if (d->index == idx)
-                                        break;
+               return 0;
+       }
  
-                       if (d == NULL)
-                               skip = 1;
-                       if (d && is_failed(&d->disk))
-                               skip = 1;
-                       if (ord & IMSM_ORD_REBUILD)
-                               skip = 1;
+       for (dp = &super->devlist; *dp;)
+               if ((*dp)->index == current_vol) {
+                       *dp = (*dp)->next;
+               } else {
+                       handle_missing(super, (*dp)->dev);
+                       if ((*dp)->index > current_vol)
+                               (*dp)->index--;
+                       dp = &(*dp)->next;
+               }
  
-                       /* 
-                        * if we skip some disks the array will be assmebled degraded;
-                        * reset resync start to avoid a dirty-degraded situation
-                        *
-                        * FIXME handle dirty degraded
-                        */
-                       if (skip && !dev->vol.dirty)
-                               this->resync_start = ~0ULL;
-                       if (skip)
+       /* no more raid devices, all active components are now spares,
+        * but of course failed are still failed
+        */
+       if (--mpb->num_raid_devs == 0) {
+               struct dl *d;
+
+               for (d = super->disks; d; d = d->next)
+                       if (d->index > -2) {
+                               d->index = -1;
+                               d->disk.status = SPARE_DISK;
+                       }
+       }
+
+       super->updates_pending++;
+
+       return 0;
+}
+
+static int update_subarray_imsm(struct supertype *st, char *subarray,
+                               char *update, struct mddev_ident *ident)
+{
+       /* update the subarray currently referenced by ->current_vol */
+       struct intel_super *super = st->sb;
+       struct imsm_super *mpb = super->anchor;
+
+       if (strcmp(update, "name") == 0) {
+               char *name = ident->name;
+               char *ep;
+               int vol;
+
+               if (is_subarray_active(subarray, st->devname)) {
+                       fprintf(stderr,
+                               Name ": Unable to update name of active subarray\n");
+                       return 2;
+               }
+
+               if (!check_name(super, name, 0))
+                       return 2;
+
+               vol = strtoul(subarray, &ep, 10);
+               if (*ep != '\0' || vol >= super->anchor->num_raid_devs)
+                       return 2;
+
+               if (st->update_tail) {
+                       struct imsm_update_rename_array *u = malloc(sizeof(*u));
+
+                       if (!u)
+                               return 2;
+                       u->type = update_rename_array;
+                       u->dev_idx = vol;
+                       snprintf((char *) u->name, MAX_RAID_SERIAL_LEN, "%s", name);
+                       append_metadata_update(st, u, sizeof(*u));
+               } else {
+                       struct imsm_dev *dev;
+                       int i;
+
+                       dev = get_imsm_dev(super, vol);
+                       snprintf((char *) dev->volume, MAX_RAID_SERIAL_LEN, "%s", name);
+                       for (i = 0; i < mpb->num_raid_devs; i++) {
+                               dev = get_imsm_dev(super, i);
+                               handle_missing(super, dev);
+                       }
+                       super->updates_pending++;
+               }
+       } else
+               return 2;
+
+       return 0;
+}
+
+static int is_gen_migration(struct imsm_dev *dev)
+{
+       if (!dev->vol.migr_state)
+               return 0;
+
+       if (migr_type(dev) == MIGR_GEN_MIGR)
+               return 1;
+
+       return 0;
+}
+#endif /* MDASSEMBLE */
+
+static int is_rebuilding(struct imsm_dev *dev)
+{
+       struct imsm_map *migr_map;
+
+       if (!dev->vol.migr_state)
+               return 0;
+
+       if (migr_type(dev) != MIGR_REBUILD)
+               return 0;
+
+       migr_map = get_imsm_map(dev, 1);
+
+       if (migr_map->map_state == IMSM_T_STATE_DEGRADED)
+               return 1;
+       else
+               return 0;
+}
+
+static void update_recovery_start(struct imsm_dev *dev, struct mdinfo *array)
+{
+       struct mdinfo *rebuild = NULL;
+       struct mdinfo *d;
+       __u32 units;
+
+       if (!is_rebuilding(dev))
+               return;
+
+       /* Find the rebuild target, but punt on the dual rebuild case */
+       for (d = array->devs; d; d = d->next)
+               if (d->recovery_start == 0) {
+                       if (rebuild)
+                               return;
+                       rebuild = d;
+               }
+
+       if (!rebuild) {
+               /* (?) none of the disks are marked with
+                * IMSM_ORD_REBUILD, so assume they are missing and the
+                * disk_ord_tbl was not correctly updated
+                */
+               dprintf("%s: failed to locate out-of-sync disk\n", __func__);
+               return;
+       }
+
+       units = __le32_to_cpu(dev->vol.curr_migr_unit);
+       rebuild->recovery_start = units * blocks_per_migr_unit(dev);
+}
+
+
+static struct mdinfo *container_content_imsm(struct supertype *st, char *subarray)
+{
+       /* Given a container loaded by load_super_imsm_all,
+        * extract information about all the arrays into
+        * an mdinfo tree.
+        * If 'subarray' is given, just extract info about that array.
+        *
+        * For each imsm_dev create an mdinfo, fill it in,
+        *  then look for matching devices in super->disks
+        *  and create appropriate device mdinfo.
+        */
+       struct intel_super *super = st->sb;
+       struct imsm_super *mpb = super->anchor;
+       struct mdinfo *rest = NULL;
+       unsigned int i;
+       int bbm_errors = 0;
+       struct dl *d;
+       int spare_disks = 0;
+
+       /* check for bad blocks */
+       if (imsm_bbm_log_size(super->anchor))
+               bbm_errors = 1;
+
+       /* count spare devices, not used in maps
+        */
+       for (d = super->disks; d; d = d->next)
+               if (d->index == -1)
+                       spare_disks++;
+
+       for (i = 0; i < mpb->num_raid_devs; i++) {
+               struct imsm_dev *dev;
+               struct imsm_map *map;
+               struct imsm_map *map2;
+               struct mdinfo *this;
+               int slot, chunk;
+               char *ep;
+
+               if (subarray &&
+                   (i != strtoul(subarray, &ep, 10) || *ep != '\0'))
+                       continue;
+
+               dev = get_imsm_dev(super, i);
+               map = get_imsm_map(dev, 0);
+               map2 = get_imsm_map(dev, 1);
+
+               /* do not publish arrays that are in the middle of an
+                * unsupported migration
+                */
+               if (dev->vol.migr_state &&
+                   (migr_type(dev) == MIGR_STATE_CHANGE)) {
+                       fprintf(stderr, Name ": cannot assemble volume '%.16s':"
+                               " unsupported migration in progress\n",
+                               dev->volume);
+                       continue;
+               }
+               /* do not publish arrays that are not support by controller's
+                * OROM/EFI
+                */
+
+               chunk = __le16_to_cpu(map->blocks_per_strip) >> 1;
+               if (!validate_geometry_imsm_orom(super,
+                                                get_imsm_raid_level(map), /* RAID level */
+                                                imsm_level_to_layout(get_imsm_raid_level(map)),
+                                                map->num_members, /* raid disks */
+                                                &chunk,
+                                                1 /* verbose */)) {
+                       fprintf(stderr, Name ": RAID gemetry validation failed. "
+                               "Cannot proceed with the action(s).\n");
+                       continue;
+               }
+               this = malloc(sizeof(*this));
+               if (!this) {
+                       fprintf(stderr, Name ": failed to allocate %zu bytes\n",
+                               sizeof(*this));
+                       break;
+               }
+               memset(this, 0, sizeof(*this));
+               this->next = rest;
+
+               super->current_vol = i;
+               getinfo_super_imsm_volume(st, this, NULL);
+               for (slot = 0 ; slot <  map->num_members; slot++) {
+                       unsigned long long recovery_start;
+                       struct mdinfo *info_d;
+                       struct dl *d;
+                       int idx;
+                       int skip;
+                       __u32 ord;
+
+                       skip = 0;
+                       idx = get_imsm_disk_idx(dev, slot, 0);
+                       ord = get_imsm_ord_tbl_ent(dev, slot, -1);
+                       for (d = super->disks; d ; d = d->next)
+                               if (d->index == idx)
+                                       break;
+
+                       recovery_start = MaxSector;
+                       if (d == NULL)
+                               skip = 1;
+                       if (d && is_failed(&d->disk))
+                               skip = 1;
+                       if (ord & IMSM_ORD_REBUILD)
+                               recovery_start = 0;
+
+                       /* 
+                        * if we skip some disks the array will be assmebled degraded;
+                        * reset resync start to avoid a dirty-degraded
+                        * situation when performing the intial sync
+                        *
+                        * FIXME handle dirty degraded
+                        */
+                       if ((skip || recovery_start == 0) && !dev->vol.dirty)
+                               this->resync_start = MaxSector;
+                       if (skip)
                                 continue;
  
-                       info_d = malloc(sizeof(*info_d));
+                       info_d = calloc(1, sizeof(*info_d));
                         if (!info_d) {
                                 fprintf(stderr, Name ": failed to allocate disk"
                                         " for volume %.16s\n", dev->volume);
+                               info_d = this->devs;
+                               while (info_d) {
+                                       struct mdinfo *d = info_d->next;
+
+                                       free(info_d);
+                                       info_d = d;
+                               }
                                 free(this);
                                 this = rest;
                                 break;
                         }
-                       memset(info_d, 0, sizeof(*info_d));
                         info_d->next = this->devs;
                         this->devs = info_d;
  
@@ -3854,40 +5040,39 @@ static struct mdinfo *container_content_imsm(struct supertype *st)
                         info_d->disk.major = d->major;
                         info_d->disk.minor = d->minor;
                         info_d->disk.raid_disk = slot;
-
-                       this->array.working_disks++;
+                       info_d->recovery_start = recovery_start;
+                       if (map2) {
+                               if (slot < map2->num_members)
+                                       info_d->disk.state = (1 << MD_DISK_ACTIVE);
+                               else
+                                       this->array.spare_disks++;
+                       } else {
+                               if (slot < map->num_members)
+                                       info_d->disk.state = (1 << MD_DISK_ACTIVE);
+                               else
+                                       this->array.spare_disks++;
+                       }
+                       if (info_d->recovery_start == MaxSector)
+                               this->array.working_disks++;
  
                         info_d->events = __le32_to_cpu(mpb->generation_num);
                         info_d->data_offset = __le32_to_cpu(map->pba_of_lba0);
                         info_d->component_size = __le32_to_cpu(map->blocks_per_member);
-                       if (d->devname)
-                               strcpy(info_d->name, d->devname);
                 }
+               /* now that the disk list is up-to-date fixup recovery_start */
+               update_recovery_start(dev, this);
+               this->array.spare_disks += spare_disks;
                 rest = this;
         }
  
+       /* if array has bad blocks, set suitable bit in array status */
+       if (bbm_errors)
+               rest->array.state |= (1<<MD_SB_BBM_ERRORS);
+
         return rest;
  }
  
  
-#ifndef MDASSEMBLE
-static int imsm_open_new(struct supertype *c, struct active_array *a,
-                        char *inst)
-{
-       struct intel_super *super = c->sb;
-       struct imsm_super *mpb = super->anchor;
-       
-       if (atoi(inst) >= mpb->num_raid_devs) {
-               fprintf(stderr, "%s: subarry index %d, out of range\n",
-                       __func__, atoi(inst));
-               return -ENODEV;
-       }
-
-       dprintf("imsm: open_new %s\n", inst);
-       a->info.container_member = atoi(inst);
-       return 0;
-}
-
  static __u8 imsm_check_degraded(struct intel_super *super, struct imsm_dev *dev, int failed)
  {
         struct imsm_map *map = get_imsm_map(dev, 0);
@@ -3918,7 +5103,7 @@ static __u8 imsm_check_degraded(struct intel_super *super, struct imsm_dev *dev,
                 int insync = insync;
  
                 for (i = 0; i < map->num_members; i++) {
-                       __u32 ord = get_imsm_ord_tbl_ent(dev, i);
+                       __u32 ord = get_imsm_ord_tbl_ent(dev, i, -1);
                         int idx = ord_to_idx(ord);
                         struct imsm_disk *disk;
  
@@ -3986,6 +5171,24 @@ static int imsm_count_failed(struct intel_super *super, struct imsm_dev *dev)
         return failed;
  }
  
+#ifndef MDASSEMBLE
+static int imsm_open_new(struct supertype *c, struct active_array *a,
+                        char *inst)
+{
+       struct intel_super *super = c->sb;
+       struct imsm_super *mpb = super->anchor;
+       
+       if (atoi(inst) >= mpb->num_raid_devs) {
+               fprintf(stderr, "%s: subarry index %d, out of range\n",
+                       __func__, atoi(inst));
+               return -ENODEV;
+       }
+
+       dprintf("imsm: open_new %s\n", inst);
+       a->info.container_member = atoi(inst);
+       return 0;
+}
+
  static int is_resyncing(struct imsm_dev *dev)
  {
         struct imsm_map *migr_map;
@@ -3997,27 +5200,13 @@ static int is_resyncing(struct imsm_dev *dev)
             migr_type(dev) == MIGR_REPAIR)
                 return 1;
  
-       migr_map = get_imsm_map(dev, 1);
-
-       if (migr_map->map_state == IMSM_T_STATE_NORMAL)
-               return 1;
-       else
-               return 0;
-}
-
-static int is_rebuilding(struct imsm_dev *dev)
-{
-       struct imsm_map *migr_map;
-
-       if (!dev->vol.migr_state)
-               return 0;
-
-       if (migr_type(dev) != MIGR_REBUILD)
+       if (migr_type(dev) == MIGR_GEN_MIGR)
                 return 0;
  
         migr_map = get_imsm_map(dev, 1);
  
-       if (migr_map->map_state == IMSM_T_STATE_DEGRADED)
+       if ((migr_map->map_state == IMSM_T_STATE_NORMAL) &&
+           (dev->vol.migr_type != MIGR_GEN_MIGR))
                 return 1;
         else
                 return 0;
@@ -4029,6 +5218,8 @@ static int mark_failure(struct imsm_dev *dev, struct imsm_disk *disk, int idx)
         __u32 ord;
         int slot;
         struct imsm_map *map;
+       char buf[MAX_RAID_SERIAL_LEN+3];
+       unsigned int len, shift = 0;
  
         /* new failures are always set in map[0] */
         map = get_imsm_map(dev, 0);
@@ -4041,10 +5232,14 @@ static int mark_failure(struct imsm_dev *dev, struct imsm_disk *disk, int idx)
         if (is_failed(disk) && (ord & IMSM_ORD_REBUILD))
                 return 0;
  
+       sprintf(buf, "%s:0", disk->serial);
+       if ((len = strlen(buf)) >= MAX_RAID_SERIAL_LEN)
+               shift = len - MAX_RAID_SERIAL_LEN + 1;
+       strncpy((char *)disk->serial, &buf[shift], MAX_RAID_SERIAL_LEN);
+
         disk->status |= FAILED_DISK;
-       disk->status &= ~CONFIGURED_DISK;
         set_imsm_ord_tbl_ent(map, slot, idx | IMSM_ORD_REBUILD);
-       if (~map->failed_disk_num == 0)
+       if (map->failed_disk_num == 0xff)
                 map->failed_disk_num = slot;
         return 1;
  }
@@ -4060,7 +5255,107 @@ static void mark_missing(struct imsm_dev *dev, struct imsm_disk *disk, int idx)
         memmove(&disk->serial[0], &disk->serial[1], MAX_RAID_SERIAL_LEN - 1);
  }
  
-/* Handle dirty -> clean transititions and resync.  Degraded and rebuild
+static void handle_missing(struct intel_super *super, struct imsm_dev *dev)
+{
+       __u8 map_state;
+       struct dl *dl;
+       int failed;
+
+       if (!super->missing)
+               return;
+       failed = imsm_count_failed(super, dev);
+       map_state = imsm_check_degraded(super, dev, failed);
+
+       dprintf("imsm: mark missing\n");
+       end_migration(dev, map_state);
+       for (dl = super->missing; dl; dl = dl->next)
+               mark_missing(dev, &dl->disk, dl->index);
+       super->updates_pending++;
+}
+
+static unsigned long long imsm_set_array_size(struct imsm_dev *dev)
+{
+       int used_disks = imsm_num_data_members(dev, 0);
+       unsigned long long array_blocks;
+       struct imsm_map *map;
+
+       if (used_disks == 0) {
+               /* when problems occures
+                * return current array_blocks value
+                */
+               array_blocks = __le32_to_cpu(dev->size_high);
+               array_blocks = array_blocks << 32;
+               array_blocks += __le32_to_cpu(dev->size_low);
+
+               return array_blocks;
+       }
+
+       /* set array size in metadata
+        */
+       map = get_imsm_map(dev, 0);
+       array_blocks = map->blocks_per_member * used_disks;
+
+       /* round array size down to closest MB
+        */
+       array_blocks = (array_blocks >> SECT_PER_MB_SHIFT) << SECT_PER_MB_SHIFT;
+       dev->size_low = __cpu_to_le32((__u32)array_blocks);
+       dev->size_high = __cpu_to_le32((__u32)(array_blocks >> 32));
+
+       return array_blocks;
+}
+
+static void imsm_set_disk(struct active_array *a, int n, int state);
+
+static void imsm_progress_container_reshape(struct intel_super *super)
+{
+       /* if no device has a migr_state, but some device has a
+        * different number of members than the previous device, start
+        * changing the number of devices in this device to match
+        * previous.
+        */
+       struct imsm_super *mpb = super->anchor;
+       int prev_disks = -1;
+       int i;
+       int copy_map_size;
+
+       for (i = 0; i < mpb->num_raid_devs; i++) {
+               struct imsm_dev *dev = get_imsm_dev(super, i);
+               struct imsm_map *map = get_imsm_map(dev, 0);
+               struct imsm_map *map2;
+               int prev_num_members;
+
+               if (dev->vol.migr_state)
+                       return;
+
+               if (prev_disks == -1)
+                       prev_disks = map->num_members;
+               if (prev_disks == map->num_members)
+                       continue;
+
+               /* OK, this array needs to enter reshape mode.
+                * i.e it needs a migr_state
+                */
+
+               copy_map_size = sizeof_imsm_map(map);
+               prev_num_members = map->num_members;
+               map->num_members = prev_disks;
+               dev->vol.migr_state = 1;
+               dev->vol.curr_migr_unit = 0;
+               dev->vol.migr_type = MIGR_GEN_MIGR;
+               for (i = prev_num_members;
+                    i < map->num_members; i++)
+                       set_imsm_ord_tbl_ent(map, i, i);
+               map2 = get_imsm_map(dev, 1);
+               /* Copy the current map */
+               memcpy(map2, map, copy_map_size);
+               map2->num_members = prev_num_members;
+
+               imsm_set_array_size(dev);
+               super->updates_pending++;
+       }
+}
+
+/* Handle dirty -> clean transititions, resync and reshape.  Degraded and rebuild
   * states are handled in imsm_set_disk() with one exception, when a
   * resync is stopped due to a new failure this routine will set the
   * 'degraded' state for the array.
@@ -4073,25 +5368,75 @@ static int imsm_set_array_state(struct active_array *a, int consistent)
         struct imsm_map *map = get_imsm_map(dev, 0);
         int failed = imsm_count_failed(super, dev);
         __u8 map_state = imsm_check_degraded(super, dev, failed);
+       __u32 blocks_per_unit;
+
+       if (dev->vol.migr_state &&
+           dev->vol.migr_type  == MIGR_GEN_MIGR) {
+               /* array state change is blocked due to reshape action
+                * We might need to
+                * - abort the reshape (if last_checkpoint is 0 and action!= reshape)
+                * - finish the reshape (if last_checkpoint is big and action != reshape)
+                * - update curr_migr_unit
+                */
+               if (a->curr_action == reshape) {
+                       /* still reshaping, maybe update curr_migr_unit */
+                       goto mark_checkpoint;
+               } else {
+                       if (a->last_checkpoint == 0 && a->prev_action == reshape) {
+                               /* for some reason we aborted the reshape.
+                                * Better clean up
+                                */
+                               struct imsm_map *map2 = get_imsm_map(dev, 1);
+                               dev->vol.migr_state = 0;
+                               dev->vol.migr_type = 0;
+                               dev->vol.curr_migr_unit = 0;
+                               memcpy(map, map2, sizeof_imsm_map(map2));
+                               super->updates_pending++;
+                       }
+                       if (a->last_checkpoint >= a->info.component_size) {
+                               unsigned long long array_blocks;
+                               int used_disks;
+                               struct mdinfo *mdi;
+
+                               used_disks = imsm_num_data_members(dev, 0);
+                               if (used_disks > 0) {
+                                       array_blocks =
+                                               map->blocks_per_member *
+                                               used_disks;
+                                       /* round array size down to closest MB
+                                        */
+                                       array_blocks = (array_blocks
+                                                       >> SECT_PER_MB_SHIFT)
+                                               << SECT_PER_MB_SHIFT;
+                                       a->info.custom_array_size = array_blocks;
+                                       /* encourage manager to update array
+                                        * size
+                                        */
+
+                                       a->check_reshape = 1;
+                               }
+                               /* finalize online capacity expansion/reshape */
+                               for (mdi = a->info.devs; mdi; mdi = mdi->next)
+                                       imsm_set_disk(a,
+                                                     mdi->disk.raid_disk,
+                                                     mdi->curr_state);
+
+                               imsm_progress_container_reshape(super);
+                       }
+               }
+       }
  
         /* before we activate this array handle any missing disks */
-       if (consistent == 2 && super->missing) {
-               struct dl *dl;
+       if (consistent == 2)
+               handle_missing(super, dev);
  
-               dprintf("imsm: mark missing\n");
-               end_migration(dev, map_state);
-               for (dl = super->missing; dl; dl = dl->next)
-                       mark_missing(dev, &dl->disk, dl->index);
-               super->updates_pending++;
-       }
-               
         if (consistent == 2 &&
-           (!is_resync_complete(a) ||
+           (!is_resync_complete(&a->info) ||
              map_state != IMSM_T_STATE_NORMAL ||
              dev->vol.migr_state))
                 consistent = 0;
  
-       if (is_resync_complete(a)) {
+       if (is_resync_complete(&a->info)) {
                 /* complete intialization / resync,
                  * recovery and interrupted recovery is completed in
                  * ->set_disk
@@ -4100,10 +5445,11 @@ static int imsm_set_array_state(struct active_array *a, int consistent)
                         dprintf("imsm: mark resync done\n");
                         end_migration(dev, map_state);
                         super->updates_pending++;
+                       a->last_checkpoint = 0;
                 }
         } else if (!is_resyncing(dev) && !failed) {
                 /* mark the start of the init process if nothing is failed */
-               dprintf("imsm: mark resync start (%llu)\n", a->resync_start);
+               dprintf("imsm: mark resync start\n");
                 if (map->map_state == IMSM_T_STATE_UNINITIALIZED)
                         migrate(dev, IMSM_T_STATE_NORMAL, MIGR_INIT);
                 else
@@ -4111,18 +5457,37 @@ static int imsm_set_array_state(struct active_array *a, int consistent)
                 super->updates_pending++;
         }
  
-        /* FIXME check if we can update curr_migr_unit from resync_start */
+mark_checkpoint:
+       /* check if we can update curr_migr_unit from resync_start, recovery_start */
+       blocks_per_unit = blocks_per_migr_unit(dev);
+       if (blocks_per_unit) {
+               __u32 units32;
+               __u64 units;
+
+               units = a->last_checkpoint / blocks_per_unit;
+               units32 = units;
+
+               /* check that we did not overflow 32-bits, and that
+                * curr_migr_unit needs updating
+                */
+               if (units32 == units &&
+                   __le32_to_cpu(dev->vol.curr_migr_unit) != units32) {
+                       dprintf("imsm: mark checkpoint (%u)\n", units32);
+                       dev->vol.curr_migr_unit = __cpu_to_le32(units32);
+                       super->updates_pending++;
+               }
+       }
  
         /* mark dirty / clean */
         if (dev->vol.dirty != !consistent) {
-               dprintf("imsm: mark '%s' (%llu)\n",
-                       consistent ? "clean" : "dirty", a->resync_start);
+               dprintf("imsm: mark '%s'\n", consistent ? "clean" : "dirty");
                 if (consistent)
                         dev->vol.dirty = 0;
                 else
                         dev->vol.dirty = 1;
                 super->updates_pending++;
         }
+
         return consistent;
  }
  
@@ -4146,7 +5511,7 @@ static void imsm_set_disk(struct active_array *a, int n, int state)
  
         dprintf("imsm: set_disk %d:%x\n", n, state);
  
-       ord = get_imsm_ord_tbl_ent(dev, n);
+       ord = get_imsm_ord_tbl_ent(dev, n, -1);
         disk = get_imsm_disk(super, ord_to_idx(ord));
  
         /* check for new failures */
@@ -4172,17 +5537,37 @@ static void imsm_set_disk(struct active_array *a, int n, int state)
                 map = get_imsm_map(dev, 0);
                 map->failed_disk_num = ~0;
                 super->updates_pending++;
+               a->last_checkpoint = 0;
         } else if (map_state == IMSM_T_STATE_DEGRADED &&
                    map->map_state != map_state &&
                    !dev->vol.migr_state) {
                 dprintf("imsm: mark degraded\n");
                 map->map_state = map_state;
                 super->updates_pending++;
+               a->last_checkpoint = 0;
         } else if (map_state == IMSM_T_STATE_FAILED &&
                    map->map_state != map_state) {
                 dprintf("imsm: mark failed\n");
                 end_migration(dev, map_state);
                 super->updates_pending++;
+               a->last_checkpoint = 0;
+       } else if (is_gen_migration(dev)) {
+               dprintf("imsm: Detected General Migration in state: ");
+               if (map_state == IMSM_T_STATE_NORMAL) {
+                       end_migration(dev, map_state);
+                       map = get_imsm_map(dev, 0);
+                       map->failed_disk_num = ~0;
+                       dprintf("normal\n");
+               } else {
+                       if (map_state == IMSM_T_STATE_DEGRADED) {
+                               printf("degraded\n");
+                               end_migration(dev, map_state);
+                       } else {
+                               dprintf("failed\n");
+                       }
+                       map->map_state = map_state;
+               }
+               super->updates_pending++;
         }
  }
  
@@ -4203,7 +5588,8 @@ static int store_imsm_mpb(int fd, struct imsm_super *mpb)
                 if (lseek64(fd, dsize - (512 * (2 + sectors)), SEEK_SET) < 0)
                         return 1;
  
-               if (write(fd, buf + 512, 512 * sectors) != 512 * sectors)
+               if ((unsigned long long)write(fd, buf + 512, 512 * sectors)
+                   != 512 * sectors)
                         return 1;
         }
  
@@ -4221,10 +5607,11 @@ static void imsm_sync_metadata(struct supertype *container)
  {
         struct intel_super *super = container->sb;
  
+       dprintf("sync metadata: %d\n", super->updates_pending);
         if (!super->updates_pending)
                 return;
  
-       write_super_imsm(super, 0);
+       write_super_imsm(container, 0);
  
         super->updates_pending = 0;
  }
@@ -4232,7 +5619,7 @@ static void imsm_sync_metadata(struct supertype *container)
  static struct dl *imsm_readd(struct intel_super *super, int idx, struct active_array *a)
  {
         struct imsm_dev *dev = get_imsm_dev(super, a->info.container_member);
-       int i = get_imsm_disk_idx(dev, idx);
+       int i = get_imsm_disk_idx(dev, idx, -1);
         struct dl *dl;
  
         for (dl = super->disks; dl; dl = dl->next)
@@ -4249,10 +5636,11 @@ static struct dl *imsm_readd(struct intel_super *super, int idx, struct active_a
  }
  
  static struct dl *imsm_add_spare(struct intel_super *super, int slot,
-                                struct active_array *a, int activate_new)
+                                struct active_array *a, int activate_new,
+                                struct mdinfo *additional_test_list)
  {
         struct imsm_dev *dev = get_imsm_dev(super, a->info.container_member);
-       int idx = get_imsm_disk_idx(dev, slot);
+       int idx = get_imsm_disk_idx(dev, slot, -1);
         struct imsm_super *mpb = super->anchor;
         struct imsm_map *map;
         unsigned long long pos;
@@ -4260,9 +5648,10 @@ static struct dl *imsm_add_spare(struct intel_super *super, int slot,
         struct extent *ex;
         int i, j;
         int found;
-       __u32 array_start;
-       __u32 array_end;
+       __u32 array_start = 0;
+       __u32 array_end = 0;
         struct dl *dl;
+       struct mdinfo *test_list;
  
         for (dl = super->disks; dl; dl = dl->next) {
                 /* If in this array, skip */
@@ -4270,11 +5659,24 @@ static struct dl *imsm_add_spare(struct intel_super *super, int slot,
                         if (d->state_fd >= 0 &&
                             d->disk.major == dl->major &&
                             d->disk.minor == dl->minor) {
-                               dprintf("%x:%x already in array\n", dl->major, dl->minor);
+                               dprintf("%x:%x already in array\n",
+                                       dl->major, dl->minor);
                                 break;
                         }
                 if (d)
                         continue;
+               test_list = additional_test_list;
+               while (test_list) {
+                       if (test_list->disk.major == dl->major &&
+                           test_list->disk.minor == dl->minor) {
+                               dprintf("%x:%x already in additional test list\n",
+                                       dl->major, dl->minor);
+                               break;
+                       }
+                       test_list = test_list->next;
+               }
+               if (test_list)
+                       continue;
  
                 /* skip in use or failed drives */
                 if (is_failed(&dl->disk) || idx == dl->index ||
@@ -4344,6 +5746,45 @@ static struct dl *imsm_add_spare(struct intel_super *super, int slot,
         return dl;
  }
  
+
+static int imsm_rebuild_allowed(struct supertype *cont, int dev_idx, int failed)
+{
+       struct imsm_dev *dev2;
+       struct imsm_map *map;
+       struct dl *idisk;
+       int slot;
+       int idx;
+       __u8 state;
+
+       dev2 = get_imsm_dev(cont->sb, dev_idx);
+       if (dev2) {
+               state = imsm_check_degraded(cont->sb, dev2, failed);
+               if (state == IMSM_T_STATE_FAILED) {
+                       map = get_imsm_map(dev2, 0);
+                       if (!map)
+                               return 1;
+                       for (slot = 0; slot < map->num_members; slot++) {
+                               /*
+                                * Check if failed disks are deleted from intel
+                                * disk list or are marked to be deleted
+                                */
+                               idx = get_imsm_disk_idx(dev2, slot, -1);
+                               idisk = get_imsm_dl_disk(cont->sb, idx);
+                               /*
+                                * Do not rebuild the array if failed disks
+                                * from failed sub-array are not removed from
+                                * container.
+                                */
+                               if (idisk &&
+                                   is_failed(&idisk->disk) &&
+                                   (idisk->action != DISK_REMOVE))
+                                       return 0;
+                       }
+               }
+       }
+       return 1;
+}
+
  static struct mdinfo *imsm_activate_spare(struct active_array *a,
                                           struct metadata_update **updates)
  {
@@ -4371,6 +5812,7 @@ static struct mdinfo *imsm_activate_spare(struct active_array *a,
         struct imsm_update_activate_spare *u;
         int num_spares = 0;
         int i;
+       int allowed;
  
         for (d = a->info.devs ; d ; d = d->next) {
                 if ((d->curr_state & DS_FAULTY) &&
@@ -4383,9 +5825,41 @@ static struct mdinfo *imsm_activate_spare(struct active_array *a,
  
         dprintf("imsm: activate spare: inst=%d failed=%d (%d) level=%d\n",
                 inst, failed, a->info.array.raid_disks, a->info.array.level);
+
+       if (dev->vol.migr_state &&
+           dev->vol.migr_type == MIGR_GEN_MIGR)
+               /* No repair during migration */
+               return NULL;
+
+       if (a->info.array.level == 4)
+               /* No repair for takeovered array
+                * imsm doesn't support raid4
+                */
+               return NULL;
+
         if (imsm_check_degraded(super, dev, failed) != IMSM_T_STATE_DEGRADED)
                 return NULL;
  
+       /*
+        * If there are any failed disks check state of the other volume.
+        * Block rebuild if the another one is failed until failed disks
+        * are removed from container.
+        */
+       if (failed) {
+               dprintf("found failed disks in %s, check if there another"
+                       "failed sub-array.\n",
+                       dev->volume);
+               /* check if states of the other volumes allow for rebuild */
+               for (i = 0; i <  super->anchor->num_raid_devs; i++) {
+                       if (i != inst) {
+                               allowed = imsm_rebuild_allowed(a->container,
+                                                              i, failed);
+                               if (!allowed)
+                                       return NULL;
+                       }
+               }
+       }
+
         /* For each slot, if it is not working, find a spare */
         for (i = 0; i < a->info.array.raid_disks; i++) {
                 for (d = a->info.devs ; d ; d = d->next)
@@ -4404,9 +5878,9 @@ static struct mdinfo *imsm_activate_spare(struct active_array *a,
                  */
                 dl = imsm_readd(super, i, a);
                 if (!dl)
-                       dl = imsm_add_spare(super, i, a, 0);
+                       dl = imsm_add_spare(super, i, a, 0, NULL);
                 if (!dl)
-                       dl = imsm_add_spare(super, i, a, 1);
+                       dl = imsm_add_spare(super, i, a, 1, NULL);
                 if (!dl)
                         continue;
   
@@ -4433,6 +5907,7 @@ static struct mdinfo *imsm_activate_spare(struct active_array *a,
                 di->disk.major = dl->major;
                 di->disk.minor = dl->minor;
                 di->disk.state = 0;
+               di->recovery_start = 0;
                 di->data_offset = __le32_to_cpu(map->pba_of_lba0);
                 di->component_size = a->info.component_size;
                 di->container_member = inst;
@@ -4472,6 +5947,7 @@ static struct mdinfo *imsm_activate_spare(struct active_array *a,
         }
                         
         mu->space = NULL;
+       mu->space_list = NULL;
         mu->len = sizeof(struct imsm_update_activate_spare) * num_spares;
         mu->next = *updates;
         u = (struct imsm_update_activate_spare *) mu->buf;
@@ -4485,33 +5961,315 @@ static struct mdinfo *imsm_activate_spare(struct active_array *a,
                 u->next = u + 1;
                 u++;
         }
-       (u-1)->next = NULL;
-       *updates = mu;
+       (u-1)->next = NULL;
+       *updates = mu;
+
+       return rv;
+}
+
+static int disks_overlap(struct intel_super *super, int idx, struct imsm_update_create_array *u)
+{
+       struct imsm_dev *dev = get_imsm_dev(super, idx);
+       struct imsm_map *map = get_imsm_map(dev, 0);
+       struct imsm_map *new_map = get_imsm_map(&u->dev, 0);
+       struct disk_info *inf = get_disk_info(u);
+       struct imsm_disk *disk;
+       int i;
+       int j;
+
+       for (i = 0; i < map->num_members; i++) {
+               disk = get_imsm_disk(super, get_imsm_disk_idx(dev, i, -1));
+               for (j = 0; j < new_map->num_members; j++)
+                       if (serialcmp(disk->serial, inf[j].serial) == 0)
+                               return 1;
+       }
+
+       return 0;
+}
+
+
+static struct dl *get_disk_super(struct intel_super *super, int major, int minor)
+{
+       struct dl *dl = NULL;
+       for (dl = super->disks; dl; dl = dl->next)
+               if ((dl->major == major) &&  (dl->minor == minor))
+                       return dl;
+       return NULL;
+}
+
+static int remove_disk_super(struct intel_super *super, int major, int minor)
+{
+       struct dl *prev = NULL;
+       struct dl *dl;
+
+       prev = NULL;
+       for (dl = super->disks; dl; dl = dl->next) {
+               if ((dl->major == major) && (dl->minor == minor)) {
+                       /* remove */
+                       if (prev)
+                               prev->next = dl->next;
+                       else
+                               super->disks = dl->next;
+                       dl->next = NULL;
+                       __free_imsm_disk(dl);
+                       dprintf("%s: removed %x:%x\n",
+                               __func__, major, minor);
+                       break;
+               }
+               prev = dl;
+       }
+       return 0;
+}
+
+static void imsm_delete(struct intel_super *super, struct dl **dlp, unsigned index);
+
+static int add_remove_disk_update(struct intel_super *super)
+{
+       int check_degraded = 0;
+       struct dl *disk = NULL;
+       /* add/remove some spares to/from the metadata/contrainer */
+       while (super->disk_mgmt_list) {
+               struct dl *disk_cfg;
+
+               disk_cfg = super->disk_mgmt_list;
+               super->disk_mgmt_list = disk_cfg->next;
+               disk_cfg->next = NULL;
+
+               if (disk_cfg->action == DISK_ADD) {
+                       disk_cfg->next = super->disks;
+                       super->disks = disk_cfg;
+                       check_degraded = 1;
+                       dprintf("%s: added %x:%x\n",
+                               __func__, disk_cfg->major,
+                               disk_cfg->minor);
+               } else if (disk_cfg->action == DISK_REMOVE) {
+                       dprintf("Disk remove action processed: %x.%x\n",
+                               disk_cfg->major, disk_cfg->minor);
+                       disk = get_disk_super(super,
+                                             disk_cfg->major,
+                                             disk_cfg->minor);
+                       if (disk) {
+                               /* store action status */
+                               disk->action = DISK_REMOVE;
+                               /* remove spare disks only */
+                               if (disk->index == -1) {
+                                       remove_disk_super(super,
+                                                         disk_cfg->major,
+                                                         disk_cfg->minor);
+                               }
+                       }
+                       /* release allocate disk structure */
+                       __free_imsm_disk(disk_cfg);
+               }
+       }
+       return check_degraded;
+}
+
+static int apply_reshape_container_disks_update(struct imsm_update_reshape *u,
+                                               struct intel_super *super,
+                                               void ***space_list)
+{
+       struct dl *new_disk;
+       struct intel_dev *id;
+       int i;
+       int delta_disks = u->new_raid_disks - u->old_raid_disks;
+       int disk_count = u->old_raid_disks;
+       void **tofree = NULL;
+       int devices_to_reshape = 1;
+       struct imsm_super *mpb = super->anchor;
+       int ret_val = 0;
+       unsigned int dev_id;
+
+       dprintf("imsm: apply_reshape_container_disks_update()\n");
+
+       /* enable spares to use in array */
+       for (i = 0; i < delta_disks; i++) {
+               new_disk = get_disk_super(super,
+                                         major(u->new_disks[i]),
+                                         minor(u->new_disks[i]));
+               dprintf("imsm: new disk for reshape is: %i:%i "
+                       "(%p, index = %i)\n",
+                       major(u->new_disks[i]), minor(u->new_disks[i]),
+                       new_disk, new_disk->index);
+               if ((new_disk == NULL) ||
+                   ((new_disk->index >= 0) &&
+                    (new_disk->index < u->old_raid_disks)))
+                       goto update_reshape_exit;
+               new_disk->index = disk_count++;
+               /* slot to fill in autolayout
+                */
+               new_disk->raiddisk = new_disk->index;
+               new_disk->disk.status |=
+                       CONFIGURED_DISK;
+               new_disk->disk.status &= ~SPARE_DISK;
+       }
+
+       dprintf("imsm: volume set mpb->num_raid_devs = %i\n",
+               mpb->num_raid_devs);
+       /* manage changes in volume
+        */
+       for (dev_id = 0; dev_id < mpb->num_raid_devs; dev_id++) {
+               void **sp = *space_list;
+               struct imsm_dev *newdev;
+               struct imsm_map *newmap, *oldmap;
+
+               for (id = super->devlist ; id; id = id->next) {
+                       if (id->index == dev_id)
+                               break;
+               }
+               if (id == NULL)
+                       break;
+               if (!sp)
+                       continue;
+               *space_list = *sp;
+               newdev = (void*)sp;
+               /* Copy the dev, but not (all of) the map */
+               memcpy(newdev, id->dev, sizeof(*newdev));
+               oldmap = get_imsm_map(id->dev, 0);
+               newmap = get_imsm_map(newdev, 0);
+               /* Copy the current map */
+               memcpy(newmap, oldmap, sizeof_imsm_map(oldmap));
+               /* update one device only
+                */
+               if (devices_to_reshape) {
+                       dprintf("imsm: modifying subdev: %i\n",
+                               id->index);
+                       devices_to_reshape--;
+                       newdev->vol.migr_state = 1;
+                       newdev->vol.curr_migr_unit = 0;
+                       newdev->vol.migr_type = MIGR_GEN_MIGR;
+                       newmap->num_members = u->new_raid_disks;
+                       for (i = 0; i < delta_disks; i++) {
+                               set_imsm_ord_tbl_ent(newmap,
+                                                    u->old_raid_disks + i,
+                                                    u->old_raid_disks + i);
+                       }
+                       /* New map is correct, now need to save old map
+                        */
+                       newmap = get_imsm_map(newdev, 1);
+                       memcpy(newmap, oldmap, sizeof_imsm_map(oldmap));
+
+                       imsm_set_array_size(newdev);
+               }
+
+               sp = (void **)id->dev;
+               id->dev = newdev;
+               *sp = tofree;
+               tofree = sp;
+       }
+       if (tofree)
+               *space_list = tofree;
+       ret_val = 1;
  
-       return rv;
+update_reshape_exit:
+
+       return ret_val;
  }
  
-static int disks_overlap(struct intel_super *super, int idx, struct imsm_update_create_array *u)
+static int apply_takeover_update(struct imsm_update_takeover *u,
+                                struct intel_super *super,
+                                void ***space_list)
  {
-       struct imsm_dev *dev = get_imsm_dev(super, idx);
-       struct imsm_map *map = get_imsm_map(dev, 0);
-       struct imsm_map *new_map = get_imsm_map(&u->dev, 0);
-       struct disk_info *inf = get_disk_info(u);
-       struct imsm_disk *disk;
+       struct imsm_dev *dev = NULL;
+       struct intel_dev *dv;
+       struct imsm_dev *dev_new;
+       struct imsm_map *map;
+       struct dl *dm, *du;
         int i;
-       int j;
  
-       for (i = 0; i < map->num_members; i++) {
-               disk = get_imsm_disk(super, get_imsm_disk_idx(dev, i));
-               for (j = 0; j < new_map->num_members; j++)
-                       if (serialcmp(disk->serial, inf[j].serial) == 0)
-                               return 1;
+       for (dv = super->devlist; dv; dv = dv->next)
+               if (dv->index == (unsigned int)u->subarray) {
+                       dev = dv->dev;
+                       break;
+               }
+
+       if (dev == NULL)
+               return 0;
+
+       map = get_imsm_map(dev, 0);
+
+       if (u->direction == R10_TO_R0) {
+               /* Number of failed disks must be half of initial disk number */
+               if (imsm_count_failed(super, dev) != (map->num_members / 2))
+                       return 0;
+
+               /* iterate through devices to mark removed disks as spare */
+               for (dm = super->disks; dm; dm = dm->next) {
+                       if (dm->disk.status & FAILED_DISK) {
+                               int idx = dm->index;
+                               /* update indexes on the disk list */
+/* FIXME this loop-with-the-loop looks wrong,  I'm not convinced
+   the index values will end up being correct.... NB */
+                               for (du = super->disks; du; du = du->next)
+                                       if (du->index > idx)
+                                               du->index--;
+                               /* mark as spare disk */
+                               dm->disk.status = SPARE_DISK;
+                               dm->index = -1;
+                       }
+               }
+               /* update map */
+               map->num_members = map->num_members / 2;
+               map->map_state = IMSM_T_STATE_NORMAL;
+               map->num_domains = 1;
+               map->raid_level = 0;
+               map->failed_disk_num = -1;
         }
  
-       return 0;
-}
+       if (u->direction == R0_TO_R10) {
+               void **space;
+               /* update slots in current disk list */
+               for (dm = super->disks; dm; dm = dm->next) {
+                       if (dm->index >= 0)
+                               dm->index *= 2;
+               }
+               /* create new *missing* disks */
+               for (i = 0; i < map->num_members; i++) {
+                       space = *space_list;
+                       if (!space)
+                               continue;
+                       *space_list = *space;
+                       du = (void *)space;
+                       memcpy(du, super->disks, sizeof(*du));
+                       du->fd = -1;
+                       du->minor = 0;
+                       du->major = 0;
+                       du->index = (i * 2) + 1;
+                       sprintf((char *)du->disk.serial,
+                               " MISSING_%d", du->index);
+                       sprintf((char *)du->serial,
+                               "MISSING_%d", du->index);
+                       du->next = super->missing;
+                       super->missing = du;
+               }
+               /* create new dev and map */
+               space = *space_list;
+               if (!space)
+                       return 0;
+               *space_list = *space;
+               dev_new = (void *)space;
+               memcpy(dev_new, dev, sizeof(*dev));
+               /* update new map */
+               map = get_imsm_map(dev_new, 0);
+               map->num_members = map->num_members * 2;
+               map->map_state = IMSM_T_STATE_DEGRADED;
+               map->num_domains = 2;
+               map->raid_level = 1;
+               /* replace dev<->dev_new */
+               dv->dev = dev_new;
+       }
+       /* update disk order table */
+       for (du = super->disks; du; du = du->next)
+               if (du->index >= 0)
+                       set_imsm_ord_tbl_ent(map, du->index, du->index);
+       for (du = super->missing; du; du = du->next)
+               if (du->index >= 0) {
+                       set_imsm_ord_tbl_ent(map, du->index, du->index);
+                       mark_missing(dev_new, &du->disk, du->index);
+               }
  
-static void imsm_delete(struct intel_super *super, struct dl **dlp, int index);
+       return 1;
+}
  
  static void imsm_process_update(struct supertype *st,
                                 struct metadata_update *update)
@@ -4519,10 +6277,18 @@ static void imsm_process_update(struct supertype *st,
         /**
          * crack open the metadata_update envelope to find the update record
          * update can be one of:
-        *      update_activate_spare - a spare device has replaced a failed
+        *    update_reshape_container_disks - all the arrays in the container
+        *      are being reshaped to have more devices.  We need to mark
+        *      the arrays for general migration and convert selected spares
+        *      into active devices.
+        *    update_activate_spare - a spare device has replaced a failed
          *      device in an array, update the disk_ord_tbl.  If this disk is
          *      present in all member arrays then also clear the SPARE_DISK
          *      flag
+        *    update_create_array
+        *    update_kill_array
+        *    update_rename_array
+        *    update_add_remove_disk
          */
         struct intel_super *super = st->sb;
         struct imsm_super *mpb;
@@ -4547,6 +6313,22 @@ static void imsm_process_update(struct supertype *st,
         mpb = super->anchor;
  
         switch (type) {
+       case update_takeover: {
+               struct imsm_update_takeover *u = (void *)update->buf;
+               if (apply_takeover_update(u, super, &update->space_list)) {
+                       imsm_update_version_info(super);
+                       super->updates_pending++;
+               }
+               break;
+       }
+
+       case update_reshape_container_disks: {
+               struct imsm_update_reshape *u = (void *)update->buf;
+               if (apply_reshape_container_disks_update(
+                           u, super, &update->space_list))
+                       super->updates_pending++;
+               break;
+       }
         case update_activate_spare: {
                 struct imsm_update_activate_spare *u = (void *) update->buf; 
                 struct imsm_dev *dev = get_imsm_dev(super, u->array);
@@ -4558,7 +6340,7 @@ static void imsm_process_update(struct supertype *st,
                 struct dl *dl;
                 unsigned int found;
                 int failed;
-               int victim = get_imsm_disk_idx(dev, u->slot);
+               int victim = get_imsm_disk_idx(dev, u->slot, -1);
                 int i;
  
                 for (dl = super->disks; dl; dl = dl->next)
@@ -4581,7 +6363,8 @@ static void imsm_process_update(struct supertype *st,
                 for (i = 0; i < map->num_members; i++) {
                         if (i == u->slot)
                                 continue;
-                       disk = get_imsm_disk(super, get_imsm_disk_idx(dev, i));
+                       disk = get_imsm_disk(super,
+                                            get_imsm_disk_idx(dev, i, -1));
                         if (!disk || is_failed(disk))
                                 failed++;
                 }
@@ -4758,31 +6541,88 @@ static void imsm_process_update(struct supertype *st,
                 }
                 break;
         }
-       case update_add_disk:
+       case update_kill_array: {
+               struct imsm_update_kill_array *u = (void *) update->buf;
+               int victim = u->dev_idx;
+               struct active_array *a;
+               struct intel_dev **dp;
+               struct imsm_dev *dev;
+
+               /* sanity check that we are not affecting the uuid of
+                * active arrays, or deleting an active array
+                *
+                * FIXME when immutable ids are available, but note that
+                * we'll also need to fixup the invalidated/active
+                * subarray indexes in mdstat
+                */
+               for (a = st->arrays; a; a = a->next)
+                       if (a->info.container_member >= victim)
+                               break;
+               /* by definition if mdmon is running at least one array
+                * is active in the container, so checking
+                * mpb->num_raid_devs is just extra paranoia
+                */
+               dev = get_imsm_dev(super, victim);
+               if (a || !dev || mpb->num_raid_devs == 1) {
+                       dprintf("failed to delete subarray-%d\n", victim);
+                       break;
+               }
+
+               for (dp = &super->devlist; *dp;)
+                       if ((*dp)->index == (unsigned)super->current_vol) {
+                               *dp = (*dp)->next;
+                       } else {
+                               if ((*dp)->index > (unsigned)victim)
+                                       (*dp)->index--;
+                               dp = &(*dp)->next;
+                       }
+               mpb->num_raid_devs--;
+               super->updates_pending++;
+               break;
+       }
+       case update_rename_array: {
+               struct imsm_update_rename_array *u = (void *) update->buf;
+               char name[MAX_RAID_SERIAL_LEN+1];
+               int target = u->dev_idx;
+               struct active_array *a;
+               struct imsm_dev *dev;
+
+               /* sanity check that we are not affecting the uuid of
+                * an active array
+                */
+               snprintf(name, MAX_RAID_SERIAL_LEN, "%s", (char *) u->name);
+               name[MAX_RAID_SERIAL_LEN] = '\0';
+               for (a = st->arrays; a; a = a->next)
+                       if (a->info.container_member == target)
+                               break;
+               dev = get_imsm_dev(super, u->dev_idx);
+               if (a || !dev || !check_name(super, name, 1)) {
+                       dprintf("failed to rename subarray-%d\n", target);
+                       break;
+               }
  
+               snprintf((char *) dev->volume, MAX_RAID_SERIAL_LEN, "%s", name);
+               super->updates_pending++;
+               break;
+       }
+       case update_add_remove_disk: {
                 /* we may be able to repair some arrays if disks are
-                * being added */
-               if (super->add) {
+                * being added, check teh status of add_remove_disk
+                * if discs has been added.
+                */
+               if (add_remove_disk_update(super)) {
                         struct active_array *a;
  
                         super->updates_pending++;
-                       for (a = st->arrays; a; a = a->next)
+                       for (a = st->arrays; a; a = a->next)
                                 a->check_degraded = 1;
                 }
-               /* add some spares to the metadata */
-               while (super->add) {
-                       struct dl *al;
-
-                       al = super->add;
-                       super->add = al->next;
-                       al->next = super->disks;
-                       super->disks = al;
-                       dprintf("%s: added %x:%x\n",
-                               __func__, al->major, al->minor);
-               }
-
                 break;
         }
+       default:
+               fprintf(stderr, "error: unsuported process update type:"
+                       "(type: %d)\n", type);
+       }
  }
  
  static void imsm_prepare_update(struct supertype *st,
@@ -4802,6 +6642,86 @@ static void imsm_prepare_update(struct supertype *st,
         size_t len = 0;
  
         switch (type) {
+       case update_takeover: {
+               struct imsm_update_takeover *u = (void *)update->buf;
+               if (u->direction == R0_TO_R10) {
+                       void **tail = (void **)&update->space_list;
+                       struct imsm_dev *dev = get_imsm_dev(super, u->subarray);
+                       struct imsm_map *map = get_imsm_map(dev, 0);
+                       int num_members = map->num_members;
+                       void *space;
+                       int size, i;
+                       int err = 0;
+                       /* allocate memory for added disks */
+                       for (i = 0; i < num_members; i++) {
+                               size = sizeof(struct dl);
+                               space = malloc(size);
+                               if (!space) {
+                                       err++;
+                                       break;
+                               }
+                               *tail = space;
+                               tail = space;
+                               *tail = NULL;
+                       }
+                       /* allocate memory for new device */
+                       size = sizeof_imsm_dev(super->devlist->dev, 0) +
+                               (num_members * sizeof(__u32));
+                       space = malloc(size);
+                       if (!space)
+                               err++;
+                       else {
+                               *tail = space;
+                               tail = space;
+                               *tail = NULL;
+                       }
+                       if (!err) {
+                               len = disks_to_mpb_size(num_members * 2);
+                       } else {
+                               /* if allocation didn't success, free buffer */
+                               while (update->space_list) {
+                                       void **sp = update->space_list;
+                                       update->space_list = *sp;
+                                       free(sp);
+                               }
+                       }
+               }
+
+               break;
+       }
+       case update_reshape_container_disks: {
+               /* Every raid device in the container is about to
+                * gain some more devices, and we will enter a
+                * reconfiguration.
+                * So each 'imsm_map' will be bigger, and the imsm_vol
+                * will now hold 2 of them.
+                * Thus we need new 'struct imsm_dev' allocations sized
+                * as sizeof_imsm_dev but with more devices in both maps.
+                */
+               struct imsm_update_reshape *u = (void *)update->buf;
+               struct intel_dev *dl;
+               void **space_tail = (void**)&update->space_list;
+
+               dprintf("imsm: imsm_prepare_update() for update_reshape\n");
+
+               for (dl = super->devlist; dl; dl = dl->next) {
+                       int size = sizeof_imsm_dev(dl->dev, 1);
+                       void *s;
+                       if (u->new_raid_disks > u->old_raid_disks)
+                               size += sizeof(__u32)*2*
+                                       (u->new_raid_disks - u->old_raid_disks);
+                       s = malloc(size);
+                       if (!s)
+                               break;
+                       *space_tail = s;
+                       space_tail = s;
+                       *space_tail = NULL;
+               }
+
+               len = disks_to_mpb_size(u->new_raid_disks);
+               dprintf("New anchor length is %llu\n", (unsigned long long)len);
+               break;
+       }
         case update_create_array: {
                 struct imsm_update_create_array *u = (void *) update->buf;
                 struct intel_dev *dv;
@@ -4869,7 +6789,7 @@ static void imsm_prepare_update(struct supertype *st,
  }
  
  /* must be called while manager is quiesced */
-static void imsm_delete(struct intel_super *super, struct dl **dlp, int index)
+static void imsm_delete(struct intel_super *super, struct dl **dlp, unsigned index)
  {
         struct imsm_super *mpb = super->anchor;
         struct dl *iter;
@@ -4883,10 +6803,10 @@ static void imsm_delete(struct intel_super *super, struct dl **dlp, int index)
  
         /* shift all indexes down one */
         for (iter = super->disks; iter; iter = iter->next)
-               if (iter->index > index)
+               if (iter->index > (int)index)
                         iter->index--;
         for (iter = super->missing; iter; iter = iter->next)
-               if (iter->index > index)
+               if (iter->index > (int)index)
                         iter->index--;
  
         for (i = 0; i < mpb->num_raid_devs; i++) {
@@ -4897,7 +6817,7 @@ static void imsm_delete(struct intel_super *super, struct dl **dlp, int index)
                         /* update ord entries being careful not to propagate
                          * ord-flags to the first map
                          */
-                       ord = get_imsm_ord_tbl_ent(dev, j);
+                       ord = get_imsm_ord_tbl_ent(dev, j, -1);
  
                         if (ord_to_idx(ord) <= index)
                                 continue;
@@ -4919,6 +6839,536 @@ static void imsm_delete(struct intel_super *super, struct dl **dlp, int index)
                 __free_imsm_disk(dl);
         }
  }
+
+static char disk_by_path[] = "/dev/disk/by-path/";
+
+static const char *imsm_get_disk_controller_domain(const char *path)
+{
+       char disk_path[PATH_MAX];
+       char *drv=NULL;
+       struct stat st;
+
+       strncpy(disk_path, disk_by_path, PATH_MAX - 1);
+       strncat(disk_path, path, PATH_MAX - strlen(disk_path) - 1);
+       if (stat(disk_path, &st) == 0) {
+               struct sys_dev* hba;
+               char *path=NULL;
+
+               path = devt_to_devpath(st.st_rdev);
+               if (path == NULL)
+                       return "unknown";
+               hba = find_disk_attached_hba(-1, path);
+               if (hba && hba->type == SYS_DEV_SAS)
+                       drv = "isci";
+               else if (hba && hba->type == SYS_DEV_SATA)
+                       drv = "ahci";
+               else 
+                       drv = "unknown";
+               dprintf("path: %s hba: %s attached: %s\n",
+                       path, (hba) ? hba->path : "NULL", drv);
+               free(path);
+               if (hba)
+                       free_sys_dev(&hba);
+       }
+       return drv;
+}
+
+static int imsm_find_array_minor_by_subdev(int subdev, int container, int *minor)
+{
+       char subdev_name[20];
+       struct mdstat_ent *mdstat;
+
+       sprintf(subdev_name, "%d", subdev);
+       mdstat = mdstat_by_subdev(subdev_name, container);
+       if (!mdstat)
+               return -1;
+
+       *minor = mdstat->devnum;
+       free_mdstat(mdstat);
+       return 0;
+}
+
+static int imsm_reshape_is_allowed_on_container(struct supertype *st,
+                                               struct geo_params *geo,
+                                               int *old_raid_disks)
+{
+       /* currently we only support increasing the number of devices
+        * for a container.  This increases the number of device for each
+        * member array.  They must all be RAID0 or RAID5.
+        */
+       int ret_val = 0;
+       struct mdinfo *info, *member;
+       int devices_that_can_grow = 0;
+
+       dprintf("imsm: imsm_reshape_is_allowed_on_container(ENTER): "
+               "st->devnum = (%i)\n",
+               st->devnum);
+
+       if (geo->size != -1 ||
+           geo->level != UnSet ||
+           geo->layout != UnSet ||
+           geo->chunksize != 0 ||
+           geo->raid_disks == UnSet) {
+               dprintf("imsm: Container operation is allowed for "
+                       "raid disks number change only.\n");
+               return ret_val;
+       }
+
+       info = container_content_imsm(st, NULL);
+       for (member = info; member; member = member->next) {
+               int result;
+               int minor;
+
+               dprintf("imsm: checking device_num: %i\n",
+                       member->container_member);
+
+               if (geo->raid_disks <= member->array.raid_disks) {
+                       /* we work on container for Online Capacity Expansion
+                        * only so raid_disks has to grow
+                        */
+                       dprintf("imsm: for container operation raid disks "
+                               "increase is required\n");
+                       break;
+               }
+
+               if ((info->array.level != 0) &&
+                   (info->array.level != 5)) {
+                       /* we cannot use this container with other raid level
+                        */
+                       dprintf("imsm: for container operation wrong"
+                               " raid level (%i) detected\n",
+                               info->array.level);
+                       break;
+               } else {
+                       /* check for platform support
+                        * for this raid level configuration
+                        */
+                       struct intel_super *super = st->sb;
+                       if (!is_raid_level_supported(super->orom,
+                                                    member->array.level,
+                                                    geo->raid_disks)) {
+                               dprintf("platform does not support raid%d with"
+                                       " %d disk%s\n",
+                                        info->array.level,
+                                        geo->raid_disks,
+                                        geo->raid_disks > 1 ? "s" : "");
+                               break;
+                       }
+               }
+
+               if (*old_raid_disks &&
+                   info->array.raid_disks != *old_raid_disks)
+                       break;
+               *old_raid_disks = info->array.raid_disks;
+
+               /* All raid5 and raid0 volumes in container
+                * have to be ready for Online Capacity Expansion
+                * so they need to be assembled.  We have already
+                * checked that no recovery etc is happening.
+                */
+               result = imsm_find_array_minor_by_subdev(member->container_member,
+                                                        st->container_dev,
+                                                        &minor);
+               if (result < 0) {
+                       dprintf("imsm: cannot find array\n");
+                       break;
+               }
+               devices_that_can_grow++;
+       }
+       sysfs_free(info);
+       if (!member && devices_that_can_grow)
+               ret_val = 1;
+
+       if (ret_val)
+               dprintf("\tContainer operation allowed\n");
+       else
+               dprintf("\tError: %i\n", ret_val);
+
+       return ret_val;
+}
+
+/* Function: get_spares_for_grow
+ * Description: Allocates memory and creates list of spare devices
+ *             avaliable in container. Checks if spare drive size is acceptable.
+ * Parameters: Pointer to the supertype structure
+ * Returns: Pointer to the list of spare devices (mdinfo structure) on success,
+ *             NULL if fail
+ */
+static struct mdinfo *get_spares_for_grow(struct supertype *st)
+{
+       unsigned long long min_size = min_acceptable_spare_size_imsm(st);
+       return container_choose_spares(st, min_size, NULL, NULL, NULL, 0);
+}
+
+/******************************************************************************
+ * function: imsm_create_metadata_update_for_reshape
+ * Function creates update for whole IMSM container.
+ *
+ ******************************************************************************/
+static int imsm_create_metadata_update_for_reshape(
+       struct supertype *st,
+       struct geo_params *geo,
+       int old_raid_disks,
+       struct imsm_update_reshape **updatep)
+{
+       struct intel_super *super = st->sb;
+       struct imsm_super *mpb = super->anchor;
+       int update_memory_size = 0;
+       struct imsm_update_reshape *u = NULL;
+       struct mdinfo *spares = NULL;
+       int i;
+       int delta_disks = 0;
+       struct mdinfo *dev;
+
+       dprintf("imsm_update_metadata_for_reshape(enter) raid_disks = %i\n",
+               geo->raid_disks);
+
+       delta_disks = geo->raid_disks - old_raid_disks;
+
+       /* size of all update data without anchor */
+       update_memory_size = sizeof(struct imsm_update_reshape);
+
+       /* now add space for spare disks that we need to add. */
+       update_memory_size += sizeof(u->new_disks[0]) * (delta_disks - 1);
+
+       u = calloc(1, update_memory_size);
+       if (u == NULL) {
+               dprintf("error: "
+                       "cannot get memory for imsm_update_reshape update\n");
+               return 0;
+       }
+       u->type = update_reshape_container_disks;
+       u->old_raid_disks = old_raid_disks;
+       u->new_raid_disks = geo->raid_disks;
+
+       /* now get spare disks list
+        */
+       spares = get_spares_for_grow(st);
+
+       if (spares == NULL
+           || delta_disks > spares->array.spare_disks) {
+               fprintf(stderr, Name ": imsm: ERROR: Cannot get spare devices "
+                       "for %s.\n", geo->dev_name);
+               goto abort;
+       }
+
+       /* we have got spares
+        * update disk list in imsm_disk list table in anchor
+        */
+       dprintf("imsm: %i spares are available.\n\n",
+               spares->array.spare_disks);
+
+       dev = spares->devs;
+       for (i = 0; i < delta_disks; i++) {
+               struct dl *dl;
+
+               if (dev == NULL)
+                       break;
+               u->new_disks[i] = makedev(dev->disk.major,
+                                         dev->disk.minor);
+               dl = get_disk_super(super, dev->disk.major, dev->disk.minor);
+               dl->index = mpb->num_disks;
+               mpb->num_disks++;
+               dev = dev->next;
+       }
+
+abort:
+       /* free spares
+        */
+       sysfs_free(spares);
+
+       dprintf("imsm: reshape update preparation :");
+       if (i == delta_disks) {
+               dprintf(" OK\n");
+               *updatep = u;
+               return update_memory_size;
+       }
+       free(u);
+       dprintf(" Error\n");
+
+       return 0;
+}
+
+static void imsm_update_metadata_locally(struct supertype *st,
+                                        void *buf, int len)
+{
+       struct metadata_update mu;
+
+       mu.buf = buf;
+       mu.len = len;
+       mu.space = NULL;
+       mu.space_list = NULL;
+       mu.next = NULL;
+       imsm_prepare_update(st, &mu);
+       imsm_process_update(st, &mu);
+
+       while (mu.space_list) {
+               void **space = mu.space_list;
+               mu.space_list = *space;
+               free(space);
+       }
+}
+
+/***************************************************************************
+* Function:    imsm_analyze_change
+* Description: Function analyze change for single volume
+*              and validate if transition is supported
+* Parameters:  Geometry parameters, supertype structure
+* Returns:     Operation type code on success, -1 if fail
+****************************************************************************/
+enum imsm_reshape_type imsm_analyze_change(struct supertype *st,
+                                          struct geo_params *geo)
+{
+       struct mdinfo info;
+       int change = -1;
+       int check_devs = 0;
+       int chunk;
+
+       getinfo_super_imsm_volume(st, &info, NULL);
+
+       if ((geo->level != info.array.level) &&
+           (geo->level >= 0) &&
+           (geo->level != UnSet)) {
+               switch (info.array.level) {
+               case 0:
+                       if (geo->level == 5) {
+                               change = CH_MIGRATION;
+                               check_devs = 1;
+                       }
+                       if (geo->level == 10) {
+                               change = CH_TAKEOVER;
+                               check_devs = 1;
+                       }
+                       break;
+               case 1:
+                       if (geo->level == 0) {
+                               change = CH_TAKEOVER;
+                               check_devs = 1;
+                       }
+                       break;
+               case 5:
+                       if (geo->level == 0)
+                               change = CH_MIGRATION;
+                       break;
+               case 10:
+                       if (geo->level == 0) {
+                               change = CH_TAKEOVER;
+                               check_devs = 1;
+                       }
+                       break;
+               }
+               if (change == -1) {
+                       fprintf(stderr,
+                               Name " Error. Level Migration from %d to %d "
+                               "not supported!\n",
+                               info.array.level, geo->level);
+                       goto analyse_change_exit;
+               }
+       } else
+               geo->level = info.array.level;
+
+       if ((geo->layout != info.array.layout)
+           && ((geo->layout != UnSet) && (geo->layout != -1))) {
+               change = CH_MIGRATION;
+               if ((info.array.layout == 0)
+                   && (info.array.level == 5)
+                   && (geo->layout == 5)) {
+                       /* reshape 5 -> 4 */
+               } else if ((info.array.layout == 5)
+                          && (info.array.level == 5)
+                          && (geo->layout == 0)) {
+                       /* reshape 4 -> 5 */
+                       geo->layout = 0;
+                       geo->level = 5;
+               } else {
+                       fprintf(stderr,
+                               Name " Error. Layout Migration from %d to %d "
+                               "not supported!\n",
+                               info.array.layout, geo->layout);
+                       change = -1;
+                       goto analyse_change_exit;
+               }
+       } else
+               geo->layout = info.array.layout;
+
+       if ((geo->chunksize > 0) && (geo->chunksize != UnSet)
+           && (geo->chunksize != info.array.chunk_size))
+               change = CH_MIGRATION;
+       else
+               geo->chunksize = info.array.chunk_size;
+
+       chunk = geo->chunksize / 1024;
+       if (!validate_geometry_imsm(st,
+                                   geo->level,
+                                   geo->layout,
+                                   geo->raid_disks,
+                                   &chunk,
+                                   geo->size,
+                                   0, 0, 1))
+               change = -1;
+
+       if (check_devs) {
+               struct intel_super *super = st->sb;
+               struct imsm_super *mpb = super->anchor;
+
+               if (mpb->num_raid_devs > 1) {
+                       fprintf(stderr,
+                               Name " Error. Cannot perform operation on %s"
+                               "- for this operation it MUST be single "
+                               "array in container\n",
+                               geo->dev_name);
+                       change = -1;
+               }
+       }
+
+analyse_change_exit:
+
+       return change;
+}
+
+int imsm_takeover(struct supertype *st, struct geo_params *geo)
+{
+       struct intel_super *super = st->sb;
+       struct imsm_update_takeover *u;
+
+       u = malloc(sizeof(struct imsm_update_takeover));
+       if (u == NULL)
+               return 1;
+
+       u->type = update_takeover;
+       u->subarray = super->current_vol;
+
+       /* 10->0 transition */
+       if (geo->level == 0)
+               u->direction = R10_TO_R0;
+
+       /* 0->10 transition */
+       if (geo->level == 10)
+               u->direction = R0_TO_R10;
+
+       /* update metadata locally */
+       imsm_update_metadata_locally(st, u,
+                                       sizeof(struct imsm_update_takeover));
+       /* and possibly remotely */
+       if (st->update_tail)
+               append_metadata_update(st, u,
+                                       sizeof(struct imsm_update_takeover));
+       else
+               free(u);
+
+       return 0;
+}
+
+static int imsm_reshape_super(struct supertype *st, long long size, int level,
+                             int layout, int chunksize, int raid_disks,
+                             int delta_disks, char *backup, char *dev,
+                             int verbose)
+{
+       int ret_val = 1;
+       struct geo_params geo;
+
+       dprintf("imsm: reshape_super called.\n");
+
+       memset(&geo, 0, sizeof(struct geo_params));
+
+       geo.dev_name = dev;
+       geo.dev_id = st->devnum;
+       geo.size = size;
+       geo.level = level;
+       geo.layout = layout;
+       geo.chunksize = chunksize;
+       geo.raid_disks = raid_disks;
+       if (delta_disks != UnSet)
+               geo.raid_disks += delta_disks;
+
+       dprintf("\tfor level      : %i\n", geo.level);
+       dprintf("\tfor raid_disks : %i\n", geo.raid_disks);
+
+       if (experimental() == 0)
+               return ret_val;
+
+       if (st->container_dev == st->devnum) {
+               /* On container level we can only increase number of devices. */
+               dprintf("imsm: info: Container operation\n");
+               int old_raid_disks = 0;
+               if (imsm_reshape_is_allowed_on_container(
+                           st, &geo, &old_raid_disks)) {
+                       struct imsm_update_reshape *u = NULL;
+                       int len;
+
+                       len = imsm_create_metadata_update_for_reshape(
+                               st, &geo, old_raid_disks, &u);
+
+                       if (len <= 0) {
+                               dprintf("imsm: Cannot prepare update\n");
+                               goto exit_imsm_reshape_super;
+                       }
+
+                       ret_val = 0;
+                       /* update metadata locally */
+                       imsm_update_metadata_locally(st, u, len);
+                       /* and possibly remotely */
+                       if (st->update_tail)
+                               append_metadata_update(st, u, len);
+                       else
+                               free(u);
+
+               } else {
+                       fprintf(stderr, Name ": (imsm) Operation "
+                               "is not allowed on this container\n");
+               }
+       } else {
+               /* On volume level we support following operations
+                * - takeover: raid10 -> raid0; raid0 -> raid10
+                * - chunk size migration
+                * - migration: raid5 -> raid0; raid0 -> raid5
+                */
+               struct intel_super *super = st->sb;
+               struct intel_dev *dev = super->devlist;
+               int change, devnum;
+               dprintf("imsm: info: Volume operation\n");
+               /* find requested device */
+               while (dev) {
+                       imsm_find_array_minor_by_subdev(dev->index, st->container_dev, &devnum);
+                       if (devnum == geo.dev_id)
+                               break;
+                       dev = dev->next;
+               }
+               if (dev == NULL) {
+                       fprintf(stderr, Name " Cannot find %s (%i) subarray\n",
+                               geo.dev_name, geo.dev_id);
+                       goto exit_imsm_reshape_super;
+               }
+               super->current_vol = dev->index;
+               change = imsm_analyze_change(st, &geo);
+               switch (change) {
+               case CH_TAKEOVER:
+                       ret_val = imsm_takeover(st, &geo);
+                       break;
+               case CH_MIGRATION:
+                       ret_val = 0;
+                       break;
+               default:
+                       ret_val = 1;
+               }
+       }
+
+exit_imsm_reshape_super:
+       dprintf("imsm: reshape_super Exit code = %i\n", ret_val);
+       return ret_val;
+}
+
+static int imsm_manage_reshape(
+       int afd, struct mdinfo *sra, struct reshape *reshape,
+       struct supertype *st, unsigned long stripes,
+       int *fds, unsigned long long *offsets,
+       int dests, int *destfd, unsigned long long *destoffsets)
+{
+       /* Just use child_monitor for now */
+       return child_monitor(
+               afd, sra, reshape, st, stripes,
+               fds, offsets, dests, destfd, destoffsets);
+}
  #endif /* MDASSEMBLE */
  
  struct superswitch super_imsm = {
@@ -4932,14 +7382,24 @@ struct superswitch super_imsm = {
         .write_init_super = write_init_super_imsm,
         .validate_geometry = validate_geometry_imsm,
         .add_to_super   = add_to_super_imsm,
+       .remove_from_super = remove_from_super_imsm,
         .detail_platform = detail_platform_imsm,
+       .kill_subarray = kill_subarray_imsm,
+       .update_subarray = update_subarray_imsm,
+       .load_container = load_container_imsm,
+       .default_geometry = default_geometry_imsm,
+       .get_disk_controller_domain = imsm_get_disk_controller_domain,
+       .reshape_super  = imsm_reshape_super,
+       .manage_reshape = imsm_manage_reshape,
  #endif
         .match_home     = match_home_imsm,
         .uuid_from_super= uuid_from_super_imsm,
         .getinfo_super  = getinfo_super_imsm,
+       .getinfo_super_disks = getinfo_super_disks_imsm,
         .update_super   = update_super_imsm,
  
         .avail_size     = avail_size_imsm,
+       .min_acceptable_spare_size = min_acceptable_spare_size_imsm,
  
         .compare_super  = compare_super_imsm,
  
@@ -4949,7 +7409,6 @@ struct superswitch super_imsm = {
         .free_super     = free_super_imsm,
         .match_metadata_desc = match_metadata_desc_imsm,
         .container_content = container_content_imsm,
-       .default_layout = imsm_level_to_layout,
  
         .external       = 1,
         .name = "imsm",
@@ -4957,7 +7416,6 @@ struct superswitch super_imsm = {
  #ifndef MDASSEMBLE
  /* for mdmon */
         .open_new       = imsm_open_new,
-       .load_super     = load_super_imsm,
         .set_array_state= imsm_set_array_state,
         .set_disk       = imsm_set_disk,
         .sync_metadata  = imsm_sync_metadata,