On Thu, 13 Jan 2011 16:32:52 +0100 Krzysztof Wojcik <krzysztof.wojcik@xxxxxxxxx> wrote: > The patch introduces takeover from level 10 to level 0 for imsm > metadata. This patch contains procedures connected with preparing > and applying metadata update during 10 -> 0 takeover. > When performing takeover 10->0 mdmon should update the external > metadata (due to disk slot and level changes). > To achieve that mdadm calls reshape_super() and prepares > the "update_takeover" metadata update type. > Prepared update is processed by mdmon in process_update(). You are using sysfs_read inside super-intel again. That is the wrong thing to do for the same reasons as last time. And I'm not very comfortable about sending a list of devices to delete from mdadm to mdmon. I would think that mdadm would simply fail/remove the devices from the array, then tell mdmon to update the metadata. It would see which ones are still working and construct the RAID0 out of those. NeilBrown > > Signed-off-by: Krzysztof Wojcik <krzysztof.wojcik@xxxxxxxxx> > --- > Grow.c | 1 > super-intel.c | 126 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++ > 2 files changed, 126 insertions(+), 1 deletions(-) > > diff --git a/Grow.c b/Grow.c > index c0f9419..e1ec01c 100644 > --- a/Grow.c > +++ b/Grow.c > @@ -1463,6 +1463,7 @@ int Grow_reshape(char *devname, int fd, int quiet, char *backup_file, > rv = 1; > goto release; > } > + ping_monitor(container); > } > > info.array = array; > diff --git a/super-intel.c b/super-intel.c > index c12ba74..7d2d777 100644 > --- a/super-intel.c > +++ b/super-intel.c > @@ -299,6 +299,7 @@ enum imsm_update_type { > update_rename_array, > update_add_remove_disk, > update_reshape_container_disks, > + update_takeover > }; > > struct imsm_update_activate_spare { > @@ -319,6 +320,17 @@ struct geo_params { > int raid_disks; > }; > > +#define TAKEOVER_DISKS 2 > +enum takeover_direction { > + R10_TO_R0, > + R0_TO_R10 > +}; > +struct imsm_update_takeover { > + enum 
imsm_update_type type; > + int subarray; > + enum takeover_direction direction; > + int disks[TAKEOVER_DISKS]; > +}; > > struct imsm_update_reshape { > enum imsm_update_type type; > @@ -5793,6 +5805,56 @@ update_reshape_exit: > return ret_val; > } > > +static int apply_takeover_update(struct imsm_update_takeover *u, > + struct intel_super *super) > +{ > + struct imsm_dev *dev = NULL; > + struct imsm_map *map; > + struct dl *dm, *du; > + int *tab; > + int i; > + > + dev = get_imsm_dev(super, u->subarray); > + > + if (dev == NULL) > + return 0; > + > + map = get_imsm_map(dev, 0); > + tab = (int *)&map->disk_ord_tbl; > + > + if (u->direction == R10_TO_R0) { > + /* iterate through devices to mark removed disks as spare */ > + for (i = 0; i < TAKEOVER_DISKS; i++) { > + for (dm = super->disks; dm; dm = dm->next) { > + if (((unsigned int)dm->major != major(u->disks[i])) || > + ((unsigned int)dm->minor != minor(u->disks[i]))) > + continue; > + for (du = super->disks; du; du = du->next) > + if ((du->index > dm->index) && (du->index > 0)) > + du->index--; > + dm->disk.status = SPARE_DISK; > + dm->index = -1; > + } > + } > + /* update disk order table */ > + i = 0; > + for (du = super->disks; du; du = du->next) { > + if (du->index >= 0) { > + tab[du->index] = i; > + i++; > + } > + } > + /* update map */ > + map->num_members = 2; > + map->map_state = IMSM_T_STATE_NORMAL; > + map->num_domains = 1; > + map->raid_level = 0; > + map->failed_disk_num = -1; > + } > + > + return 1; > +} > + > static void imsm_process_update(struct supertype *st, > struct metadata_update *update) > { > @@ -5835,6 +5897,13 @@ static void imsm_process_update(struct supertype *st, > mpb = super->anchor; > > switch (type) { > + case update_takeover: { > + struct imsm_update_takeover *u = (void *)update->buf; > + if (apply_takeover_update(u, super)) > + super->updates_pending++; > + break; > + } > + > case update_reshape_container_disks: { > struct imsm_update_reshape *u = (void *)update->buf; > if 
(apply_reshape_container_disks_update( > @@ -6682,6 +6751,61 @@ analyse_change_exit: > return change; > } > > +int imsm_takeover(struct supertype *st, struct geo_params *geo) > +{ > + struct intel_super *super = st->sb; > + struct imsm_update_takeover *u; > + struct mdinfo *info; > + struct mdinfo *newdi; > + struct dl *dl; > + int i, fd; > + int found = 0; > + char buf[PATH_MAX]; > + > + sprintf(buf, "/dev/md%i", geo->dev_id); > + fd = open(buf, O_RDONLY); > + if (!fd) { > + fprintf(stderr, Name "Cannot open %s", buf); > + return 1; > + } > + info = sysfs_read(fd, 0, GET_LEVEL|GET_VERSION|GET_DEVS|GET_STATE); > + if (!info) { > + fprintf(stderr, Name "Cannot load sysfs information for %s (%i)", > + geo->dev_name, geo->dev_id); > + return 1; > + } > + > + u = malloc(sizeof(struct imsm_update_takeover)); > + if (u == NULL) > + return 1; > + > + u->type = update_takeover; > + u->subarray = super->current_vol; > + > + /* 10->0 transition - mark disks to remove */ > + if (geo->level == 0) { > + u->direction = R10_TO_R0; > + i = 0; > + for (dl = super->disks; dl; dl = dl->next) { > + found = 0; > + for (newdi = info->devs; newdi; newdi = newdi->next) { > + if ((dl->major != newdi->disk.major) || > + (dl->minor != newdi->disk.minor) || > + (newdi->disk.raid_disk < 0)) > + continue; > + found = 1; > + break; > + } > + /* if disk not found, mark it for remove */ > + if ((found == 0) && (!(dl->disk.status & SPARE_DISK))) > + u->disks[i++] = makedev(dl->major, dl->minor); > + } > + } > + > + append_metadata_update(st, u, sizeof(struct imsm_update_takeover)); > + return 0; > +} > + > static int imsm_reshape_super(struct supertype *st, long long size, int level, > int layout, int chunksize, int raid_disks, > char *backup, char *dev, int verbose) > @@ -6763,7 +6887,7 @@ static int imsm_reshape_super(struct supertype *st, long long size, int level, > change = imsm_analyze_change(st, &geo); > switch (change) { > case CH_TAKEOVER: > - ret_val = 0; > + ret_val = imsm_takeover(st, 
&geo); > break; > case CH_CHUNK_MIGR: > ret_val = 0; -- To unsubscribe from this list: send the line "unsubscribe linux-raid" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html