]> git.ipfire.org Git - thirdparty/mdadm.git/blame - Manage.c
Add support for "--re-add missing"
[thirdparty/mdadm.git] / Manage.c
CommitLineData
64c4757e 1/*
9a9dab36 2 * mdadm - manage Linux "md" devices aka RAID arrays.
64c4757e 3 *
e736b623 4 * Copyright (C) 2001-2009 Neil Brown <neilb@suse.de>
64c4757e
NB
5 *
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
11 *
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 *
21 * Author: Neil Brown
e736b623 22 * Email: <neilb@suse.de>
64c4757e
NB
23 */
24
9a9dab36 25#include "mdadm.h"
682c7051
NB
26#include "md_u.h"
27#include "md_p.h"
4ccad7b1 28#include <ctype.h>
64c4757e 29
82b27616
NB
30#define REGISTER_DEV _IO (MD_MAJOR, 1)
31#define START_MD _IO (MD_MAJOR, 2)
32#define STOP_MD _IO (MD_MAJOR, 3)
33
64c4757e
NB
34int Manage_ro(char *devname, int fd, int readonly)
35{
682c7051
NB
36 /* switch to readonly or rw
37 *
38 * requires >= 0.90.0
39 * first check that array is runing
40 * use RESTART_ARRAY_RW or STOP_ARRAY_RO
41 *
42 */
43 mdu_array_info_t array;
0e600426 44#ifndef MDASSEMBLE
e9dd1598 45 struct mdinfo *mdi;
0e600426 46#endif
aba69144 47
682c7051
NB
48 if (md_get_version(fd) < 9000) {
49 fprintf(stderr, Name ": need md driver version 0.90.0 or later\n");
50 return 1;
51 }
0e600426 52#ifndef MDASSEMBLE
e9dd1598
N
53 /* If this is an externally-manage array, we need to modify the
54 * metadata_version so that mdmon doesn't undo our change.
55 */
56 mdi = sysfs_read(fd, -1, GET_LEVEL|GET_VERSION);
57 if (mdi &&
58 mdi->array.major_version == -1 &&
59 mdi->array.level > 0 &&
60 is_subarray(mdi->text_version)) {
61 char vers[64];
62 strcpy(vers, "external:");
63 strcat(vers, mdi->text_version);
64 if (readonly > 0) {
65 int rv;
66 /* We set readonly ourselves. */
67 vers[9] = '-';
68 sysfs_set_str(mdi, NULL, "metadata_version", vers);
69
70 close(fd);
71 rv = sysfs_set_str(mdi, NULL, "array_state", "readonly");
72
73 if (rv < 0) {
74 fprintf(stderr, Name ": failed to set readonly for %s: %s\n",
75 devname, strerror(errno));
76
77 vers[9] = mdi->text_version[0];
78 sysfs_set_str(mdi, NULL, "metadata_version", vers);
79 return 1;
80 }
81 } else {
82 char *cp;
83 /* We cannot set read/write - must signal mdmon */
84 vers[9] = '/';
85 sysfs_set_str(mdi, NULL, "metadata_version", vers);
86
87 cp = strchr(vers+10, '/');
88 if (*cp)
89 *cp = 0;
90 ping_monitor(vers+10);
91 }
92 return 0;
93 }
0e600426 94#endif
682c7051
NB
95 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
96 fprintf(stderr, Name ": %s does not appear to be active.\n",
97 devname);
98 return 1;
99 }
aba69144 100
682c7051
NB
101 if (readonly>0) {
102 if (ioctl(fd, STOP_ARRAY_RO, NULL)) {
103 fprintf(stderr, Name ": failed to set readonly for %s: %s\n",
104 devname, strerror(errno));
105 return 1;
106 }
107 } else if (readonly < 0) {
108 if (ioctl(fd, RESTART_ARRAY_RW, NULL)) {
82b27616 109 fprintf(stderr, Name ": failed to set writable for %s: %s\n",
682c7051
NB
110 devname, strerror(errno));
111 return 1;
112 }
113 }
aba69144 114 return 0;
64c4757e
NB
115}
116
435d4ebb
LB
117#ifndef MDASSEMBLE
118
4ccad7b1
N
static void remove_devices(int devnum, char *path)
{
	/* Remove all 'standard' devices for 'devnum', including
	 * partitions.  Also remove names at 'path' - possibly with
	 * partition suffixes - which link to those names.
	 *
	 * devnum >= 0 selects /dev/mdN, devnum < 0 selects
	 * /dev/md_dN with N = -1-devnum.
	 * 'path' may be NULL, in which case only the standard names
	 * are removed.
	 */
	char base[40];
	char *path2 = NULL;
	char link[1024];
	int n;
	int part;
	char *be;
	char *pe = NULL;

	if (devnum >= 0)
		sprintf(base, "/dev/md%d", devnum);
	else
		sprintf(base, "/dev/md_d%d", -1-devnum);
	be = base + strlen(base);

	if (path) {
		/* room for the partition suffix appended below */
		path2 = malloc(strlen(path)+20);
		if (path2) {
			strcpy(path2, path);
			pe = path2 + strlen(path2);
		} else
			/* out of memory: still remove the standard
			 * names, just skip the links at 'path'
			 */
			path = NULL;
	}

	for (part = 0; part < 16; part++) {
		if (part) {
			sprintf(be, "p%d", part);
			if (path) {
				/* a name ending in a digit gets a 'p'
				 * separator before the partition number.
				 * Guard against an empty 'path' so that
				 * pe[-1] never reads before the buffer.
				 */
				if (pe > path2 &&
				    isdigit((unsigned char)pe[-1]))
					sprintf(pe, "p%d", part);
				else
					sprintf(pe, "%d", part);
			}
		}
		/* FIXME test if really is md device ?? */
		unlink(base);
		if (path) {
			/* only remove the name if it is a symlink whose
			 * target is exactly 'base'.  readlink() returns
			 * -1 on error and does not NUL-terminate.
			 */
			n = readlink(path2, link, sizeof(link));
			if (n > 0 && strlen(base) == (size_t)n &&
			    strncmp(link, base, n) == 0)
				unlink(path2);
		}
	}
	free(path2);
}
166
167
91f068bf 168int Manage_runstop(char *devname, int fd, int runstop, int quiet)
64c4757e 169{
682c7051
NB
170 /* Run or stop the array. array must already be configured
171 * required >= 0.90.0
4b9d39fc
N
172 * Only print failure messages if quiet == 0;
173 * quiet > 0 means really be quiet
174 * quiet < 0 means we will try again if it fails.
682c7051 175 */
682c7051 176 mdu_param_t param; /* unused */
82b27616
NB
177
178 if (runstop == -1 && md_get_version(fd) < 9000) {
179 if (ioctl(fd, STOP_MD, 0)) {
4b9d39fc
N
180 if (quiet == 0) fprintf(stderr,
181 Name ": stopping device %s "
182 "failed: %s\n",
183 devname, strerror(errno));
82b27616
NB
184 return 1;
185 }
186 }
aba69144 187
682c7051
NB
188 if (md_get_version(fd) < 9000) {
189 fprintf(stderr, Name ": need md driver version 0.90.0 or later\n");
190 return 1;
191 }
82b27616 192 /*
682c7051
NB
193 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
194 fprintf(stderr, Name ": %s does not appear to be active.\n",
195 devname);
196 return 1;
197 }
82b27616 198 */
682c7051
NB
199 if (runstop>0) {
200 if (ioctl(fd, RUN_ARRAY, &param)) {
201 fprintf(stderr, Name ": failed to run array %s: %s\n",
202 devname, strerror(errno));
203 return 1;
204 }
8382f19b
NB
205 if (quiet <= 0)
206 fprintf(stderr, Name ": started %s\n", devname);
682c7051 207 } else if (runstop < 0){
8382f19b
NB
208 struct map_ent *map = NULL;
209 struct stat stb;
daf7a3ce 210 struct mdinfo *mdi;
4ccad7b1 211 int devnum;
daf7a3ce
NB
212 /* If this is an mdmon managed array, just write 'inactive'
213 * to the array state and let mdmon clear up.
214 */
4ccad7b1 215 devnum = fd2devnum(fd);
daf7a3ce
NB
216 mdi = sysfs_read(fd, -1, GET_LEVEL|GET_VERSION);
217 if (mdi &&
218 mdi->array.level > 0 &&
3c558363 219 is_subarray(mdi->text_version)) {
daf7a3ce
NB
220 /* This is mdmon managed. */
221 close(fd);
222 if (sysfs_set_str(mdi, NULL,
223 "array_state", "inactive") < 0) {
4b9d39fc 224 if (quiet == 0)
daf7a3ce 225 fprintf(stderr, Name
4b9d39fc 226 ": failed to stop array %s: %s\n",
daf7a3ce
NB
227 devname, strerror(errno));
228 return 1;
229 }
230
231 /* Give monitor a chance to act */
c94709e8 232 ping_monitor(mdi->text_version);
daf7a3ce
NB
233
234 fd = open(devname, O_RDONLY);
ada6c239
N
235 } else if (mdi &&
236 mdi->array.major_version == -1 &&
237 mdi->array.minor_version == -2 &&
3c558363 238 !is_subarray(mdi->text_version)) {
430ea469 239 struct mdstat_ent *mds, *m;
ada6c239
N
240 /* container, possibly mdmon-managed.
241 * Make sure mdmon isn't opening it, which
242 * would interfere with the 'stop'
243 */
244 ping_monitor(mdi->sys_name);
430ea469
N
245
246 /* now check that there are no existing arrays
247 * which are members of this array
248 */
249 mds = mdstat_read(0, 0);
250 for (m=mds; m; m=m->next)
251 if (m->metadata_version &&
252 strncmp(m->metadata_version, "external:", 9)==0 &&
253 is_subarray(m->metadata_version+9) &&
254 devname2devnum(m->metadata_version+10) == devnum) {
255 if (!quiet)
256 fprintf(stderr, Name
257 ": Cannot stop container %s: "
258 "member %s still active\n",
259 devname, m->dev);
260 free_mdstat(mds);
261 if (mdi)
262 sysfs_free(mdi);
263 return 1;
264 }
daf7a3ce 265 }
daf7a3ce
NB
266
267 if (fd >= 0 && ioctl(fd, STOP_ARRAY, NULL)) {
37ea3936 268 if (quiet == 0) {
daf7a3ce 269 fprintf(stderr, Name
4b9d39fc 270 ": failed to stop array %s: %s\n",
91f068bf 271 devname, strerror(errno));
d927f3c4
NB
272 if (errno == EBUSY)
273 fprintf(stderr, "Perhaps a running "
274 "process, mounted filesystem "
275 "or active volume group?\n");
276 }
97590376
N
277 if (mdi)
278 sysfs_free(mdi);
682c7051
NB
279 return 1;
280 }
97590376 281 /* prior to 2.6.28, KOBJ_CHANGE was not sent when an md array
d49410d3
N
282 * was stopped, so We'll do it here just to be sure. Drop any
283 * partitions as well...
97590376 284 */
d49410d3
N
285 if (fd >= 0)
286 ioctl(fd, BLKRRPART, 0);
97590376
N
287 if (mdi)
288 sysfs_uevent(mdi, "change");
daf7a3ce 289
4ccad7b1
N
290
291 if (devnum != NoMdDev &&
292 (stat("/dev/.udev", &stb) != 0 ||
293 check_env("MDADM_NO_UDEV"))) {
294 struct map_ent *mp = map_by_devnum(&map, devnum);
295 remove_devices(devnum, mp ? mp->path : NULL);
296 }
297
298
ab56093f
NB
299 if (quiet <= 0)
300 fprintf(stderr, Name ": stopped %s\n", devname);
4eb26970
DW
301 map_lock(&map);
302 map_remove(&map, devnum);
303 map_unlock(&map);
682c7051
NB
304 }
305 return 0;
64c4757e
NB
306}
307
dd0781e5
NB
308int Manage_resize(char *devname, int fd, long long size, int raid_disks)
309{
310 mdu_array_info_t info;
311 if (ioctl(fd, GET_ARRAY_INFO, &info) != 0) {
312 fprintf(stderr, Name ": Cannot get array information for %s: %s\n",
313 devname, strerror(errno));
314 return 1;
315 }
316 if (size >= 0)
317 info.size = size;
318 if (raid_disks > 0)
319 info.raid_disks = raid_disks;
320 if (ioctl(fd, SET_ARRAY_INFO, &info) != 0) {
321 fprintf(stderr, Name ": Cannot set device size/shape for %s: %s\n",
322 devname, strerror(errno));
323 return 1;
324 }
325 return 0;
b5e64645 326}
dd0781e5 327
64c4757e 328int Manage_subdevs(char *devname, int fd,
dab6685f 329 mddev_dev_t devlist, int verbose)
cd29a5c8 330{
682c7051
NB
331 /* do something to each dev.
332 * devmode can be
333 * 'a' - add the device
334 * try HOT_ADD_DISK
335 * If that fails EINVAL, try ADD_NEW_DISK
336 * 'r' - remove the device HOT_REMOVE_DISK
b80da661
NB
337 * device can be 'faulty' or 'detached' in which case all
338 * matching devices are removed.
682c7051 339 * 'f' - set the device faulty SET_DISK_FAULTY
b80da661
NB
340 * device can be 'detached' in which case any device that
341 * is inaccessible will be marked faulty.
98d27e39
N
342 * For 'f' and 'r', the device can also be a kernel-internal
343 * name such as 'sdb'.
682c7051 344 */
a4e13010 345 mddev_dev_t add_devlist = NULL;
682c7051
NB
346 mdu_array_info_t array;
347 mdu_disk_info_t disc;
7a3be72f 348 unsigned long long array_size;
b80da661 349 mddev_dev_t dv, next = NULL;
682c7051 350 struct stat stb;
b80da661 351 int j, jnext = 0;
0fbf459d 352 int tfd;
3da92f27 353 struct supertype *st, *tst;
fe80f49b
NB
354 int duuid[4];
355 int ouuid[4];
f94d52f4 356 int lfd = -1;
98d27e39 357 int sysfd = -1;
682c7051
NB
358
359 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
360 fprintf(stderr, Name ": cannot get array info for %s\n",
361 devname);
362 return 1;
363 }
3da92f27 364
7a3be72f
NB
365 /* array.size is only 32 bit and may be truncated.
366 * So read from sysfs if possible, and record number of sectors
367 */
368
369 array_size = get_component_size(fd);
370 if (array_size <= 0)
371 array_size = array.size * 2;
372
1686dc25 373 tst = super_by_fd(fd);
3da92f27
NB
374 if (!tst) {
375 fprintf(stderr, Name ": unsupport array - version %d.%d\n",
376 array.major_version, array.minor_version);
377 return 1;
378 }
379
b3b4e8a7 380 stb.st_rdev = 0;
b80da661 381 for (dv = devlist, j=0 ; dv; dv = next, j = jnext) {
4a39c6f2 382 unsigned long long ldsize;
b80da661
NB
383 char dvname[20];
384 char *dnprintable = dv->devname;
a4e13010 385 char *add_dev = dv->devname;
f94d52f4 386 int err;
4a39c6f2 387
b80da661
NB
388 next = dv->next;
389 jnext = 0;
390
391 if (strcmp(dv->devname, "failed")==0 ||
392 strcmp(dv->devname, "faulty")==0) {
393 if (dv->disposition != 'r') {
394 fprintf(stderr, Name ": %s only meaningful "
395 "with -r, not -%c\n",
396 dv->devname, dv->disposition);
397 return 1;
398 }
399 for (; j < array.raid_disks + array.nr_disks ; j++) {
b3b4e8a7 400 int dev;
b80da661
NB
401 disc.number = j;
402 if (ioctl(fd, GET_DISK_INFO, &disc))
403 continue;
404 if (disc.major == 0 && disc.minor == 0)
405 continue;
406 if ((disc.state & 1) == 0) /* faulty */
407 continue;
b3b4e8a7
N
408 dev = makedev(disc.major, disc.minor);
409 if (stb.st_rdev == dev)
410 /* already did that one */
411 continue;
412 stb.st_rdev = dev;
b80da661 413 next = dv;
b3b4e8a7
N
414 /* same slot again next time - things might
415 * have reshuffled */
416 jnext = j;
b80da661
NB
417 sprintf(dvname,"%d:%d", disc.major, disc.minor);
418 dnprintable = dvname;
419 break;
420 }
421 if (jnext == 0)
422 continue;
423 } else if (strcmp(dv->devname, "detached") == 0) {
424 if (dv->disposition != 'r' && dv->disposition != 'f') {
425 fprintf(stderr, Name ": %s only meaningful "
426 "with -r of -f, not -%c\n",
427 dv->devname, dv->disposition);
428 return 1;
429 }
430 for (; j < array.raid_disks + array.nr_disks; j++) {
431 int sfd;
b3b4e8a7 432 int dev;
b80da661
NB
433 disc.number = j;
434 if (ioctl(fd, GET_DISK_INFO, &disc))
435 continue;
436 if (disc.major == 0 && disc.minor == 0)
437 continue;
438 sprintf(dvname,"%d:%d", disc.major, disc.minor);
439 sfd = dev_open(dvname, O_RDONLY);
440 if (sfd >= 0) {
441 close(sfd);
442 continue;
443 }
444 if (dv->disposition == 'f' &&
445 (disc.state & 1) == 1) /* already faulty */
446 continue;
447 if (errno != ENXIO)
448 continue;
b3b4e8a7
N
449 dev = makedev(disc.major, disc.minor);
450 if (stb.st_rdev == dev)
451 /* already did that one */
452 continue;
453 stb.st_rdev = dev;
b80da661 454 next = dv;
b3b4e8a7
N
455 /* same slot again next time - things might
456 * have reshuffled */
457 jnext = j;
b80da661
NB
458 dnprintable = dvname;
459 break;
460 }
461 if (jnext == 0)
462 continue;
a4e13010
N
463 } else if (strcmp(dv->devname, "missing") == 0) {
464 if (dv->disposition != 'a' || dv->re_add == 0) {
465 fprintf(stderr, Name ": 'missing' only meaningful "
466 "with --re-add\n");
467 return 1;
468 }
469 if (add_devlist == NULL)
470 add_devlist = conf_get_devs();
471 if (add_devlist == NULL) {
472 fprintf(stderr, Name ": no devices to scan for missing members.");
473 continue;
474 }
475 add_dev = add_devlist->devname;
476 add_devlist = add_devlist->next;
477 if (add_devlist != NULL)
478 next = dv;
479 if (stat(add_dev, &stb) < 0)
480 continue;
98d27e39
N
481 } else if (strchr(dv->devname, '/') == NULL &&
482 strlen(dv->devname) < 50) {
483 /* Assume this is a kernel-internal name like 'sda1' */
484 int found = 0;
485 char dname[55];
486 if (dv->disposition != 'r' && dv->disposition != 'f') {
487 fprintf(stderr, Name ": %s only meaningful "
488 "with -r of -f, not -%c\n",
489 dv->devname, dv->disposition);
490 return 1;
491 }
492
493 sprintf(dname, "dev-%s", dv->devname);
494 sysfd = sysfs_open(fd2devnum(fd), dname, "block/dev");
495 if (sysfd >= 0) {
496 char dn[20];
497 int mj,mn;
498 if (sysfs_fd_get_str(sysfd, dn, 20) > 0 &&
499 sscanf(dn, "%d:%d", &mj,&mn) == 2) {
500 stb.st_rdev = makedev(mj,mn);
501 found = 1;
502 }
503 close(sysfd);
504 sysfd = -1;
505 }
506 if (!found) {
507 sysfd = sysfs_open(fd2devnum(fd), dname, "state");
508 if (sysfd < 0) {
509 fprintf(stderr, Name ": %s does not appear "
510 "to be a component of %s\n",
511 dv->devname, devname);
512 return 1;
513 }
514 }
b80da661
NB
515 } else {
516 j = 0;
517
c7b47447 518 tfd = dev_open(dv->devname, O_RDONLY);
5a9de8db
N
519 if (tfd < 0 && dv->disposition == 'r' &&
520 lstat(dv->devname, &stb) == 0)
521 /* Be happy, the lstat worked, that is
522 * enough for --remove
523 */
524 ;
525 else {
526 if (tfd < 0 || fstat(tfd, &stb) != 0) {
527 fprintf(stderr, Name ": cannot find %s: %s\n",
528 dv->devname, strerror(errno));
529 if (tfd >= 0)
530 close(tfd);
531 return 1;
532 }
533 close(tfd);
b80da661
NB
534 }
535 if ((stb.st_mode & S_IFMT) != S_IFBLK) {
536 fprintf(stderr, Name ": %s is not a "
537 "block device.\n",
538 dv->devname);
539 return 1;
540 }
682c7051 541 }
cd29a5c8 542 switch(dv->disposition){
682c7051 543 default:
c913b90e
NB
544 fprintf(stderr, Name ": internal error - devmode[%s]=%d\n",
545 dv->devname, dv->disposition);
682c7051
NB
546 return 1;
547 case 'a':
4a39c6f2 548 /* add the device */
f7e7067b 549 if (tst->subarray[0]) {
f7dd881f
DW
550 fprintf(stderr, Name ": Cannot add disks to a"
551 " \'member\' array, perform this"
552 " operation on the parent container\n");
553 return 1;
f94d52f4 554 }
f277ce36 555 /* Make sure it isn't in use (in 2.6 or later) */
a4e13010
N
556 tfd = dev_open(add_dev, O_RDONLY|O_EXCL|O_DIRECT);
557 if (tfd < 0 && add_dev != dv->devname)
558 continue;
0fbf459d 559 if (tfd < 0) {
d7eaf49f
NB
560 fprintf(stderr, Name ": Cannot open %s: %s\n",
561 dv->devname, strerror(errno));
562 return 1;
563 }
3da92f27 564
1686dc25 565 st = dup_super(tst);
3da92f27 566
fe80f49b 567 if (array.not_persistent==0)
3da92f27
NB
568 st->ss->load_super(st, tfd, NULL);
569
a4e13010
N
570 if (add_dev == dv->devname) {
571 if (!get_dev_size(tfd, dv->devname, &ldsize)) {
572 close(tfd);
573 return 1;
574 }
575 } else if (!get_dev_size(tfd, NULL, &ldsize)) {
4a39c6f2 576 close(tfd);
a4e13010 577 continue;
4a39c6f2 578 }
f94d52f4
NB
579
580 if (!tst->ss->external &&
581 array.major_version == 0 &&
60d9a174 582 md_get_version(fd)%100 < 2) {
a4e13010 583 close(tfd);
892debc8
NB
584 if (ioctl(fd, HOT_ADD_DISK,
585 (unsigned long)stb.st_rdev)==0) {
dab6685f
NB
586 if (verbose >= 0)
587 fprintf(stderr, Name ": hot added %s\n",
a4e13010 588 add_dev);
892debc8
NB
589 continue;
590 }
591
cd29a5c8 592 fprintf(stderr, Name ": hot add failed for %s: %s\n",
a4e13010 593 add_dev, strerror(errno));
cd29a5c8
NB
594 return 1;
595 }
892debc8 596
43dad3d6 597 if (array.not_persistent == 0 || tst->ss->external) {
4a39c6f2 598
fe80f49b 599 /* need to find a sample superblock to copy, and
43dad3d6
DW
600 * a spare slot to use.
601 * For 'external' array (well, container based),
602 * We can just load the metadata for the array.
fe80f49b 603 */
a4e13010
N
604 if (tst->sb)
605 /* already loaded */;
606 else if (tst->ss->external) {
43dad3d6
DW
607 tst->ss->load_super(tst, fd, NULL);
608 } else for (j = 0; j < tst->max_devs; j++) {
fe80f49b
NB
609 char *dev;
610 int dfd;
611 disc.number = j;
612 if (ioctl(fd, GET_DISK_INFO, &disc))
613 continue;
614 if (disc.major==0 && disc.minor==0)
615 continue;
616 if ((disc.state & 4)==0) continue; /* sync */
617 /* Looks like a good device to try */
16c6fa80 618 dev = map_dev(disc.major, disc.minor, 1);
fe80f49b 619 if (!dev) continue;
16c6fa80 620 dfd = dev_open(dev, O_RDONLY);
fe80f49b 621 if (dfd < 0) continue;
3da92f27
NB
622 if (tst->ss->load_super(tst, dfd,
623 NULL)) {
fe80f49b
NB
624 close(dfd);
625 continue;
626 }
892debc8 627 close(dfd);
fe80f49b
NB
628 break;
629 }
43dad3d6 630 /* FIXME this is a bad test to be using */
3da92f27 631 if (!tst->sb) {
a4e13010 632 close(tfd);
fe80f49b
NB
633 fprintf(stderr, Name ": cannot find valid superblock in this array - HELP\n");
634 return 1;
635 }
2a528478
N
636
637 /* Make sure device is large enough */
638 if (tst->ss->avail_size(tst, ldsize/512) <
639 array_size) {
a4e13010
N
640 close(tfd);
641 if (add_dev != dv->devname)
642 continue;
2a528478
N
643 fprintf(stderr, Name ": %s not large enough to join array\n",
644 dv->devname);
645 return 1;
646 }
647
fe80f49b
NB
648 /* Possibly this device was recently part of the array
649 * and was temporarily removed, and is now being re-added.
650 * If so, we can simply re-add it.
651 */
3da92f27 652 tst->ss->uuid_from_super(tst, duuid);
7eae7080
NB
653
654 /* re-add doesn't work for version-1 superblocks
655 * before 2.6.18 :-(
656 */
657 if (array.major_version == 1 &&
658 get_linux_version() <= 2006018)
659 ;
3da92f27
NB
660 else if (st->sb) {
661 st->ss->uuid_from_super(st, ouuid);
fe80f49b 662 if (memcmp(duuid, ouuid, sizeof(ouuid))==0) {
4d20d744
NB
663 /* looks close enough for now. Kernel
664 * will worry about whether a bitmap
665 * based reconstruction is possible.
fe80f49b
NB
666 */
667 struct mdinfo mdi;
3da92f27 668 st->ss->getinfo_super(st, &mdi);
fe80f49b
NB
669 disc.major = major(stb.st_rdev);
670 disc.minor = minor(stb.st_rdev);
671 disc.number = mdi.disk.number;
672 disc.raid_disk = mdi.disk.raid_disk;
673 disc.state = mdi.disk.state;
b3d31955 674 if (dv->writemostly == 1)
4d20d744 675 disc.state |= 1 << MD_DISK_WRITEMOSTLY;
b3d31955
N
676 if (dv->writemostly == 2)
677 disc.state &= ~(1 << MD_DISK_WRITEMOSTLY);
a4e13010
N
678 remove_partitions(tfd);
679 close(tfd);
680 tfd = -1;
5c64fcb5
N
681 /* don't even try if disk is marked as faulty */
682 errno = 0;
683 if ((disc.state & 1) == 0 &&
684 ioctl(fd, ADD_NEW_DISK, &disc) == 0) {
fe80f49b 685 if (verbose >= 0)
a4e13010 686 fprintf(stderr, Name ": re-added %s\n", add_dev);
308e1801 687 continue;
fe80f49b 688 }
c9f39c1b 689 if (errno == ENOMEM || errno == EROFS) {
a4e13010 690 close(tfd);
c9f39c1b 691 fprintf(stderr, Name ": add new device failed for %s: %s\n",
a4e13010
N
692 add_dev, strerror(errno));
693 if (add_dev != dv->devname)
694 continue;
c9f39c1b
N
695 return 1;
696 }
fe80f49b
NB
697 /* fall back on normal-add */
698 }
892debc8 699 }
a4e13010
N
700 if (add_dev != dv->devname) {
701 if (verbose > 0)
702 fprintf(stderr, Name
703 ": --re-add for %s to %s is not possible\n",
704 add_dev, devname);
705 if (tfd >= 0)
706 close(tfd);
707 continue;
708 }
751fd6c0 709 if (dv->re_add) {
a4e13010
N
710 if (tfd >= 0)
711 close(tfd);
751fd6c0
N
712 fprintf(stderr, Name
713 ": --re-add for %s to %s is not possible\n",
714 dv->devname, devname);
715 return 1;
716 }
4a39c6f2
NB
717 } else {
718 /* non-persistent. Must ensure that new drive
719 * is at least array.size big.
720 */
7a3be72f 721 if (ldsize/512 < array_size) {
4a39c6f2
NB
722 fprintf(stderr, Name ": %s not large enough to join array\n",
723 dv->devname);
724 return 1;
725 }
892debc8 726 }
a4e13010
N
727 /* committed to really trying this device now*/
728 if (tfd >= 0) {
729 remove_partitions(tfd);
730 close(tfd);
731 }
7eae7080
NB
732 /* in 2.6.17 and earlier, version-1 superblocks won't
733 * use the number we write, but will choose a free number.
734 * we must choose the same free number, which requires
735 * starting at 'raid_disks' and counting up
736 */
3da92f27 737 for (j = array.raid_disks; j< tst->max_devs; j++) {
aa88f531 738 disc.number = j;
682c7051
NB
739 if (ioctl(fd, GET_DISK_INFO, &disc))
740 break;
741 if (disc.major==0 && disc.minor==0)
742 break;
743 if (disc.state & 8) /* removed */
744 break;
745 }
0df46c2a
NB
746 disc.major = major(stb.st_rdev);
747 disc.minor = minor(stb.st_rdev);
892debc8
NB
748 disc.number =j;
749 disc.state = 0;
43dad3d6 750 if (array.not_persistent==0 || tst->ss->external) {
111d01fc 751 int dfd;
b3d31955 752 if (dv->writemostly == 1)
fe80f49b 753 disc.state |= 1 << MD_DISK_WRITEMOSTLY;
3b435195 754 dfd = dev_open(dv->devname, O_RDWR | O_EXCL|O_DIRECT);
f20c3968
DW
755 if (tst->ss->add_to_super(tst, &disc, dfd,
756 dv->devname)) {
f20c3968
DW
757 close(dfd);
758 return 1;
759 }
111d01fc 760 /* write_init_super will close 'dfd' */
43dad3d6
DW
761 if (tst->ss->external)
762 /* mdmon will write the metadata */
763 close(dfd);
764 else if (tst->ss->write_init_super(tst))
fe80f49b
NB
765 return 1;
766 } else if (dv->re_add) {
767 /* this had better be raid1.
768 * As we are "--re-add"ing we must find a spare slot
769 * to fill.
770 */
771 char *used = malloc(array.raid_disks);
772 memset(used, 0, array.raid_disks);
3da92f27 773 for (j=0; j< tst->max_devs; j++) {
fe80f49b
NB
774 mdu_disk_info_t disc2;
775 disc2.number = j;
776 if (ioctl(fd, GET_DISK_INFO, &disc2))
777 continue;
778 if (disc2.major==0 && disc2.minor==0)
779 continue;
780 if (disc2.state & 8) /* removed */
781 continue;
782 if (disc2.raid_disk < 0)
783 continue;
784 if (disc2.raid_disk > array.raid_disks)
785 continue;
786 used[disc2.raid_disk] = 1;
787 }
788 for (j=0 ; j<array.raid_disks; j++)
789 if (!used[j]) {
790 disc.raid_disk = j;
791 disc.state |= (1<<MD_DISK_SYNC);
792 break;
793 }
0eb26465 794 free(used);
fe80f49b 795 }
b3d31955 796 if (dv->writemostly == 1)
d8def61c 797 disc.state |= (1 << MD_DISK_WRITEMOSTLY);
43dad3d6
DW
798 if (tst->ss->external) {
799 /* add a disk to an external metadata container
800 * only if mdmon is around to see it
801 */
802 struct mdinfo new_mdi;
803 struct mdinfo *sra;
804 int container_fd;
805 int devnum = fd2devnum(fd);
806
807 container_fd = open_dev_excl(devnum);
808 if (container_fd < 0) {
809 fprintf(stderr, Name ": add failed for %s:"
810 " could not get exclusive access to container\n",
811 dv->devname);
812 return 1;
813 }
814
815 if (!mdmon_running(devnum)) {
816 fprintf(stderr, Name ": add failed for %s: mdmon not running\n",
817 dv->devname);
818 close(container_fd);
819 return 1;
820 }
821
822 sra = sysfs_read(container_fd, -1, 0);
823 if (!sra) {
824 fprintf(stderr, Name ": add failed for %s: sysfs_read failed\n",
825 dv->devname);
826 close(container_fd);
827 return 1;
828 }
829 sra->array.level = LEVEL_CONTAINER;
830 /* Need to set data_offset and component_size */
831 tst->ss->getinfo_super(tst, &new_mdi);
832 new_mdi.disk.major = disc.major;
833 new_mdi.disk.minor = disc.minor;
d23534e4 834 new_mdi.recovery_start = 0;
462906cd 835 if (sysfs_add_disk(sra, &new_mdi, 0) != 0) {
43dad3d6
DW
836 fprintf(stderr, Name ": add new device to external metadata"
837 " failed for %s\n", dv->devname);
838 close(container_fd);
839 return 1;
840 }
841 ping_monitor(devnum2devname(devnum));
842 sysfs_free(sra);
843 close(container_fd);
844 } else if (ioctl(fd, ADD_NEW_DISK, &disc)) {
f277ce36
NB
845 fprintf(stderr, Name ": add new device failed for %s as %d: %s\n",
846 dv->devname, j, strerror(errno));
682c7051
NB
847 return 1;
848 }
dab6685f
NB
849 if (verbose >= 0)
850 fprintf(stderr, Name ": added %s\n", dv->devname);
682c7051
NB
851 break;
852
853 case 'r':
854 /* hot remove */
f7e7067b 855 if (tst->subarray[0]) {
f7dd881f
DW
856 fprintf(stderr, Name ": Cannot remove disks from a"
857 " \'member\' array, perform this"
858 " operation on the parent container\n");
98d27e39
N
859 if (sysfd >= 0)
860 close(sysfd);
f7dd881f 861 return 1;
f94d52f4
NB
862 }
863 if (tst->ss->external) {
864 /* To remove a device from a container, we must
865 * check that it isn't in use in an array.
866 * This involves looking in the 'holders'
867 * directory - there must be just one entry,
868 * the container.
869 * To ensure that it doesn't get used as a
870 * hold spare while we are checking, we
871 * get an O_EXCL open on the container
872 */
873 int dnum = fd2devnum(fd);
874 lfd = open_dev_excl(dnum);
875 if (lfd < 0) {
876 fprintf(stderr, Name
877 ": Cannot get exclusive access "
878 " to container - odd\n");
98d27e39
N
879 if (sysfd >= 0)
880 close(sysfd);
f94d52f4
NB
881 return 1;
882 }
85f9b5f7
DW
883 /* in the detached case it is not possible to
884 * check if we are the unique holder, so just
885 * rely on the 'detached' checks
886 */
887 if (strcmp(dv->devname, "detached") == 0 ||
98d27e39 888 sysfd >= 0 ||
85f9b5f7
DW
889 sysfs_unique_holder(dnum, stb.st_rdev))
890 /* pass */;
891 else {
f94d52f4
NB
892 fprintf(stderr, Name
893 ": %s is %s, cannot remove.\n",
894 dnprintable,
895 errno == EEXIST ? "still in use":
896 "not a member");
897 close(lfd);
898 return 1;
899 }
900 }
82b27616 901 /* FIXME check that it is a current member */
98d27e39
N
902 if (sysfd >= 0) {
903 /* device has been removed and we don't know
904 * the major:minor number
905 */
906 int n = write(sysfd, "remove", 6);
907 if (n != 6)
f94d52f4 908 err = -1;
98d27e39
N
909 else
910 err = 0;
911 close(sysfd);
912 sysfd = -1;
913 } else {
914 err = ioctl(fd, HOT_REMOVE_DISK, (unsigned long)stb.st_rdev);
915 if (err && errno == ENODEV) {
916 /* Old kernels rejected this if no personality
917 * registered */
918 struct mdinfo *sra = sysfs_read(fd, 0, GET_DEVS);
919 struct mdinfo *dv = NULL;
920 if (sra)
921 dv = sra->devs;
922 for ( ; dv ; dv=dv->next)
923 if (dv->disk.major == major(stb.st_rdev) &&
924 dv->disk.minor == minor(stb.st_rdev))
925 break;
926 if (dv)
927 err = sysfs_set_str(sra, dv,
928 "state", "remove");
929 else
930 err = -1;
931 if (sra)
932 sysfs_free(sra);
933 }
f94d52f4
NB
934 }
935 if (err) {
b80da661
NB
936 fprintf(stderr, Name ": hot remove failed "
937 "for %s: %s\n", dnprintable,
938 strerror(errno));
f94d52f4
NB
939 if (lfd >= 0)
940 close(lfd);
682c7051
NB
941 return 1;
942 }
313a4a82
DW
943 if (tst->ss->external) {
944 /*
945 * Before dropping our exclusive open we make an
946 * attempt at preventing mdmon from seeing an
947 * 'add' event before reconciling this 'remove'
948 * event.
949 */
950 char *name = devnum2devname(fd2devnum(fd));
951
952 if (!name) {
953 fprintf(stderr, Name ": unable to get container name\n");
954 return 1;
955 }
956
957 ping_manager(name);
958 free(name);
959 }
98d27e39
N
960 if (lfd >= 0)
961 close(lfd);
dab6685f 962 if (verbose >= 0)
29ba4804
N
963 fprintf(stderr, Name ": hot removed %s from %s\n",
964 dnprintable, devname);
682c7051
NB
965 break;
966
967 case 'f': /* set faulty */
968 /* FIXME check current member */
98d27e39
N
969 if ((sysfd >= 0 && write(sysfd, "faulty", 6) != 6) ||
970 (sysfd < 0 && ioctl(fd, SET_DISK_FAULTY,
971 (unsigned long) stb.st_rdev))) {
b83d95f3 972 fprintf(stderr, Name ": set device faulty failed for %s: %s\n",
b80da661 973 dnprintable, strerror(errno));
98d27e39
N
974 if (sysfd >= 0)
975 close(sysfd);
682c7051
NB
976 return 1;
977 }
98d27e39
N
978 if (sysfd >= 0)
979 close(sysfd);
980 sysfd = -1;
dab6685f
NB
981 if (verbose >= 0)
982 fprintf(stderr, Name ": set %s faulty in %s\n",
b80da661 983 dnprintable, devname);
682c7051
NB
984 break;
985 }
986 }
987 return 0;
aba69144 988
64c4757e 989}
1f48664b
NB
990
991int autodetect(void)
992{
993 /* Open any md device, and issue the RAID_AUTORUN ioctl */
994 int rv = 1;
995 int fd = dev_open("9:0", O_RDONLY);
996 if (fd >= 0) {
997 if (ioctl(fd, RAID_AUTORUN, 0) == 0)
998 rv = 0;
999 close(fd);
1000 }
1001 return rv;
1002}
435d4ebb 1003#endif