]> git.ipfire.org Git - thirdparty/mdadm.git/blame - Manage.c
mdmon: Fix crash if /proc/mdstat lists 0.9 superblocks
[thirdparty/mdadm.git] / Manage.c
CommitLineData
64c4757e 1/*
9a9dab36 2 * mdadm - manage Linux "md" devices aka RAID arrays.
64c4757e 3 *
e736b623 4 * Copyright (C) 2001-2009 Neil Brown <neilb@suse.de>
64c4757e
NB
5 *
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
11 *
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 *
21 * Author: Neil Brown
e736b623 22 * Email: <neilb@suse.de>
64c4757e
NB
23 */
24
9a9dab36 25#include "mdadm.h"
682c7051
NB
26#include "md_u.h"
27#include "md_p.h"
4ccad7b1 28#include <ctype.h>
64c4757e 29
82b27616
NB
30#define REGISTER_DEV _IO (MD_MAJOR, 1)
31#define START_MD _IO (MD_MAJOR, 2)
32#define STOP_MD _IO (MD_MAJOR, 3)
33
64c4757e
NB
34int Manage_ro(char *devname, int fd, int readonly)
35{
682c7051
NB
36 /* switch to readonly or rw
37 *
38 * requires >= 0.90.0
39 * first check that array is runing
40 * use RESTART_ARRAY_RW or STOP_ARRAY_RO
41 *
42 */
43 mdu_array_info_t array;
0e600426 44#ifndef MDASSEMBLE
e9dd1598 45 struct mdinfo *mdi;
0e600426 46#endif
aba69144 47
682c7051
NB
48 if (md_get_version(fd) < 9000) {
49 fprintf(stderr, Name ": need md driver version 0.90.0 or later\n");
50 return 1;
51 }
0e600426 52#ifndef MDASSEMBLE
e9dd1598
N
53 /* If this is an externally-manage array, we need to modify the
54 * metadata_version so that mdmon doesn't undo our change.
55 */
56 mdi = sysfs_read(fd, -1, GET_LEVEL|GET_VERSION);
57 if (mdi &&
58 mdi->array.major_version == -1 &&
e9dd1598
N
59 is_subarray(mdi->text_version)) {
60 char vers[64];
61 strcpy(vers, "external:");
62 strcat(vers, mdi->text_version);
63 if (readonly > 0) {
64 int rv;
65 /* We set readonly ourselves. */
66 vers[9] = '-';
67 sysfs_set_str(mdi, NULL, "metadata_version", vers);
68
69 close(fd);
70 rv = sysfs_set_str(mdi, NULL, "array_state", "readonly");
71
72 if (rv < 0) {
73 fprintf(stderr, Name ": failed to set readonly for %s: %s\n",
74 devname, strerror(errno));
75
76 vers[9] = mdi->text_version[0];
77 sysfs_set_str(mdi, NULL, "metadata_version", vers);
78 return 1;
79 }
80 } else {
81 char *cp;
82 /* We cannot set read/write - must signal mdmon */
83 vers[9] = '/';
84 sysfs_set_str(mdi, NULL, "metadata_version", vers);
85
86 cp = strchr(vers+10, '/');
87 if (*cp)
88 *cp = 0;
89 ping_monitor(vers+10);
9ea5a252
DW
90 if (mdi->array.level <= 0)
91 sysfs_set_str(mdi, NULL, "array_state", "active");
e9dd1598
N
92 }
93 return 0;
94 }
0e600426 95#endif
682c7051
NB
96 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
97 fprintf(stderr, Name ": %s does not appear to be active.\n",
98 devname);
99 return 1;
100 }
aba69144 101
682c7051
NB
102 if (readonly>0) {
103 if (ioctl(fd, STOP_ARRAY_RO, NULL)) {
104 fprintf(stderr, Name ": failed to set readonly for %s: %s\n",
105 devname, strerror(errno));
106 return 1;
107 }
108 } else if (readonly < 0) {
109 if (ioctl(fd, RESTART_ARRAY_RW, NULL)) {
82b27616 110 fprintf(stderr, Name ": failed to set writable for %s: %s\n",
682c7051
NB
111 devname, strerror(errno));
112 return 1;
113 }
114 }
aba69144 115 return 0;
64c4757e
NB
116}
117
435d4ebb
LB
118#ifndef MDASSEMBLE
119
4ccad7b1
N
/*
 * remove_devices - unlink convenience names that point at an md device.
 *
 * devnum: md device number; >= 0 selects /dev/md<N>, a negative value
 *         selects the partitionable form /dev/md_d<-1-devnum>.
 * path:   the name to examine; NULL or "" means there is nothing to do.
 *
 * Removes 'path' and its partition variants 1..15 ("<path>N", or
 * "<path>pN" when path ends in a digit) when they are symbolic links
 * whose target is exactly the 'standard' name for devnum (with the
 * matching "pN" suffix).  These were probably created by mdadm when
 * the array was assembled.  Failures are silently ignored.
 */
static void remove_devices(int devnum, char *path)
{
	char base[40];
	char link[1024];
	char *path2;
	char *be;
	char *pe;
	int need_p;
	int part;

	/* An empty path has no last character to inspect, and would make
	 * the partition names below resolve relative to the cwd.
	 */
	if (!path || !*path)
		return;

	if (devnum >= 0)
		snprintf(base, sizeof(base), "/dev/md%d", devnum);
	else
		snprintf(base, sizeof(base), "/dev/md_d%d", -1-devnum);
	be = base + strlen(base);

	/* room for the path plus a "pNN" suffix */
	path2 = malloc(strlen(path)+20);
	if (!path2)
		return;
	strcpy(path2, path);
	pe = path2 + strlen(path2);

	/* A name ending in a digit needs a 'p' before the partition number.
	 * <ctype.h> functions require an unsigned char value.
	 */
	need_p = isdigit((unsigned char)pe[-1]);

	for (part = 0; part < 16; part++) {
		ssize_t n;

		if (part) {
			sprintf(be, "p%d", part);
			sprintf(pe, need_p ? "p%d" : "%d", part);
		}
		/* readlink() does not NUL-terminate, so compare by length */
		n = readlink(path2, link, sizeof(link));
		if (n > 0 && strlen(base) == (size_t)n &&
		    strncmp(link, base, (size_t)n) == 0)
			unlink(path2);
	}
	free(path2);
}
165
166
91f068bf 167int Manage_runstop(char *devname, int fd, int runstop, int quiet)
64c4757e 168{
682c7051
NB
169 /* Run or stop the array. array must already be configured
170 * required >= 0.90.0
4b9d39fc
N
171 * Only print failure messages if quiet == 0;
172 * quiet > 0 means really be quiet
173 * quiet < 0 means we will try again if it fails.
682c7051 174 */
682c7051 175 mdu_param_t param; /* unused */
82b27616
NB
176
177 if (runstop == -1 && md_get_version(fd) < 9000) {
178 if (ioctl(fd, STOP_MD, 0)) {
4b9d39fc
N
179 if (quiet == 0) fprintf(stderr,
180 Name ": stopping device %s "
181 "failed: %s\n",
182 devname, strerror(errno));
82b27616
NB
183 return 1;
184 }
185 }
aba69144 186
682c7051
NB
187 if (md_get_version(fd) < 9000) {
188 fprintf(stderr, Name ": need md driver version 0.90.0 or later\n");
189 return 1;
190 }
82b27616 191 /*
682c7051
NB
192 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
193 fprintf(stderr, Name ": %s does not appear to be active.\n",
194 devname);
195 return 1;
196 }
82b27616 197 */
682c7051
NB
198 if (runstop>0) {
199 if (ioctl(fd, RUN_ARRAY, &param)) {
200 fprintf(stderr, Name ": failed to run array %s: %s\n",
201 devname, strerror(errno));
202 return 1;
203 }
8382f19b
NB
204 if (quiet <= 0)
205 fprintf(stderr, Name ": started %s\n", devname);
682c7051 206 } else if (runstop < 0){
8382f19b
NB
207 struct map_ent *map = NULL;
208 struct stat stb;
daf7a3ce 209 struct mdinfo *mdi;
4ccad7b1 210 int devnum;
eb0af526
N
211 int err;
212 int count;
daf7a3ce
NB
213 /* If this is an mdmon managed array, just write 'inactive'
214 * to the array state and let mdmon clear up.
215 */
4ccad7b1 216 devnum = fd2devnum(fd);
eb0af526
N
217 /* Get EXCL access first. If this fails, then attempting
218 * to stop is probably a bad idea.
219 */
220 close(fd);
221 fd = open(devname, O_RDONLY|O_EXCL);
222 if (fd < 0 || fd2devnum(fd) != devnum) {
223 if (fd >= 0)
224 close(fd);
225 fprintf(stderr,
226 Name ": Cannot get exclusive access to %s:"
1ae42d9d
KW
227 "Perhaps a running "
228 "process, mounted filesystem "
229 "or active volume group?\n",
eb0af526
N
230 devname);
231 return 1;
232 }
daf7a3ce
NB
233 mdi = sysfs_read(fd, -1, GET_LEVEL|GET_VERSION);
234 if (mdi &&
235 mdi->array.level > 0 &&
3c558363 236 is_subarray(mdi->text_version)) {
1ae42d9d 237 int err;
daf7a3ce
NB
238 /* This is mdmon managed. */
239 close(fd);
1ae42d9d
KW
240
241 count = 25;
242 while (count &&
243 (err = sysfs_set_str(mdi, NULL,
244 "array_state",
245 "inactive")) < 0
246 && errno == EBUSY) {
247 usleep(200000);
248 count--;
249 }
250 if (err && !quiet) {
251 fprintf(stderr, Name
252 ": failed to stop array %s: %s\n",
253 devname, strerror(errno));
daf7a3ce
NB
254 return 1;
255 }
256
257 /* Give monitor a chance to act */
c94709e8 258 ping_monitor(mdi->text_version);
daf7a3ce 259
eb0af526
N
260 fd = open_dev_excl(devnum);
261 if (fd < 0) {
262 fprintf(stderr, Name
263 ": failed to completely stop %s"
264 ": Device is busy\n",
265 devname);
266 return 1;
267 }
ada6c239
N
268 } else if (mdi &&
269 mdi->array.major_version == -1 &&
270 mdi->array.minor_version == -2 &&
3c558363 271 !is_subarray(mdi->text_version)) {
430ea469 272 struct mdstat_ent *mds, *m;
ada6c239
N
273 /* container, possibly mdmon-managed.
274 * Make sure mdmon isn't opening it, which
275 * would interfere with the 'stop'
276 */
277 ping_monitor(mdi->sys_name);
430ea469
N
278
279 /* now check that there are no existing arrays
280 * which are members of this array
281 */
282 mds = mdstat_read(0, 0);
283 for (m=mds; m; m=m->next)
284 if (m->metadata_version &&
285 strncmp(m->metadata_version, "external:", 9)==0 &&
286 is_subarray(m->metadata_version+9) &&
287 devname2devnum(m->metadata_version+10) == devnum) {
288 if (!quiet)
289 fprintf(stderr, Name
290 ": Cannot stop container %s: "
291 "member %s still active\n",
292 devname, m->dev);
293 free_mdstat(mds);
294 if (mdi)
295 sysfs_free(mdi);
296 return 1;
297 }
daf7a3ce 298 }
daf7a3ce 299
eb0af526
N
300 /* As we have an O_EXCL open, any use of the device
301 * which blocks STOP_ARRAY is probably a transient use,
302 * so it is reasonable to retry for a while - 5 seconds.
303 */
fb0d4b9c 304 count = 25; err = 0;
eb0af526
N
305 while (count && fd >= 0
306 && (err = ioctl(fd, STOP_ARRAY, NULL)) < 0
307 && errno == EBUSY) {
308 usleep(200000);
309 count --;
310 }
311 if (fd >= 0 && err) {
37ea3936 312 if (quiet == 0) {
daf7a3ce 313 fprintf(stderr, Name
4b9d39fc 314 ": failed to stop array %s: %s\n",
91f068bf 315 devname, strerror(errno));
d927f3c4
NB
316 if (errno == EBUSY)
317 fprintf(stderr, "Perhaps a running "
318 "process, mounted filesystem "
319 "or active volume group?\n");
320 }
97590376
N
321 if (mdi)
322 sysfs_free(mdi);
682c7051
NB
323 return 1;
324 }
97590376 325 /* prior to 2.6.28, KOBJ_CHANGE was not sent when an md array
d49410d3
N
326 * was stopped, so We'll do it here just to be sure. Drop any
327 * partitions as well...
97590376 328 */
d49410d3
N
329 if (fd >= 0)
330 ioctl(fd, BLKRRPART, 0);
97590376
N
331 if (mdi)
332 sysfs_uevent(mdi, "change");
daf7a3ce 333
4ccad7b1
N
334
335 if (devnum != NoMdDev &&
336 (stat("/dev/.udev", &stb) != 0 ||
337 check_env("MDADM_NO_UDEV"))) {
338 struct map_ent *mp = map_by_devnum(&map, devnum);
339 remove_devices(devnum, mp ? mp->path : NULL);
340 }
341
342
ab56093f
NB
343 if (quiet <= 0)
344 fprintf(stderr, Name ": stopped %s\n", devname);
4eb26970
DW
345 map_lock(&map);
346 map_remove(&map, devnum);
347 map_unlock(&map);
682c7051
NB
348 }
349 return 0;
64c4757e
NB
350}
351
dd0781e5
NB
352int Manage_resize(char *devname, int fd, long long size, int raid_disks)
353{
354 mdu_array_info_t info;
355 if (ioctl(fd, GET_ARRAY_INFO, &info) != 0) {
356 fprintf(stderr, Name ": Cannot get array information for %s: %s\n",
357 devname, strerror(errno));
358 return 1;
359 }
360 if (size >= 0)
361 info.size = size;
362 if (raid_disks > 0)
363 info.raid_disks = raid_disks;
364 if (ioctl(fd, SET_ARRAY_INFO, &info) != 0) {
365 fprintf(stderr, Name ": Cannot set device size/shape for %s: %s\n",
366 devname, strerror(errno));
367 return 1;
368 }
369 return 0;
b5e64645 370}
dd0781e5 371
64c4757e 372int Manage_subdevs(char *devname, int fd,
833bb0f8
N
373 struct mddev_dev *devlist, int verbose, int test,
374 char *update)
cd29a5c8 375{
682c7051
NB
376 /* do something to each dev.
377 * devmode can be
378 * 'a' - add the device
379 * try HOT_ADD_DISK
380 * If that fails EINVAL, try ADD_NEW_DISK
381 * 'r' - remove the device HOT_REMOVE_DISK
b80da661
NB
382 * device can be 'faulty' or 'detached' in which case all
383 * matching devices are removed.
682c7051 384 * 'f' - set the device faulty SET_DISK_FAULTY
b80da661
NB
385 * device can be 'detached' in which case any device that
386 * is inaccessible will be marked faulty.
98d27e39
N
387 * For 'f' and 'r', the device can also be a kernel-internal
388 * name such as 'sdb'.
682c7051 389 */
a655e550 390 struct mddev_dev *add_devlist = NULL;
682c7051
NB
391 mdu_array_info_t array;
392 mdu_disk_info_t disc;
7a3be72f 393 unsigned long long array_size;
a655e550 394 struct mddev_dev *dv, *next = NULL;
682c7051 395 struct stat stb;
b80da661 396 int j, jnext = 0;
cfad27a9 397 int tfd = -1;
3da92f27 398 struct supertype *st, *tst;
4725bc31 399 char *subarray = NULL;
fe80f49b
NB
400 int duuid[4];
401 int ouuid[4];
f94d52f4 402 int lfd = -1;
98d27e39 403 int sysfd = -1;
7d2e6486 404 int count = 0; /* number of actions taken */
682c7051
NB
405
406 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
407 fprintf(stderr, Name ": cannot get array info for %s\n",
408 devname);
409 return 1;
410 }
3da92f27 411
7a3be72f
NB
412 /* array.size is only 32 bit and may be truncated.
413 * So read from sysfs if possible, and record number of sectors
414 */
415
416 array_size = get_component_size(fd);
417 if (array_size <= 0)
418 array_size = array.size * 2;
419
4725bc31 420 tst = super_by_fd(fd, &subarray);
3da92f27
NB
421 if (!tst) {
422 fprintf(stderr, Name ": unsupport array - version %d.%d\n",
423 array.major_version, array.minor_version);
424 return 1;
425 }
426
b3b4e8a7 427 stb.st_rdev = 0;
b80da661 428 for (dv = devlist, j=0 ; dv; dv = next, j = jnext) {
4a39c6f2 429 unsigned long long ldsize;
b80da661
NB
430 char dvname[20];
431 char *dnprintable = dv->devname;
a4e13010 432 char *add_dev = dv->devname;
f94d52f4 433 int err;
8453e704 434 int re_add_failed = 0;
4a39c6f2 435
b80da661
NB
436 next = dv->next;
437 jnext = 0;
438
439 if (strcmp(dv->devname, "failed")==0 ||
440 strcmp(dv->devname, "faulty")==0) {
441 if (dv->disposition != 'r') {
442 fprintf(stderr, Name ": %s only meaningful "
443 "with -r, not -%c\n",
444 dv->devname, dv->disposition);
445 return 1;
446 }
447 for (; j < array.raid_disks + array.nr_disks ; j++) {
f21e18ca 448 unsigned dev;
b80da661
NB
449 disc.number = j;
450 if (ioctl(fd, GET_DISK_INFO, &disc))
451 continue;
452 if (disc.major == 0 && disc.minor == 0)
453 continue;
454 if ((disc.state & 1) == 0) /* faulty */
455 continue;
b3b4e8a7
N
456 dev = makedev(disc.major, disc.minor);
457 if (stb.st_rdev == dev)
458 /* already did that one */
459 continue;
460 stb.st_rdev = dev;
b80da661 461 next = dv;
b3b4e8a7
N
462 /* same slot again next time - things might
463 * have reshuffled */
464 jnext = j;
b80da661
NB
465 sprintf(dvname,"%d:%d", disc.major, disc.minor);
466 dnprintable = dvname;
467 break;
468 }
5b660791 469 if (next != dv)
b80da661
NB
470 continue;
471 } else if (strcmp(dv->devname, "detached") == 0) {
472 if (dv->disposition != 'r' && dv->disposition != 'f') {
473 fprintf(stderr, Name ": %s only meaningful "
474 "with -r of -f, not -%c\n",
475 dv->devname, dv->disposition);
476 return 1;
477 }
478 for (; j < array.raid_disks + array.nr_disks; j++) {
479 int sfd;
f21e18ca 480 unsigned dev;
b80da661
NB
481 disc.number = j;
482 if (ioctl(fd, GET_DISK_INFO, &disc))
483 continue;
484 if (disc.major == 0 && disc.minor == 0)
485 continue;
486 sprintf(dvname,"%d:%d", disc.major, disc.minor);
487 sfd = dev_open(dvname, O_RDONLY);
488 if (sfd >= 0) {
489 close(sfd);
490 continue;
491 }
492 if (dv->disposition == 'f' &&
493 (disc.state & 1) == 1) /* already faulty */
494 continue;
495 if (errno != ENXIO)
496 continue;
b3b4e8a7
N
497 dev = makedev(disc.major, disc.minor);
498 if (stb.st_rdev == dev)
499 /* already did that one */
500 continue;
501 stb.st_rdev = dev;
b80da661 502 next = dv;
b3b4e8a7
N
503 /* same slot again next time - things might
504 * have reshuffled */
505 jnext = j;
b80da661
NB
506 dnprintable = dvname;
507 break;
508 }
5b660791 509 if (next != dv)
b80da661 510 continue;
a4e13010
N
511 } else if (strcmp(dv->devname, "missing") == 0) {
512 if (dv->disposition != 'a' || dv->re_add == 0) {
513 fprintf(stderr, Name ": 'missing' only meaningful "
514 "with --re-add\n");
515 return 1;
516 }
517 if (add_devlist == NULL)
518 add_devlist = conf_get_devs();
519 if (add_devlist == NULL) {
520 fprintf(stderr, Name ": no devices to scan for missing members.");
521 continue;
522 }
523 add_dev = add_devlist->devname;
524 add_devlist = add_devlist->next;
525 if (add_devlist != NULL)
526 next = dv;
527 if (stat(add_dev, &stb) < 0)
528 continue;
98d27e39 529 } else if (strchr(dv->devname, '/') == NULL &&
93601c43 530 strchr(dv->devname, ':') == NULL &&
98d27e39
N
531 strlen(dv->devname) < 50) {
532 /* Assume this is a kernel-internal name like 'sda1' */
533 int found = 0;
534 char dname[55];
535 if (dv->disposition != 'r' && dv->disposition != 'f') {
536 fprintf(stderr, Name ": %s only meaningful "
cfad27a9 537 "with -r or -f, not -%c\n",
98d27e39
N
538 dv->devname, dv->disposition);
539 return 1;
540 }
541
542 sprintf(dname, "dev-%s", dv->devname);
543 sysfd = sysfs_open(fd2devnum(fd), dname, "block/dev");
544 if (sysfd >= 0) {
545 char dn[20];
546 int mj,mn;
547 if (sysfs_fd_get_str(sysfd, dn, 20) > 0 &&
548 sscanf(dn, "%d:%d", &mj,&mn) == 2) {
549 stb.st_rdev = makedev(mj,mn);
550 found = 1;
551 }
552 close(sysfd);
553 sysfd = -1;
554 }
555 if (!found) {
556 sysfd = sysfs_open(fd2devnum(fd), dname, "state");
557 if (sysfd < 0) {
558 fprintf(stderr, Name ": %s does not appear "
559 "to be a component of %s\n",
560 dv->devname, devname);
561 return 1;
562 }
563 }
b80da661
NB
564 } else {
565 j = 0;
566
c7b47447 567 tfd = dev_open(dv->devname, O_RDONLY);
5a9de8db
N
568 if (tfd < 0 && dv->disposition == 'r' &&
569 lstat(dv->devname, &stb) == 0)
570 /* Be happy, the lstat worked, that is
571 * enough for --remove
572 */
573 ;
574 else {
575 if (tfd < 0 || fstat(tfd, &stb) != 0) {
576 fprintf(stderr, Name ": cannot find %s: %s\n",
577 dv->devname, strerror(errno));
578 if (tfd >= 0)
579 close(tfd);
580 return 1;
581 }
582 close(tfd);
cfad27a9 583 tfd = -1;
b80da661
NB
584 }
585 if ((stb.st_mode & S_IFMT) != S_IFBLK) {
586 fprintf(stderr, Name ": %s is not a "
587 "block device.\n",
588 dv->devname);
589 return 1;
590 }
682c7051 591 }
cd29a5c8 592 switch(dv->disposition){
682c7051 593 default:
c913b90e
NB
594 fprintf(stderr, Name ": internal error - devmode[%s]=%d\n",
595 dv->devname, dv->disposition);
682c7051
NB
596 return 1;
597 case 'a':
4a39c6f2 598 /* add the device */
4725bc31 599 if (subarray) {
f7dd881f
DW
600 fprintf(stderr, Name ": Cannot add disks to a"
601 " \'member\' array, perform this"
602 " operation on the parent container\n");
603 return 1;
f94d52f4 604 }
f277ce36 605 /* Make sure it isn't in use (in 2.6 or later) */
a4e13010
N
606 tfd = dev_open(add_dev, O_RDONLY|O_EXCL|O_DIRECT);
607 if (tfd < 0 && add_dev != dv->devname)
608 continue;
0fbf459d 609 if (tfd < 0) {
d7eaf49f
NB
610 fprintf(stderr, Name ": Cannot open %s: %s\n",
611 dv->devname, strerror(errno));
612 return 1;
613 }
3da92f27 614
1686dc25 615 st = dup_super(tst);
3da92f27 616
fe80f49b 617 if (array.not_persistent==0)
3da92f27
NB
618 st->ss->load_super(st, tfd, NULL);
619
a4e13010
N
620 if (add_dev == dv->devname) {
621 if (!get_dev_size(tfd, dv->devname, &ldsize)) {
622 close(tfd);
623 return 1;
624 }
625 } else if (!get_dev_size(tfd, NULL, &ldsize)) {
4a39c6f2 626 close(tfd);
cfad27a9 627 tfd = -1;
a4e13010 628 continue;
4a39c6f2 629 }
f94d52f4
NB
630
631 if (!tst->ss->external &&
632 array.major_version == 0 &&
60d9a174 633 md_get_version(fd)%100 < 2) {
a4e13010 634 close(tfd);
cfad27a9 635 tfd = -1;
892debc8
NB
636 if (ioctl(fd, HOT_ADD_DISK,
637 (unsigned long)stb.st_rdev)==0) {
dab6685f
NB
638 if (verbose >= 0)
639 fprintf(stderr, Name ": hot added %s\n",
a4e13010 640 add_dev);
892debc8
NB
641 continue;
642 }
643
cd29a5c8 644 fprintf(stderr, Name ": hot add failed for %s: %s\n",
a4e13010 645 add_dev, strerror(errno));
cd29a5c8
NB
646 return 1;
647 }
892debc8 648
43dad3d6 649 if (array.not_persistent == 0 || tst->ss->external) {
4a39c6f2 650
fe80f49b 651 /* need to find a sample superblock to copy, and
43dad3d6
DW
652 * a spare slot to use.
653 * For 'external' array (well, container based),
654 * We can just load the metadata for the array.
fe80f49b 655 */
a4e13010
N
656 if (tst->sb)
657 /* already loaded */;
658 else if (tst->ss->external) {
0fb69d1d 659 tst->ss->load_container(tst, fd, NULL);
43dad3d6 660 } else for (j = 0; j < tst->max_devs; j++) {
fe80f49b
NB
661 char *dev;
662 int dfd;
663 disc.number = j;
664 if (ioctl(fd, GET_DISK_INFO, &disc))
665 continue;
666 if (disc.major==0 && disc.minor==0)
667 continue;
668 if ((disc.state & 4)==0) continue; /* sync */
669 /* Looks like a good device to try */
16c6fa80 670 dev = map_dev(disc.major, disc.minor, 1);
fe80f49b 671 if (!dev) continue;
16c6fa80 672 dfd = dev_open(dev, O_RDONLY);
fe80f49b 673 if (dfd < 0) continue;
3da92f27
NB
674 if (tst->ss->load_super(tst, dfd,
675 NULL)) {
fe80f49b
NB
676 close(dfd);
677 continue;
678 }
892debc8 679 close(dfd);
fe80f49b
NB
680 break;
681 }
43dad3d6 682 /* FIXME this is a bad test to be using */
3da92f27 683 if (!tst->sb) {
a4e13010 684 close(tfd);
0081eb00 685 fprintf(stderr, Name ": cannot load array metadata from %s\n", devname);
fe80f49b
NB
686 return 1;
687 }
2a528478
N
688
689 /* Make sure device is large enough */
690 if (tst->ss->avail_size(tst, ldsize/512) <
691 array_size) {
a4e13010 692 close(tfd);
cfad27a9 693 tfd = -1;
a4e13010
N
694 if (add_dev != dv->devname)
695 continue;
2a528478
N
696 fprintf(stderr, Name ": %s not large enough to join array\n",
697 dv->devname);
698 return 1;
699 }
700
fe80f49b
NB
701 /* Possibly this device was recently part of the array
702 * and was temporarily removed, and is now being re-added.
703 * If so, we can simply re-add it.
704 */
3da92f27 705 tst->ss->uuid_from_super(tst, duuid);
7eae7080 706
873eec46 707 if (st->sb) {
8453e704 708 struct mdinfo mdi;
a5d85af7 709 st->ss->getinfo_super(st, &mdi, NULL);
3da92f27 710 st->ss->uuid_from_super(st, ouuid);
8453e704
N
711 if ((mdi.disk.state & (1<<MD_DISK_ACTIVE)) &&
712 !(mdi.disk.state & (1<<MD_DISK_FAULTY)) &&
713 memcmp(duuid, ouuid, sizeof(ouuid))==0) {
714 /* look like it is worth a try. Need to
715 * make sure kernel will accept it though.
fe80f49b 716 */
873eec46
N
717 /* re-add doesn't work for version-1 superblocks
718 * before 2.6.18 :-(
719 */
720 if (array.major_version == 1 &&
721 get_linux_version() <= 2006018)
722 goto skip_re_add;
8453e704
N
723 disc.number = mdi.disk.number;
724 if (ioctl(fd, GET_DISK_INFO, &disc) != 0
725 || disc.major != 0 || disc.minor != 0
726 || !enough_fd(fd))
727 goto skip_re_add;
fe80f49b
NB
728 disc.major = major(stb.st_rdev);
729 disc.minor = minor(stb.st_rdev);
730 disc.number = mdi.disk.number;
731 disc.raid_disk = mdi.disk.raid_disk;
732 disc.state = mdi.disk.state;
b3d31955 733 if (dv->writemostly == 1)
4d20d744 734 disc.state |= 1 << MD_DISK_WRITEMOSTLY;
b3d31955
N
735 if (dv->writemostly == 2)
736 disc.state &= ~(1 << MD_DISK_WRITEMOSTLY);
a4e13010
N
737 remove_partitions(tfd);
738 close(tfd);
739 tfd = -1;
833bb0f8
N
740 if (update) {
741 int rv = -1;
742 tfd = dev_open(dv->devname, O_RDWR);
743
744 if (tfd >= 0)
745 rv = st->ss->update_super(
746 st, NULL, update,
747 devname, verbose, 0, NULL);
748 if (rv == 0)
c0f8269d 749 rv = st->ss->store_super(st, tfd);
833bb0f8
N
750 close(tfd);
751 tfd = -1;
752 if (rv != 0) {
753 fprintf(stderr, Name ": failed to update"
754 " superblock during re-add\n");
755 return 1;
756 }
757 }
5c64fcb5
N
758 /* don't even try if disk is marked as faulty */
759 errno = 0;
8453e704 760 if (ioctl(fd, ADD_NEW_DISK, &disc) == 0) {
fe80f49b 761 if (verbose >= 0)
a4e13010 762 fprintf(stderr, Name ": re-added %s\n", add_dev);
7d2e6486 763 count++;
308e1801 764 continue;
fe80f49b 765 }
c9f39c1b
N
766 if (errno == ENOMEM || errno == EROFS) {
767 fprintf(stderr, Name ": add new device failed for %s: %s\n",
a4e13010
N
768 add_dev, strerror(errno));
769 if (add_dev != dv->devname)
770 continue;
c9f39c1b
N
771 return 1;
772 }
8453e704
N
773 skip_re_add:
774 re_add_failed = 1;
fe80f49b 775 }
1cc7f4fe 776 st->ss->free_super(st);
892debc8 777 }
a4e13010
N
778 if (add_dev != dv->devname) {
779 if (verbose > 0)
780 fprintf(stderr, Name
781 ": --re-add for %s to %s is not possible\n",
782 add_dev, devname);
cfad27a9 783 if (tfd >= 0) {
a4e13010 784 close(tfd);
cfad27a9
DL
785 tfd = -1;
786 }
a4e13010
N
787 continue;
788 }
751fd6c0 789 if (dv->re_add) {
a4e13010
N
790 if (tfd >= 0)
791 close(tfd);
751fd6c0
N
792 fprintf(stderr, Name
793 ": --re-add for %s to %s is not possible\n",
794 dv->devname, devname);
795 return 1;
796 }
8453e704
N
797 if (re_add_failed) {
798 fprintf(stderr, Name ": %s reports being an active member for %s, but a --re-add fails.\n",
799 dv->devname, devname);
800 fprintf(stderr, Name ": not performing --add as that would convert %s in to a spare.\n",
801 dv->devname);
802 fprintf(stderr, Name ": To make this a spare, use \"mdadm --zero-superblock %s\" first.\n",
803 dv->devname);
804 if (tfd >= 0)
805 close(tfd);
806 return 1;
807 }
4a39c6f2
NB
808 } else {
809 /* non-persistent. Must ensure that new drive
810 * is at least array.size big.
811 */
7a3be72f 812 if (ldsize/512 < array_size) {
4a39c6f2
NB
813 fprintf(stderr, Name ": %s not large enough to join array\n",
814 dv->devname);
cfad27a9
DL
815 if (tfd >= 0)
816 close(tfd);
4a39c6f2
NB
817 return 1;
818 }
892debc8 819 }
a4e13010
N
820 /* committed to really trying this device now*/
821 if (tfd >= 0) {
822 remove_partitions(tfd);
823 close(tfd);
cfad27a9 824 tfd = -1;
a4e13010 825 }
7eae7080
NB
826 /* in 2.6.17 and earlier, version-1 superblocks won't
827 * use the number we write, but will choose a free number.
828 * we must choose the same free number, which requires
829 * starting at 'raid_disks' and counting up
830 */
3da92f27 831 for (j = array.raid_disks; j< tst->max_devs; j++) {
aa88f531 832 disc.number = j;
682c7051
NB
833 if (ioctl(fd, GET_DISK_INFO, &disc))
834 break;
835 if (disc.major==0 && disc.minor==0)
836 break;
837 if (disc.state & 8) /* removed */
838 break;
839 }
0df46c2a
NB
840 disc.major = major(stb.st_rdev);
841 disc.minor = minor(stb.st_rdev);
892debc8
NB
842 disc.number =j;
843 disc.state = 0;
02c39ab1 844 if (array.not_persistent==0) {
111d01fc 845 int dfd;
b3d31955 846 if (dv->writemostly == 1)
fe80f49b 847 disc.state |= 1 << MD_DISK_WRITEMOSTLY;
3b435195 848 dfd = dev_open(dv->devname, O_RDWR | O_EXCL|O_DIRECT);
f20c3968
DW
849 if (tst->ss->add_to_super(tst, &disc, dfd,
850 dv->devname)) {
f20c3968
DW
851 close(dfd);
852 return 1;
853 }
1cc7f4fe
N
854 if (tst->ss->write_init_super(tst)) {
855 close(dfd);
fe80f49b 856 return 1;
1cc7f4fe 857 }
fe80f49b
NB
858 } else if (dv->re_add) {
859 /* this had better be raid1.
860 * As we are "--re-add"ing we must find a spare slot
861 * to fill.
862 */
863 char *used = malloc(array.raid_disks);
864 memset(used, 0, array.raid_disks);
3da92f27 865 for (j=0; j< tst->max_devs; j++) {
fe80f49b
NB
866 mdu_disk_info_t disc2;
867 disc2.number = j;
868 if (ioctl(fd, GET_DISK_INFO, &disc2))
869 continue;
870 if (disc2.major==0 && disc2.minor==0)
871 continue;
872 if (disc2.state & 8) /* removed */
873 continue;
874 if (disc2.raid_disk < 0)
875 continue;
876 if (disc2.raid_disk > array.raid_disks)
877 continue;
878 used[disc2.raid_disk] = 1;
879 }
880 for (j=0 ; j<array.raid_disks; j++)
881 if (!used[j]) {
882 disc.raid_disk = j;
883 disc.state |= (1<<MD_DISK_SYNC);
884 break;
885 }
0eb26465 886 free(used);
fe80f49b 887 }
b3d31955 888 if (dv->writemostly == 1)
d8def61c 889 disc.state |= (1 << MD_DISK_WRITEMOSTLY);
43dad3d6 890 if (tst->ss->external) {
73cb8d43
AK
891 /* add a disk
892 * to an external metadata container */
43dad3d6
DW
893 struct mdinfo new_mdi;
894 struct mdinfo *sra;
895 int container_fd;
896 int devnum = fd2devnum(fd);
02c39ab1 897 int dfd;
43dad3d6
DW
898
899 container_fd = open_dev_excl(devnum);
900 if (container_fd < 0) {
901 fprintf(stderr, Name ": add failed for %s:"
902 " could not get exclusive access to container\n",
903 dv->devname);
562e70e4 904 tst->ss->free_super(tst);
43dad3d6
DW
905 return 1;
906 }
907
02c39ab1 908 dfd = dev_open(dv->devname, O_RDWR | O_EXCL|O_DIRECT);
d6221e66
N
909 if (mdmon_running(tst->container_dev))
910 tst->update_tail = &tst->updates;
02c39ab1
N
911 if (tst->ss->add_to_super(tst, &disc, dfd,
912 dv->devname)) {
913 close(dfd);
914 close(container_fd);
915 return 1;
916 }
c0f8269d
AK
917 if (tst->update_tail)
918 flush_metadata_updates(tst);
d6221e66 919 else
c0f8269d 920 tst->ss->sync_metadata(tst);
02c39ab1 921
43dad3d6
DW
922 sra = sysfs_read(container_fd, -1, 0);
923 if (!sra) {
924 fprintf(stderr, Name ": add failed for %s: sysfs_read failed\n",
925 dv->devname);
926 close(container_fd);
562e70e4 927 tst->ss->free_super(tst);
43dad3d6
DW
928 return 1;
929 }
930 sra->array.level = LEVEL_CONTAINER;
931 /* Need to set data_offset and component_size */
a5d85af7 932 tst->ss->getinfo_super(tst, &new_mdi, NULL);
43dad3d6
DW
933 new_mdi.disk.major = disc.major;
934 new_mdi.disk.minor = disc.minor;
d23534e4 935 new_mdi.recovery_start = 0;
1cc7f4fe
N
936 /* Make sure fds are closed as they are O_EXCL which
937 * would block add_disk */
938 tst->ss->free_super(tst);
462906cd 939 if (sysfs_add_disk(sra, &new_mdi, 0) != 0) {
43dad3d6
DW
940 fprintf(stderr, Name ": add new device to external metadata"
941 " failed for %s\n", dv->devname);
942 close(container_fd);
73cb8d43 943 sysfs_free(sra);
43dad3d6
DW
944 return 1;
945 }
983fff45 946 ping_monitor_by_id(devnum);
43dad3d6
DW
947 sysfs_free(sra);
948 close(container_fd);
562e70e4
N
949 } else {
950 tst->ss->free_super(tst);
951 if (ioctl(fd, ADD_NEW_DISK, &disc)) {
952 fprintf(stderr, Name ": add new device failed for %s as %d: %s\n",
953 dv->devname, j, strerror(errno));
954 return 1;
955 }
682c7051 956 }
dab6685f
NB
957 if (verbose >= 0)
958 fprintf(stderr, Name ": added %s\n", dv->devname);
682c7051
NB
959 break;
960
961 case 'r':
962 /* hot remove */
4725bc31 963 if (subarray) {
f7dd881f
DW
964 fprintf(stderr, Name ": Cannot remove disks from a"
965 " \'member\' array, perform this"
966 " operation on the parent container\n");
98d27e39
N
967 if (sysfd >= 0)
968 close(sysfd);
f7dd881f 969 return 1;
f94d52f4
NB
970 }
971 if (tst->ss->external) {
972 /* To remove a device from a container, we must
973 * check that it isn't in use in an array.
974 * This involves looking in the 'holders'
975 * directory - there must be just one entry,
976 * the container.
977 * To ensure that it doesn't get used as a
978 * hold spare while we are checking, we
979 * get an O_EXCL open on the container
980 */
981 int dnum = fd2devnum(fd);
982 lfd = open_dev_excl(dnum);
983 if (lfd < 0) {
984 fprintf(stderr, Name
985 ": Cannot get exclusive access "
986 " to container - odd\n");
98d27e39
N
987 if (sysfd >= 0)
988 close(sysfd);
f94d52f4
NB
989 return 1;
990 }
85f9b5f7
DW
991 /* in the detached case it is not possible to
992 * check if we are the unique holder, so just
993 * rely on the 'detached' checks
994 */
995 if (strcmp(dv->devname, "detached") == 0 ||
98d27e39 996 sysfd >= 0 ||
85f9b5f7
DW
997 sysfs_unique_holder(dnum, stb.st_rdev))
998 /* pass */;
999 else {
f94d52f4
NB
1000 fprintf(stderr, Name
1001 ": %s is %s, cannot remove.\n",
1002 dnprintable,
1003 errno == EEXIST ? "still in use":
1004 "not a member");
1005 close(lfd);
1006 return 1;
1007 }
1008 }
82b27616 1009 /* FIXME check that it is a current member */
98d27e39
N
1010 if (sysfd >= 0) {
1011 /* device has been removed and we don't know
1012 * the major:minor number
1013 */
1014 int n = write(sysfd, "remove", 6);
1015 if (n != 6)
f94d52f4 1016 err = -1;
98d27e39
N
1017 else
1018 err = 0;
1019 close(sysfd);
1020 sysfd = -1;
1021 } else {
1022 err = ioctl(fd, HOT_REMOVE_DISK, (unsigned long)stb.st_rdev);
1023 if (err && errno == ENODEV) {
1024 /* Old kernels rejected this if no personality
1025 * registered */
1026 struct mdinfo *sra = sysfs_read(fd, 0, GET_DEVS);
1027 struct mdinfo *dv = NULL;
1028 if (sra)
1029 dv = sra->devs;
1030 for ( ; dv ; dv=dv->next)
f21e18ca
N
1031 if (dv->disk.major == (int)major(stb.st_rdev) &&
1032 dv->disk.minor == (int)minor(stb.st_rdev))
98d27e39
N
1033 break;
1034 if (dv)
1035 err = sysfs_set_str(sra, dv,
1036 "state", "remove");
1037 else
1038 err = -1;
1039 if (sra)
1040 sysfs_free(sra);
1041 }
f94d52f4
NB
1042 }
1043 if (err) {
b80da661
NB
1044 fprintf(stderr, Name ": hot remove failed "
1045 "for %s: %s\n", dnprintable,
1046 strerror(errno));
f94d52f4
NB
1047 if (lfd >= 0)
1048 close(lfd);
682c7051
NB
1049 return 1;
1050 }
313a4a82
DW
1051 if (tst->ss->external) {
1052 /*
1053 * Before dropping our exclusive open we make an
1054 * attempt at preventing mdmon from seeing an
1055 * 'add' event before reconciling this 'remove'
1056 * event.
1057 */
1058 char *name = devnum2devname(fd2devnum(fd));
1059
1060 if (!name) {
1061 fprintf(stderr, Name ": unable to get container name\n");
1062 return 1;
1063 }
1064
1065 ping_manager(name);
1066 free(name);
1067 }
98d27e39
N
1068 if (lfd >= 0)
1069 close(lfd);
7d2e6486 1070 count++;
dab6685f 1071 if (verbose >= 0)
29ba4804
N
1072 fprintf(stderr, Name ": hot removed %s from %s\n",
1073 dnprintable, devname);
682c7051
NB
1074 break;
1075
1076 case 'f': /* set faulty */
1077 /* FIXME check current member */
98d27e39
N
1078 if ((sysfd >= 0 && write(sysfd, "faulty", 6) != 6) ||
1079 (sysfd < 0 && ioctl(fd, SET_DISK_FAULTY,
1080 (unsigned long) stb.st_rdev))) {
b83d95f3 1081 fprintf(stderr, Name ": set device faulty failed for %s: %s\n",
b80da661 1082 dnprintable, strerror(errno));
98d27e39
N
1083 if (sysfd >= 0)
1084 close(sysfd);
682c7051
NB
1085 return 1;
1086 }
98d27e39
N
1087 if (sysfd >= 0)
1088 close(sysfd);
1089 sysfd = -1;
7d2e6486 1090 count++;
dab6685f
NB
1091 if (verbose >= 0)
1092 fprintf(stderr, Name ": set %s faulty in %s\n",
b80da661 1093 dnprintable, devname);
682c7051
NB
1094 break;
1095 }
1096 }
7d2e6486
N
1097 if (test && count == 0)
1098 return 2;
682c7051 1099 return 0;
64c4757e 1100}
1f48664b
NB
1101
1102int autodetect(void)
1103{
1104 /* Open any md device, and issue the RAID_AUTORUN ioctl */
1105 int rv = 1;
1106 int fd = dev_open("9:0", O_RDONLY);
1107 if (fd >= 0) {
1108 if (ioctl(fd, RAID_AUTORUN, 0) == 0)
1109 rv = 0;
1110 close(fd);
1111 }
1112 return rv;
1113}
aa534678 1114
fa56eddb 1115int Update_subarray(char *dev, char *subarray, char *update, struct mddev_ident *ident, int quiet)
aa534678
DW
1116{
1117 struct supertype supertype, *st = &supertype;
1118 int fd, rv = 2;
1119
1120 memset(st, 0, sizeof(*st));
aa534678 1121
feab51f8 1122 fd = open_subarray(dev, subarray, st, quiet);
aa534678
DW
1123 if (fd < 0)
1124 return 2;
1125
1126 if (!st->ss->update_subarray) {
1127 if (!quiet)
1128 fprintf(stderr,
1129 Name ": Operation not supported for %s metadata\n",
1130 st->ss->name);
1131 goto free_super;
1132 }
1133
1134 if (mdmon_running(st->devnum))
1135 st->update_tail = &st->updates;
1136
a951a4f7 1137 rv = st->ss->update_subarray(st, subarray, update, ident);
aa534678
DW
1138
1139 if (rv) {
1140 if (!quiet)
1141 fprintf(stderr, Name ": Failed to update %s of subarray-%s in %s\n",
1142 update, subarray, dev);
1143 } else if (st->update_tail)
1144 flush_metadata_updates(st);
1145 else
1146 st->ss->sync_metadata(st);
1147
1148 if (rv == 0 && strcmp(update, "name") == 0 && !quiet)
1149 fprintf(stderr,
1150 Name ": Updated subarray-%s name from %s, UUIDs may have changed\n",
1151 subarray, dev);
1152
1153 free_super:
1154 st->ss->free_super(st);
1155 close(fd);
1156
1157 return rv;
1158}
d52bb542
AC
1159
1160/* Move spare from one array to another
1161 * If adding to destination array fails
1162 * add back to original array
1163 * Returns 1 on success, 0 on failure */
1164int move_spare(char *from_devname, char *to_devname, dev_t devid)
1165{
1166 struct mddev_dev devlist;
1167 char devname[20];
1168
1169 /* try to remove and add */
1170 int fd1 = open(to_devname, O_RDONLY);
1171 int fd2 = open(from_devname, O_RDONLY);
1172
1173 if (fd1 < 0 || fd2 < 0) {
1174 if (fd1>=0) close(fd1);
1175 if (fd2>=0) close(fd2);
1176 return 0;
1177 }
1178
1179 devlist.next = NULL;
1180 devlist.used = 0;
1181 devlist.re_add = 0;
1182 devlist.writemostly = 0;
1183 devlist.devname = devname;
1184 sprintf(devname, "%d:%d", major(devid), minor(devid));
1185
1186 devlist.disposition = 'r';
1187 if (Manage_subdevs(from_devname, fd2, &devlist, -1, 0, NULL) == 0) {
1188 devlist.disposition = 'a';
1189 if (Manage_subdevs(to_devname, fd1, &devlist, -1, 0, NULL) == 0) {
1190 /* make sure manager is aware of changes */
1191 ping_manager(to_devname);
1192 ping_manager(from_devname);
1193 close(fd1);
1194 close(fd2);
1195 return 1;
1196 }
1197 else Manage_subdevs(from_devname, fd2, &devlist, -1, 0, NULL);
1198 }
1199 close(fd1);
1200 close(fd2);
1201 return 0;
1202}
435d4ebb 1203#endif