]>
git.ipfire.org Git - thirdparty/mdadm.git/blob - Manage.c
2 * mdadm - manage Linux "md" devices aka RAID arrays.
4 * Copyright (C) 2001-2006 Neil Brown <neilb@suse.de>
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
22 * Email: <neilb@cse.unsw.edu.au>
24 * School of Computer Science and Engineering
25 * The University of New South Wales
34 #define REGISTER_DEV _IO (MD_MAJOR, 1)
35 #define START_MD _IO (MD_MAJOR, 2)
36 #define STOP_MD _IO (MD_MAJOR, 3)
38 int Manage_ro(char *devname
, int fd
, int readonly
)
40 /* switch to readonly or rw
43 * first check that array is runing
44 * use RESTART_ARRAY_RW or STOP_ARRAY_RO
47 mdu_array_info_t array
;
49 if (md_get_version(fd
) < 9000) {
50 fprintf(stderr
, Name
": need md driver version 0.90.0 or later\n");
53 if (ioctl(fd
, GET_ARRAY_INFO
, &array
)) {
54 fprintf(stderr
, Name
": %s does not appear to be active.\n",
60 if (ioctl(fd
, STOP_ARRAY_RO
, NULL
)) {
61 fprintf(stderr
, Name
": failed to set readonly for %s: %s\n",
62 devname
, strerror(errno
));
65 } else if (readonly
< 0) {
66 if (ioctl(fd
, RESTART_ARRAY_RW
, NULL
)) {
67 fprintf(stderr
, Name
": failed to set writable for %s: %s\n",
68 devname
, strerror(errno
));
77 int Manage_runstop(char *devname
, int fd
, int runstop
, int quiet
)
79 /* Run or stop the array. array must already be configured
81 * Only print failure messages if quiet == 0;
82 * quiet > 0 means really be quiet
83 * quiet < 0 means we will try again if it fails.
85 mdu_param_t param
; /* unused */
87 if (runstop
== -1 && md_get_version(fd
) < 9000) {
88 if (ioctl(fd
, STOP_MD
, 0)) {
89 if (quiet
== 0) fprintf(stderr
,
90 Name
": stopping device %s "
92 devname
, strerror(errno
));
97 if (md_get_version(fd
) < 9000) {
98 fprintf(stderr
, Name
": need md driver version 0.90.0 or later\n");
102 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
103 fprintf(stderr, Name ": %s does not appear to be active.\n",
109 if (ioctl(fd
, RUN_ARRAY
, ¶m
)) {
110 fprintf(stderr
, Name
": failed to run array %s: %s\n",
111 devname
, strerror(errno
));
115 fprintf(stderr
, Name
": started %s\n", devname
);
116 } else if (runstop
< 0){
117 struct map_ent
*map
= NULL
;
120 /* If this is an mdmon managed array, just write 'inactive'
121 * to the array state and let mdmon clear up.
123 mdi
= sysfs_read(fd
, -1, GET_LEVEL
|GET_VERSION
);
125 mdi
->array
.level
> 0 &&
126 is_subarray(mdi
->text_version
)) {
129 /* This is mdmon managed. */
131 if (sysfs_set_str(mdi
, NULL
,
132 "array_state", "inactive") < 0) {
135 ": failed to stop array %s: %s\n",
136 devname
, strerror(errno
));
140 /* Give monitor a chance to act */
141 cp
= strchr(mdi
->text_version
+1, '/');
144 ping_monitor(mdi
->text_version
+1);
146 fd
= open(devname
, O_RDONLY
);
148 mdi
->array
.major_version
== -1 &&
149 mdi
->array
.minor_version
== -2 &&
150 !is_subarray(mdi
->text_version
)) {
151 /* container, possibly mdmon-managed.
152 * Make sure mdmon isn't opening it, which
153 * would interfere with the 'stop'
155 ping_monitor(mdi
->sys_name
);
160 if (fd
>= 0 && ioctl(fd
, STOP_ARRAY
, NULL
)) {
163 ": failed to stop array %s: %s\n",
164 devname
, strerror(errno
));
166 fprintf(stderr
, "Perhaps a running "
167 "process, mounted filesystem "
168 "or active volume group?\n");
174 fprintf(stderr
, Name
": stopped %s\n", devname
);
175 if (fd
>= 0 && fstat(fd
, &stb
) == 0) {
177 if (major(stb
.st_rdev
) == MD_MAJOR
)
178 devnum
= minor(stb
.st_rdev
);
180 devnum
= -1-(minor(stb
.st_rdev
)>>6);
181 map_delete(&map
, devnum
);
189 int Manage_resize(char *devname
, int fd
, long long size
, int raid_disks
)
191 mdu_array_info_t info
;
192 if (ioctl(fd
, GET_ARRAY_INFO
, &info
) != 0) {
193 fprintf(stderr
, Name
": Cannot get array information for %s: %s\n",
194 devname
, strerror(errno
));
200 info
.raid_disks
= raid_disks
;
201 if (ioctl(fd
, SET_ARRAY_INFO
, &info
) != 0) {
202 fprintf(stderr
, Name
": Cannot set device size/shape for %s: %s\n",
203 devname
, strerror(errno
));
209 int Manage_reconfig(char *devname
, int fd
, int layout
)
211 mdu_array_info_t info
;
212 if (ioctl(fd
, GET_ARRAY_INFO
, &info
) != 0) {
213 fprintf(stderr
, Name
": Cannot get array information for %s: %s\n",
214 devname
, strerror(errno
));
217 info
.layout
= layout
;
218 printf("layout set to %d\n", info
.layout
);
219 if (ioctl(fd
, SET_ARRAY_INFO
, &info
) != 0) {
220 fprintf(stderr
, Name
": Cannot set layout for %s: %s\n",
221 devname
, strerror(errno
));
227 int Manage_subdevs(char *devname
, int fd
,
228 mddev_dev_t devlist
, int verbose
)
230 /* do something to each dev.
232 * 'a' - add the device
234 * If that fails EINVAL, try ADD_NEW_DISK
235 * 'r' - remove the device HOT_REMOVE_DISK
236 * device can be 'faulty' or 'detached' in which case all
237 * matching devices are removed.
238 * 'f' - set the device faulty SET_DISK_FAULTY
239 * device can be 'detached' in which case any device that
240 * is inaccessible will be marked faulty.
242 mdu_array_info_t array
;
243 mdu_disk_info_t disc
;
244 unsigned long long array_size
;
245 mddev_dev_t dv
, next
= NULL
;
249 struct supertype
*st
, *tst
;
254 if (ioctl(fd
, GET_ARRAY_INFO
, &array
)) {
255 fprintf(stderr
, Name
": cannot get array info for %s\n",
260 /* array.size is only 32 bit and may be truncated.
261 * So read from sysfs if possible, and record number of sectors
264 array_size
= get_component_size(fd
);
266 array_size
= array
.size
* 2;
268 tst
= super_by_fd(fd
);
270 fprintf(stderr
, Name
": unsupport array - version %d.%d\n",
271 array
.major_version
, array
.minor_version
);
275 for (dv
= devlist
, j
=0 ; dv
; dv
= next
, j
= jnext
) {
276 unsigned long long ldsize
;
278 char *dnprintable
= dv
->devname
;
284 if (strcmp(dv
->devname
, "failed")==0 ||
285 strcmp(dv
->devname
, "faulty")==0) {
286 if (dv
->disposition
!= 'r') {
287 fprintf(stderr
, Name
": %s only meaningful "
288 "with -r, not -%c\n",
289 dv
->devname
, dv
->disposition
);
292 for (; j
< array
.raid_disks
+ array
.nr_disks
; j
++) {
294 if (ioctl(fd
, GET_DISK_INFO
, &disc
))
296 if (disc
.major
== 0 && disc
.minor
== 0)
298 if ((disc
.state
& 1) == 0) /* faulty */
300 stb
.st_rdev
= makedev(disc
.major
, disc
.minor
);
303 sprintf(dvname
,"%d:%d", disc
.major
, disc
.minor
);
304 dnprintable
= dvname
;
309 } else if (strcmp(dv
->devname
, "detached") == 0) {
310 if (dv
->disposition
!= 'r' && dv
->disposition
!= 'f') {
311 fprintf(stderr
, Name
": %s only meaningful "
312 "with -r of -f, not -%c\n",
313 dv
->devname
, dv
->disposition
);
316 for (; j
< array
.raid_disks
+ array
.nr_disks
; j
++) {
319 if (ioctl(fd
, GET_DISK_INFO
, &disc
))
321 if (disc
.major
== 0 && disc
.minor
== 0)
323 sprintf(dvname
,"%d:%d", disc
.major
, disc
.minor
);
324 sfd
= dev_open(dvname
, O_RDONLY
);
329 if (dv
->disposition
== 'f' &&
330 (disc
.state
& 1) == 1) /* already faulty */
334 stb
.st_rdev
= makedev(disc
.major
, disc
.minor
);
337 dnprintable
= dvname
;
345 if (stat(dv
->devname
, &stb
)) {
346 fprintf(stderr
, Name
": cannot find %s: %s\n",
347 dv
->devname
, strerror(errno
));
350 if ((stb
.st_mode
& S_IFMT
) != S_IFBLK
) {
351 fprintf(stderr
, Name
": %s is not a "
357 switch(dv
->disposition
){
359 fprintf(stderr
, Name
": internal error - devmode[%s]=%d\n",
360 dv
->devname
, dv
->disposition
);
364 if (tst
->subarray
[0]) {
365 fprintf(stderr
, Name
": Cannot add disks to a"
366 " \'member\' array, perform this"
367 " operation on the parent container\n");
370 /* Make sure it isn't in use (in 2.6 or later) */
371 tfd
= open(dv
->devname
, O_RDONLY
|O_EXCL
|O_DIRECT
);
373 fprintf(stderr
, Name
": Cannot open %s: %s\n",
374 dv
->devname
, strerror(errno
));
377 remove_partitions(tfd
);
381 if (array
.not_persistent
==0)
382 st
->ss
->load_super(st
, tfd
, NULL
);
384 if (!get_dev_size(tfd
, dv
->devname
, &ldsize
)) {
391 if (!tst
->ss
->external
&&
392 array
.major_version
== 0 &&
393 md_get_version(fd
)%100 < 2) {
394 if (ioctl(fd
, HOT_ADD_DISK
,
395 (unsigned long)stb
.st_rdev
)==0) {
397 fprintf(stderr
, Name
": hot added %s\n",
402 fprintf(stderr
, Name
": hot add failed for %s: %s\n",
403 dv
->devname
, strerror(errno
));
407 if (array
.not_persistent
== 0 || tst
->ss
->external
) {
408 /* Make sure device is large enough */
409 if (tst
->ss
->avail_size(tst
, ldsize
/512) <
411 fprintf(stderr
, Name
": %s not large enough to join array\n",
416 /* need to find a sample superblock to copy, and
417 * a spare slot to use.
418 * For 'external' array (well, container based),
419 * We can just load the metadata for the array.
421 if (tst
->ss
->external
) {
422 tst
->ss
->load_super(tst
, fd
, NULL
);
423 } else for (j
= 0; j
< tst
->max_devs
; j
++) {
427 if (ioctl(fd
, GET_DISK_INFO
, &disc
))
429 if (disc
.major
==0 && disc
.minor
==0)
431 if ((disc
.state
& 4)==0) continue; /* sync */
432 /* Looks like a good device to try */
433 dev
= map_dev(disc
.major
, disc
.minor
, 1);
435 dfd
= dev_open(dev
, O_RDONLY
);
436 if (dfd
< 0) continue;
437 if (tst
->ss
->load_super(tst
, dfd
,
445 /* FIXME this is a bad test to be using */
447 fprintf(stderr
, Name
": cannot find valid superblock in this array - HELP\n");
450 /* Possibly this device was recently part of the array
451 * and was temporarily removed, and is now being re-added.
452 * If so, we can simply re-add it.
454 tst
->ss
->uuid_from_super(tst
, duuid
);
456 /* re-add doesn't work for version-1 superblocks
459 if (array
.major_version
== 1 &&
460 get_linux_version() <= 2006018)
463 st
->ss
->uuid_from_super(st
, ouuid
);
464 if (memcmp(duuid
, ouuid
, sizeof(ouuid
))==0) {
465 /* looks close enough for now. Kernel
466 * will worry about whether a bitmap
467 * based reconstruction is possible.
470 st
->ss
->getinfo_super(st
, &mdi
);
471 disc
.major
= major(stb
.st_rdev
);
472 disc
.minor
= minor(stb
.st_rdev
);
473 disc
.number
= mdi
.disk
.number
;
474 disc
.raid_disk
= mdi
.disk
.raid_disk
;
475 disc
.state
= mdi
.disk
.state
;
477 disc
.state
|= 1 << MD_DISK_WRITEMOSTLY
;
478 if (ioctl(fd
, ADD_NEW_DISK
, &disc
) == 0) {
480 fprintf(stderr
, Name
": re-added %s\n", dv
->devname
);
483 /* fall back on normal-add */
487 /* non-persistent. Must ensure that new drive
488 * is at least array.size big.
490 if (ldsize
/512 < array_size
) {
491 fprintf(stderr
, Name
": %s not large enough to join array\n",
496 /* in 2.6.17 and earlier, version-1 superblocks won't
497 * use the number we write, but will choose a free number.
498 * we must choose the same free number, which requires
499 * starting at 'raid_disks' and counting up
501 for (j
= array
.raid_disks
; j
< tst
->max_devs
; j
++) {
503 if (ioctl(fd
, GET_DISK_INFO
, &disc
))
505 if (disc
.major
==0 && disc
.minor
==0)
507 if (disc
.state
& 8) /* removed */
510 disc
.major
= major(stb
.st_rdev
);
511 disc
.minor
= minor(stb
.st_rdev
);
514 if (array
.not_persistent
==0 || tst
->ss
->external
) {
517 disc
.state
|= 1 << MD_DISK_WRITEMOSTLY
;
518 dfd
= open(dv
->devname
, O_RDWR
| O_EXCL
|O_DIRECT
);
519 tst
->ss
->add_to_super(tst
, &disc
, dfd
,
521 /* write_init_super will close 'dfd' */
522 if (tst
->ss
->external
)
523 /* mdmon will write the metadata */
525 else if (tst
->ss
->write_init_super(tst
))
527 } else if (dv
->re_add
) {
528 /* this had better be raid1.
529 * As we are "--re-add"ing we must find a spare slot
532 char *used
= malloc(array
.raid_disks
);
533 memset(used
, 0, array
.raid_disks
);
534 for (j
=0; j
< tst
->max_devs
; j
++) {
535 mdu_disk_info_t disc2
;
537 if (ioctl(fd
, GET_DISK_INFO
, &disc2
))
539 if (disc2
.major
==0 && disc2
.minor
==0)
541 if (disc2
.state
& 8) /* removed */
543 if (disc2
.raid_disk
< 0)
545 if (disc2
.raid_disk
> array
.raid_disks
)
547 used
[disc2
.raid_disk
] = 1;
549 for (j
=0 ; j
<array
.raid_disks
; j
++)
552 disc
.state
|= (1<<MD_DISK_SYNC
);
557 disc
.state
|= (1 << MD_DISK_WRITEMOSTLY
);
558 if (tst
->ss
->external
) {
559 /* add a disk to an external metadata container
560 * only if mdmon is around to see it
562 struct mdinfo new_mdi
;
565 int devnum
= fd2devnum(fd
);
567 container_fd
= open_dev_excl(devnum
);
568 if (container_fd
< 0) {
569 fprintf(stderr
, Name
": add failed for %s:"
570 " could not get exclusive access to container\n",
575 if (!mdmon_running(devnum
)) {
576 fprintf(stderr
, Name
": add failed for %s: mdmon not running\n",
582 sra
= sysfs_read(container_fd
, -1, 0);
584 fprintf(stderr
, Name
": add failed for %s: sysfs_read failed\n",
589 sra
->array
.level
= LEVEL_CONTAINER
;
590 /* Need to set data_offset and component_size */
591 tst
->ss
->getinfo_super(tst
, &new_mdi
);
592 new_mdi
.disk
.major
= disc
.major
;
593 new_mdi
.disk
.minor
= disc
.minor
;
594 if (sysfs_add_disk(sra
, &new_mdi
) != 0) {
595 fprintf(stderr
, Name
": add new device to external metadata"
596 " failed for %s\n", dv
->devname
);
600 ping_monitor(devnum2devname(devnum
));
603 } else if (ioctl(fd
, ADD_NEW_DISK
, &disc
)) {
604 fprintf(stderr
, Name
": add new device failed for %s as %d: %s\n",
605 dv
->devname
, j
, strerror(errno
));
609 fprintf(stderr
, Name
": added %s\n", dv
->devname
);
614 if (tst
->subarray
[0]) {
615 fprintf(stderr
, Name
": Cannot remove disks from a"
616 " \'member\' array, perform this"
617 " operation on the parent container\n");
620 if (tst
->ss
->external
) {
621 /* To remove a device from a container, we must
622 * check that it isn't in use in an array.
623 * This involves looking in the 'holders'
624 * directory - there must be just one entry,
626 * To ensure that it doesn't get used as a
627 * hold spare while we are checking, we
628 * get an O_EXCL open on the container
630 int dnum
= fd2devnum(fd
);
631 lfd
= open_dev_excl(dnum
);
634 ": Cannot get exclusive access "
635 " to container - odd\n");
638 if (!sysfs_unique_holder(dnum
, stb
.st_rdev
)) {
640 ": %s is %s, cannot remove.\n",
642 errno
== EEXIST
? "still in use":
648 /* FIXME check that it is a current member */
649 err
= ioctl(fd
, HOT_REMOVE_DISK
, (unsigned long)stb
.st_rdev
);
650 if (err
&& errno
== ENODEV
) {
651 /* Old kernels rejected this if no personality
653 struct mdinfo
*sra
= sysfs_read(fd
, 0, GET_DEVS
);
654 struct mdinfo
*dv
= NULL
;
657 for ( ; dv
; dv
=dv
->next
)
658 if (dv
->disk
.major
== major(stb
.st_rdev
) &&
659 dv
->disk
.minor
== minor(stb
.st_rdev
))
662 err
= sysfs_set_str(sra
, dv
,
670 fprintf(stderr
, Name
": hot remove failed "
671 "for %s: %s\n", dnprintable
,
679 fprintf(stderr
, Name
": hot removed %s\n",
683 case 'f': /* set faulty */
684 /* FIXME check current member */
685 if (ioctl(fd
, SET_DISK_FAULTY
, (unsigned long) stb
.st_rdev
)) {
686 fprintf(stderr
, Name
": set device faulty failed for %s: %s\n",
687 dnprintable
, strerror(errno
));
691 fprintf(stderr
, Name
": set %s faulty in %s\n",
692 dnprintable
, devname
);
702 /* Open any md device, and issue the RAID_AUTORUN ioctl */
704 int fd
= dev_open("9:0", O_RDONLY
);
706 if (ioctl(fd
, RAID_AUTORUN
, 0) == 0)