]> git.ipfire.org Git - thirdparty/mdadm.git/blob - Manage.c
imsm: trim some memory wastage
[thirdparty/mdadm.git] / Manage.c
1 /*
2 * mdadm - manage Linux "md" devices aka RAID arrays.
3 *
4 * Copyright (C) 2001-2006 Neil Brown <neilb@suse.de>
5 *
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
11 *
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 *
21 * Author: Neil Brown
22 * Email: <neilb@cse.unsw.edu.au>
23 * Paper: Neil Brown
24 * School of Computer Science and Engineering
25 * The University of New South Wales
26 * Sydney, 2052
27 * Australia
28 */
29
30 #include "mdadm.h"
31 #include "md_u.h"
32 #include "md_p.h"
33
34 #define REGISTER_DEV _IO (MD_MAJOR, 1)
35 #define START_MD _IO (MD_MAJOR, 2)
36 #define STOP_MD _IO (MD_MAJOR, 3)
37
38 int Manage_ro(char *devname, int fd, int readonly)
39 {
40 /* switch to readonly or rw
41 *
42 * requires >= 0.90.0
43 * first check that array is runing
44 * use RESTART_ARRAY_RW or STOP_ARRAY_RO
45 *
46 */
47 mdu_array_info_t array;
48
49 if (md_get_version(fd) < 9000) {
50 fprintf(stderr, Name ": need md driver version 0.90.0 or later\n");
51 return 1;
52 }
53 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
54 fprintf(stderr, Name ": %s does not appear to be active.\n",
55 devname);
56 return 1;
57 }
58
59 if (readonly>0) {
60 if (ioctl(fd, STOP_ARRAY_RO, NULL)) {
61 fprintf(stderr, Name ": failed to set readonly for %s: %s\n",
62 devname, strerror(errno));
63 return 1;
64 }
65 } else if (readonly < 0) {
66 if (ioctl(fd, RESTART_ARRAY_RW, NULL)) {
67 fprintf(stderr, Name ": failed to set writable for %s: %s\n",
68 devname, strerror(errno));
69 return 1;
70 }
71 }
72 return 0;
73 }
74
75 #ifndef MDASSEMBLE
76
77 int Manage_runstop(char *devname, int fd, int runstop, int quiet)
78 {
79 /* Run or stop the array. array must already be configured
80 * required >= 0.90.0
81 * Only print failure messages if quiet == 0;
82 * quiet > 0 means really be quiet
83 * quiet < 0 means we will try again if it fails.
84 */
85 mdu_param_t param; /* unused */
86
87 if (runstop == -1 && md_get_version(fd) < 9000) {
88 if (ioctl(fd, STOP_MD, 0)) {
89 if (quiet == 0) fprintf(stderr,
90 Name ": stopping device %s "
91 "failed: %s\n",
92 devname, strerror(errno));
93 return 1;
94 }
95 }
96
97 if (md_get_version(fd) < 9000) {
98 fprintf(stderr, Name ": need md driver version 0.90.0 or later\n");
99 return 1;
100 }
101 /*
102 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
103 fprintf(stderr, Name ": %s does not appear to be active.\n",
104 devname);
105 return 1;
106 }
107 */
108 if (runstop>0) {
109 if (ioctl(fd, RUN_ARRAY, &param)) {
110 fprintf(stderr, Name ": failed to run array %s: %s\n",
111 devname, strerror(errno));
112 return 1;
113 }
114 if (quiet <= 0)
115 fprintf(stderr, Name ": started %s\n", devname);
116 } else if (runstop < 0){
117 struct map_ent *map = NULL;
118 struct stat stb;
119 struct mdinfo *mdi;
120 /* If this is an mdmon managed array, just write 'inactive'
121 * to the array state and let mdmon clear up.
122 */
123 mdi = sysfs_read(fd, -1, GET_LEVEL|GET_VERSION);
124 if (mdi &&
125 mdi->array.level > 0 &&
126 mdi->text_version[0] == '/') {
127 char *cp;
128
129 /* This is mdmon managed. */
130 close(fd);
131 if (sysfs_set_str(mdi, NULL,
132 "array_state", "inactive") < 0) {
133 if (quiet == 0)
134 fprintf(stderr, Name
135 ": failed to stop array %s: %s\n",
136 devname, strerror(errno));
137 return 1;
138 }
139
140 /* Give monitor a chance to act */
141 cp = strchr(mdi->text_version+1, '/');
142 if (*cp)
143 *cp = 0;
144 ping_monitor(mdi->text_version+1);
145
146 fd = open(devname, O_RDONLY);
147 } else if (mdi &&
148 mdi->array.major_version == -1 &&
149 mdi->array.minor_version == -2 &&
150 mdi->text_version[0] != '/') {
151 /* container, possibly mdmon-managed.
152 * Make sure mdmon isn't opening it, which
153 * would interfere with the 'stop'
154 */
155 ping_monitor(mdi->sys_name);
156 }
157 if (mdi)
158 sysfs_free(mdi);
159
160 if (fd >= 0 && ioctl(fd, STOP_ARRAY, NULL)) {
161 if (quiet == 0)
162 fprintf(stderr, Name
163 ": failed to stop array %s: %s\n",
164 devname, strerror(errno));
165 return 1;
166 }
167
168 if (quiet <= 0)
169 fprintf(stderr, Name ": stopped %s\n", devname);
170 if (fd >= 0 && fstat(fd, &stb) == 0) {
171 int devnum;
172 if (major(stb.st_rdev) == MD_MAJOR)
173 devnum = minor(stb.st_rdev);
174 else
175 devnum = -1-(minor(stb.st_rdev)>>6);
176 map_delete(&map, devnum);
177 map_write(map);
178 map_free(map);
179 }
180 }
181 return 0;
182 }
183
184 int Manage_resize(char *devname, int fd, long long size, int raid_disks)
185 {
186 mdu_array_info_t info;
187 if (ioctl(fd, GET_ARRAY_INFO, &info) != 0) {
188 fprintf(stderr, Name ": Cannot get array information for %s: %s\n",
189 devname, strerror(errno));
190 return 1;
191 }
192 if (size >= 0)
193 info.size = size;
194 if (raid_disks > 0)
195 info.raid_disks = raid_disks;
196 if (ioctl(fd, SET_ARRAY_INFO, &info) != 0) {
197 fprintf(stderr, Name ": Cannot set device size/shape for %s: %s\n",
198 devname, strerror(errno));
199 return 1;
200 }
201 return 0;
202 }
203
204 int Manage_reconfig(char *devname, int fd, int layout)
205 {
206 mdu_array_info_t info;
207 if (ioctl(fd, GET_ARRAY_INFO, &info) != 0) {
208 fprintf(stderr, Name ": Cannot get array information for %s: %s\n",
209 devname, strerror(errno));
210 return 1;
211 }
212 info.layout = layout;
213 printf("layout set to %d\n", info.layout);
214 if (ioctl(fd, SET_ARRAY_INFO, &info) != 0) {
215 fprintf(stderr, Name ": Cannot set layout for %s: %s\n",
216 devname, strerror(errno));
217 return 1;
218 }
219 return 0;
220 }
221
222 int Manage_subdevs(char *devname, int fd,
223 mddev_dev_t devlist, int verbose)
224 {
225 /* do something to each dev.
226 * devmode can be
227 * 'a' - add the device
228 * try HOT_ADD_DISK
229 * If that fails EINVAL, try ADD_NEW_DISK
230 * 'r' - remove the device HOT_REMOVE_DISK
231 * device can be 'faulty' or 'detached' in which case all
232 * matching devices are removed.
233 * 'f' - set the device faulty SET_DISK_FAULTY
234 * device can be 'detached' in which case any device that
235 * is inaccessible will be marked faulty.
236 */
237 mdu_array_info_t array;
238 mdu_disk_info_t disc;
239 unsigned long long array_size;
240 mddev_dev_t dv, next = NULL;
241 struct stat stb;
242 int j, jnext = 0;
243 int tfd;
244 struct supertype *st, *tst;
245 int duuid[4];
246 int ouuid[4];
247 int lfd = -1;
248
249 if (ioctl(fd, GET_ARRAY_INFO, &array)) {
250 fprintf(stderr, Name ": cannot get array info for %s\n",
251 devname);
252 return 1;
253 }
254
255 /* array.size is only 32 bit and may be truncated.
256 * So read from sysfs if possible, and record number of sectors
257 */
258
259 array_size = get_component_size(fd);
260 if (array_size <= 0)
261 array_size = array.size * 2;
262
263 tst = super_by_fd(fd);
264 if (!tst) {
265 fprintf(stderr, Name ": unsupport array - version %d.%d\n",
266 array.major_version, array.minor_version);
267 return 1;
268 }
269
270 for (dv = devlist, j=0 ; dv; dv = next, j = jnext) {
271 unsigned long long ldsize;
272 char dvname[20];
273 char *dnprintable = dv->devname;
274 int err;
275
276 next = dv->next;
277 jnext = 0;
278
279 if (strcmp(dv->devname, "failed")==0 ||
280 strcmp(dv->devname, "faulty")==0) {
281 if (dv->disposition != 'r') {
282 fprintf(stderr, Name ": %s only meaningful "
283 "with -r, not -%c\n",
284 dv->devname, dv->disposition);
285 return 1;
286 }
287 for (; j < array.raid_disks + array.nr_disks ; j++) {
288 disc.number = j;
289 if (ioctl(fd, GET_DISK_INFO, &disc))
290 continue;
291 if (disc.major == 0 && disc.minor == 0)
292 continue;
293 if ((disc.state & 1) == 0) /* faulty */
294 continue;
295 stb.st_rdev = makedev(disc.major, disc.minor);
296 next = dv;
297 jnext = j+1;
298 sprintf(dvname,"%d:%d", disc.major, disc.minor);
299 dnprintable = dvname;
300 break;
301 }
302 if (jnext == 0)
303 continue;
304 } else if (strcmp(dv->devname, "detached") == 0) {
305 if (dv->disposition != 'r' && dv->disposition != 'f') {
306 fprintf(stderr, Name ": %s only meaningful "
307 "with -r of -f, not -%c\n",
308 dv->devname, dv->disposition);
309 return 1;
310 }
311 for (; j < array.raid_disks + array.nr_disks; j++) {
312 int sfd;
313 disc.number = j;
314 if (ioctl(fd, GET_DISK_INFO, &disc))
315 continue;
316 if (disc.major == 0 && disc.minor == 0)
317 continue;
318 sprintf(dvname,"%d:%d", disc.major, disc.minor);
319 sfd = dev_open(dvname, O_RDONLY);
320 if (sfd >= 0) {
321 close(sfd);
322 continue;
323 }
324 if (dv->disposition == 'f' &&
325 (disc.state & 1) == 1) /* already faulty */
326 continue;
327 if (errno != ENXIO)
328 continue;
329 stb.st_rdev = makedev(disc.major, disc.minor);
330 next = dv;
331 jnext = j+1;
332 dnprintable = dvname;
333 break;
334 }
335 if (jnext == 0)
336 continue;
337 } else {
338 j = 0;
339
340 if (stat(dv->devname, &stb)) {
341 fprintf(stderr, Name ": cannot find %s: %s\n",
342 dv->devname, strerror(errno));
343 return 1;
344 }
345 if ((stb.st_mode & S_IFMT) != S_IFBLK) {
346 fprintf(stderr, Name ": %s is not a "
347 "block device.\n",
348 dv->devname);
349 return 1;
350 }
351 }
352 switch(dv->disposition){
353 default:
354 fprintf(stderr, Name ": internal error - devmode[%s]=%d\n",
355 dv->devname, dv->disposition);
356 return 1;
357 case 'a':
358 /* add the device */
359 if (tst->subarray[0]) {
360 fprintf(stderr, Name ": Cannot add disks to a"
361 " \'member\' array, perform this"
362 " operation on the parent container\n");
363 return 1;
364 }
365 /* Make sure it isn't in use (in 2.6 or later) */
366 tfd = open(dv->devname, O_RDONLY|O_EXCL|O_DIRECT);
367 if (tfd < 0) {
368 fprintf(stderr, Name ": Cannot open %s: %s\n",
369 dv->devname, strerror(errno));
370 return 1;
371 }
372 remove_partitions(tfd);
373
374 st = dup_super(tst);
375
376 if (array.not_persistent==0)
377 st->ss->load_super(st, tfd, NULL);
378
379 if (!get_dev_size(tfd, dv->devname, &ldsize)) {
380 close(tfd);
381 return 1;
382 }
383 close(tfd);
384
385
386 if (!tst->ss->external &&
387 array.major_version == 0 &&
388 md_get_version(fd)%100 < 2) {
389 if (ioctl(fd, HOT_ADD_DISK,
390 (unsigned long)stb.st_rdev)==0) {
391 if (verbose >= 0)
392 fprintf(stderr, Name ": hot added %s\n",
393 dv->devname);
394 continue;
395 }
396
397 fprintf(stderr, Name ": hot add failed for %s: %s\n",
398 dv->devname, strerror(errno));
399 return 1;
400 }
401
402 if (array.not_persistent == 0) {
403
404 /* Make sure device is large enough */
405 if (tst->ss->avail_size(tst, ldsize/512) <
406 array_size) {
407 fprintf(stderr, Name ": %s not large enough to join array\n",
408 dv->devname);
409 return 1;
410 }
411
412 /* need to find a sample superblock to copy, and
413 * a spare slot to use
414 */
415 for (j = 0; j < tst->max_devs; j++) {
416 char *dev;
417 int dfd;
418 disc.number = j;
419 if (ioctl(fd, GET_DISK_INFO, &disc))
420 continue;
421 if (disc.major==0 && disc.minor==0)
422 continue;
423 if ((disc.state & 4)==0) continue; /* sync */
424 /* Looks like a good device to try */
425 dev = map_dev(disc.major, disc.minor, 1);
426 if (!dev) continue;
427 dfd = dev_open(dev, O_RDONLY);
428 if (dfd < 0) continue;
429 if (tst->ss->load_super(tst, dfd,
430 NULL)) {
431 close(dfd);
432 continue;
433 }
434 close(dfd);
435 break;
436 }
437 if (!tst->sb) {
438 fprintf(stderr, Name ": cannot find valid superblock in this array - HELP\n");
439 return 1;
440 }
441 /* Possibly this device was recently part of the array
442 * and was temporarily removed, and is now being re-added.
443 * If so, we can simply re-add it.
444 */
445 tst->ss->uuid_from_super(tst, duuid);
446
447 /* re-add doesn't work for version-1 superblocks
448 * before 2.6.18 :-(
449 */
450 if (array.major_version == 1 &&
451 get_linux_version() <= 2006018)
452 ;
453 else if (st->sb) {
454 st->ss->uuid_from_super(st, ouuid);
455 if (memcmp(duuid, ouuid, sizeof(ouuid))==0) {
456 /* looks close enough for now. Kernel
457 * will worry about whether a bitmap
458 * based reconstruction is possible.
459 */
460 struct mdinfo mdi;
461 st->ss->getinfo_super(st, &mdi);
462 disc.major = major(stb.st_rdev);
463 disc.minor = minor(stb.st_rdev);
464 disc.number = mdi.disk.number;
465 disc.raid_disk = mdi.disk.raid_disk;
466 disc.state = mdi.disk.state;
467 if (dv->writemostly)
468 disc.state |= 1 << MD_DISK_WRITEMOSTLY;
469 if (ioctl(fd, ADD_NEW_DISK, &disc) == 0) {
470 if (verbose >= 0)
471 fprintf(stderr, Name ": re-added %s\n", dv->devname);
472 continue;
473 }
474 /* fall back on normal-add */
475 }
476 }
477 } else {
478 /* non-persistent. Must ensure that new drive
479 * is at least array.size big.
480 */
481 if (ldsize/512 < array_size) {
482 fprintf(stderr, Name ": %s not large enough to join array\n",
483 dv->devname);
484 return 1;
485 }
486 }
487 /* in 2.6.17 and earlier, version-1 superblocks won't
488 * use the number we write, but will choose a free number.
489 * we must choose the same free number, which requires
490 * starting at 'raid_disks' and counting up
491 */
492 for (j = array.raid_disks; j< tst->max_devs; j++) {
493 disc.number = j;
494 if (ioctl(fd, GET_DISK_INFO, &disc))
495 break;
496 if (disc.major==0 && disc.minor==0)
497 break;
498 if (disc.state & 8) /* removed */
499 break;
500 }
501 disc.major = major(stb.st_rdev);
502 disc.minor = minor(stb.st_rdev);
503 disc.number =j;
504 disc.state = 0;
505 if (array.not_persistent==0) {
506 int dfd;
507 if (dv->writemostly)
508 disc.state |= 1 << MD_DISK_WRITEMOSTLY;
509 dfd = open(dv->devname, O_RDWR | O_EXCL|O_DIRECT);
510 tst->ss->add_to_super(tst, &disc, dfd,
511 dv->devname);
512 /* write_init_super will close 'dfd' */
513 if (tst->ss->write_init_super(tst))
514 return 1;
515 } else if (dv->re_add) {
516 /* this had better be raid1.
517 * As we are "--re-add"ing we must find a spare slot
518 * to fill.
519 */
520 char *used = malloc(array.raid_disks);
521 memset(used, 0, array.raid_disks);
522 for (j=0; j< tst->max_devs; j++) {
523 mdu_disk_info_t disc2;
524 disc2.number = j;
525 if (ioctl(fd, GET_DISK_INFO, &disc2))
526 continue;
527 if (disc2.major==0 && disc2.minor==0)
528 continue;
529 if (disc2.state & 8) /* removed */
530 continue;
531 if (disc2.raid_disk < 0)
532 continue;
533 if (disc2.raid_disk > array.raid_disks)
534 continue;
535 used[disc2.raid_disk] = 1;
536 }
537 for (j=0 ; j<array.raid_disks; j++)
538 if (!used[j]) {
539 disc.raid_disk = j;
540 disc.state |= (1<<MD_DISK_SYNC);
541 break;
542 }
543 }
544 if (dv->writemostly)
545 disc.state |= (1 << MD_DISK_WRITEMOSTLY);
546 if (ioctl(fd,ADD_NEW_DISK, &disc)) {
547 fprintf(stderr, Name ": add new device failed for %s as %d: %s\n",
548 dv->devname, j, strerror(errno));
549 return 1;
550 }
551 if (verbose >= 0)
552 fprintf(stderr, Name ": added %s\n", dv->devname);
553 break;
554
555 case 'r':
556 /* hot remove */
557 if (tst->subarray[0]) {
558 fprintf(stderr, Name ": Cannot remove disks from a"
559 " \'member\' array, perform this"
560 " operation on the parent container\n");
561 return 1;
562 }
563 if (tst->ss->external) {
564 /* To remove a device from a container, we must
565 * check that it isn't in use in an array.
566 * This involves looking in the 'holders'
567 * directory - there must be just one entry,
568 * the container.
569 * To ensure that it doesn't get used as a
570 * hold spare while we are checking, we
571 * get an O_EXCL open on the container
572 */
573 int dnum = fd2devnum(fd);
574 lfd = open_dev_excl(dnum);
575 if (lfd < 0) {
576 fprintf(stderr, Name
577 ": Cannot get exclusive access "
578 " to container - odd\n");
579 return 1;
580 }
581 if (!sysfs_unique_holder(dnum, stb.st_rdev)) {
582 fprintf(stderr, Name
583 ": %s is %s, cannot remove.\n",
584 dnprintable,
585 errno == EEXIST ? "still in use":
586 "not a member");
587 close(lfd);
588 return 1;
589 }
590 }
591 /* FIXME check that it is a current member */
592 err = ioctl(fd, HOT_REMOVE_DISK, (unsigned long)stb.st_rdev);
593 if (err && errno == ENODEV) {
594 /* Old kernels rejected this if no personality
595 * registered */
596 struct mdinfo *sra = sysfs_read(fd, 0, GET_DEVS);
597 struct mdinfo *dv = NULL;
598 if (sra)
599 dv = sra->devs;
600 for ( ; dv ; dv=dv->next)
601 if (dv->disk.major == major(stb.st_rdev) &&
602 dv->disk.minor == minor(stb.st_rdev))
603 break;
604 if (dv)
605 err = sysfs_set_str(sra, dv,
606 "state", "remove");
607 else
608 err = -1;
609 if (sra)
610 sysfs_free(sra);
611 }
612 if (err) {
613 fprintf(stderr, Name ": hot remove failed "
614 "for %s: %s\n", dnprintable,
615 strerror(errno));
616 if (lfd >= 0)
617 close(lfd);
618 return 1;
619 }
620 close(lfd);
621 if (verbose >= 0)
622 fprintf(stderr, Name ": hot removed %s\n",
623 dnprintable);
624 break;
625
626 case 'f': /* set faulty */
627 /* FIXME check current member */
628 if (ioctl(fd, SET_DISK_FAULTY, (unsigned long) stb.st_rdev)) {
629 fprintf(stderr, Name ": set device faulty failed for %s: %s\n",
630 dnprintable, strerror(errno));
631 return 1;
632 }
633 if (verbose >= 0)
634 fprintf(stderr, Name ": set %s faulty in %s\n",
635 dnprintable, devname);
636 break;
637 }
638 }
639 return 0;
640
641 }
642
643 int autodetect(void)
644 {
645 /* Open any md device, and issue the RAID_AUTORUN ioctl */
646 int rv = 1;
647 int fd = dev_open("9:0", O_RDONLY);
648 if (fd >= 0) {
649 if (ioctl(fd, RAID_AUTORUN, 0) == 0)
650 rv = 0;
651 close(fd);
652 }
653 return rv;
654 }
655 #endif