2 * mdadm - manage Linux "md" devices aka RAID arrays.
4 * Copyright (C) 2001-2004 Neil Brown <neilb@cse.unsw.edu.au>
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
22 * Email: <neilb@cse.unsw.edu.au>
24 * School of Computer Science and Engineering
25 * The University of New South Wales
33 * All handling for the 0.90.0 version superblock is in
36 * - finding, loading, and writing the superblock.
37 * - initialising a new superblock
38 * - printing the superblock for --examine
39 * - printing part of the superblock for --detail
/*
 * calc_sb0_csum - compute the checksum of a 0.90 superblock.
 *
 * The sb_csum currently stored in the superblock is saved in a local,
 * calc_csum() is run over MD_SB_BYTES of the superblock, and the saved
 * value is then written back to super->sb_csum, so the caller's
 * superblock keeps the sb_csum it arrived with.
 *
 * NOTE(review): presumably sb_csum is cleared before calc_csum() runs
 * and newcsum is returned; those statements are not visible in this
 * view - confirm against the full file.
 */
44 static unsigned long calc_sb0_csum(mdp_super_t
*super
)
46 unsigned long csum
= super
->sb_csum
;
47 unsigned long newcsum
;
49 newcsum
= calc_csum(super
, MD_SB_BYTES
);
50 super
->sb_csum
= csum
;
/*
 * examine_super0 - print the contents of a 0.90 superblock with printf().
 *
 * sbv is used as an mdp_super_t pointer.  The visible code prints, in
 * order: magic, version, UUID (all four words when minor_version >= 90,
 * otherwise only set_uuid0), creation time, raid level (name from
 * map_num(pers, ...), or "-unknown-" when that returns NULL), device
 * size (only when (int)level >= 0), device counts, preferred minor,
 * update time, clean/active state, per-state device counts, the stored
 * checksum compared against calc_sb0_csum(), the event counter as
 * "hi.lo", layout, chunk size or rounding in K, and finally a table of
 * member devices.
 *
 * The device table loop runs d from -1 up to raid_disks + spare_disks:
 * d == -1 describes sb->this_disk and is labelled "this", every other d
 * describes sb->disks[d].  For each entry the state bits FAULTY, ACTIVE,
 * SYNC and REMOVED are printed, a state of 0 is printed as "spare", and
 * map_dev() is called with the entry's major/minor.
 *
 * NOTE(review): the loop bound is taken straight from the superblock
 * and is not visibly checked against MD_SB_DISKS before indexing
 * sb->disks[] - confirm a corrupt superblock cannot walk off the array.
 * NOTE(review): sprintf() writes into nb, whose size is not visible
 * here - confirm it can hold any formatted int.
 */
54 static void examine_super0(void *sbv
)
56 mdp_super_t
*sb
= sbv
;
61 printf(" Magic : %08x\n", sb
->md_magic
);
62 printf(" Version : %02d.%02d.%02d\n", sb
->major_version
, sb
->minor_version
,
64 if (sb
->minor_version
>= 90)
65 printf(" UUID : %08x:%08x:%08x:%08x\n", sb
->set_uuid0
, sb
->set_uuid1
,
66 sb
->set_uuid2
, sb
->set_uuid3
);
68 printf(" UUID : %08x\n", sb
->set_uuid0
);
71 printf(" Creation Time : %.24s\n", ctime(&atime
));
72 c
=map_num(pers
, sb
->level
);
73 printf(" Raid Level : %s\n", c
?c
:"-unknown-");
74 if ((int)sb
->level
>= 0)
75 printf(" Device Size : %d%s\n", sb
->size
, human_size((long long)sb
->size
<<10));
76 printf(" Raid Devices : %d\n", sb
->raid_disks
);
77 printf(" Total Devices : %d\n", sb
->nr_disks
);
78 printf("Preferred Minor : %d\n", sb
->md_minor
);
81 printf(" Update Time : %.24s\n", ctime(&atime
));
82 printf(" State : %s\n",
83 (sb
->state
&(1<<MD_SB_CLEAN
))?"clean":"active");
84 printf(" Active Devices : %d\n", sb
->active_disks
);
85 printf("Working Devices : %d\n", sb
->working_disks
);
86 printf(" Failed Devices : %d\n", sb
->failed_disks
);
87 printf(" Spare Devices : %d\n", sb
->spare_disks
);
88 if (calc_sb0_csum(sb
) == sb
->sb_csum
)
89 printf(" Checksum : %x - correct\n", sb
->sb_csum
);
91 printf(" Checksum : %x - expected %lx\n", sb
->sb_csum
, calc_sb0_csum(sb
));
92 printf(" Events : %d.%d\n", sb
->events_hi
, sb
->events_lo
);
95 c
= map_num(r5layout
, sb
->layout
);
96 printf(" Layout : %s\n", c
?c
:"-unknown-");
102 printf(" Chunk Size : %dK\n", sb
->chunk_size
/1024);
105 printf(" Rounding : %dK\n", sb
->chunk_size
/1024);
110 printf(" Number Major Minor RaidDevice State\n");
111 for (d
= -1; d
<(signed int)(sb
->raid_disks
+sb
->spare_disks
); d
++) {
115 if (d
>=0) dp
= &sb
->disks
[d
];
116 else dp
= &sb
->this_disk
;
117 sprintf(nb
, "%4d", d
);
118 printf("%4s %5d %5d %5d %5d ", d
< 0 ? "this" : nb
,
119 dp
->number
, dp
->major
, dp
->minor
, dp
->raid_disk
);
120 if (dp
->state
& (1<<MD_DISK_FAULTY
)) printf(" faulty");
121 if (dp
->state
& (1<<MD_DISK_ACTIVE
)) printf(" active");
122 if (dp
->state
& (1<<MD_DISK_SYNC
)) printf(" sync");
123 if (dp
->state
& (1<<MD_DISK_REMOVED
)) printf(" removed");
124 if (dp
->state
== 0) printf(" spare");
125 if ((dv
=map_dev(dp
->major
, dp
->minor
)))
128 if (d
== -1) printf("\n");
/*
 * brief_examine_super0 - print a one-line "ARRAY ..." description of
 * the array recorded in a 0.90 superblock.
 *
 * The line carries the name returned by get_md_name(sb->md_minor), the
 * level name from map_num(pers, sb->level) (or "-unknown-" when that is
 * NULL), the number of raid devices, and the UUID: four 32-bit words
 * separated by ':' when minor_version >= 90, otherwise set_uuid0 only.
 */
132 static void brief_examine_super0(void *sbv
)
134 mdp_super_t
*sb
= sbv
;
135 char *c
=map_num(pers
, sb
->level
);
137 printf("ARRAY %s level=%s num-devices=%d UUID=",
138 get_md_name(sb
->md_minor
),
139 c
?c
:"-unknown-", sb
->raid_disks
);
140 if (sb
->minor_version
>= 90)
141 printf("%08x:%08x:%08x:%08x", sb
->set_uuid0
, sb
->set_uuid1
,
142 sb
->set_uuid2
, sb
->set_uuid3
);
144 printf("%08x", sb
->set_uuid0
);
/*
 * detail_super0 - print the superblock-specific part of the detail
 * output: the UUID followed by the event counter.
 *
 * The UUID is printed as four ':'-separated 32-bit hex words when
 * minor_version >= 90 and as set_uuid0 alone otherwise.  The event
 * counter is printed as "events_hi.events_lo".
 */
148 static void detail_super0(void *sbv
)
150 mdp_super_t
*sb
= sbv
;
152 if (sb
->minor_version
>= 90)
153 printf("%08x:%08x:%08x:%08x", sb
->set_uuid0
, sb
->set_uuid1
,
154 sb
->set_uuid2
, sb
->set_uuid3
);
156 printf("%08x", sb
->set_uuid0
);
157 printf("\n Events : %d.%d\n\n", sb
->events_hi
, sb
->events_lo
);
/*
 * brief_detail_super0 - print only the UUID from a 0.90 superblock.
 *
 * Four ':'-separated 32-bit hex words are printed when
 * minor_version >= 90; otherwise only set_uuid0 is printed.
 */
160 static void brief_detail_super0(void *sbv
)
162 mdp_super_t
*sb
= sbv
;
164 if (sb
->minor_version
>= 90)
165 printf("%08x:%08x:%08x:%08x", sb
->set_uuid0
, sb
->set_uuid1
,
166 sb
->set_uuid2
, sb
->set_uuid3
);
168 printf("%08x", sb
->set_uuid0
);
/*
 * uuid_from_super0 - copy the array UUID out of a 0.90 superblock.
 *
 * uuid[0] always receives set_uuid0.  When minor_version >= 90 the
 * remaining three words are copied from set_uuid1..set_uuid3.
 *
 * NOTE(review): what uuid[1..3] receive for older minor versions is not
 * visible in this view - confirm they are initialised on that path.
 */
171 static void uuid_from_super0(int uuid
[4], void * sbv
)
173 mdp_super_t
*super
= sbv
;
174 uuid
[0] = super
->set_uuid0
;
175 if (super
->minor_version
>= 90) {
176 uuid
[1] = super
->set_uuid1
;
177 uuid
[2] = super
->set_uuid2
;
178 uuid
[3] = super
->set_uuid3
;
/*
 * getinfo_super0 - fill a struct mdinfo from a 0.90 superblock.
 *
 * Copies the version numbers, raid_disks, level, md_minor and ctime
 * into info->array, copies state/major/minor/raid_disk of
 * sb->this_disk into info->disk, stores md_event(sb) in info->events
 * and fills info->uuid through uuid_from_super0().
 *
 * info->array.working_disks is not copied from the superblock: the
 * loop over all MD_SB_DISKS slots tests for entries that are both SYNC
 * and ACTIVE and not FAULTY, and the result held in "working" is
 * stored.
 *
 * NOTE(review): the statement that counts matching slots into
 * "working", and its initialisation, are not visible here - confirm.
 */
186 static void getinfo_super0(struct mdinfo
*info
, void *sbv
)
188 mdp_super_t
*sb
= sbv
;
192 info
->array
.major_version
= sb
->major_version
;
193 info
->array
.minor_version
= sb
->minor_version
;
194 info
->array
.patch_version
= sb
->patch_version
;
195 info
->array
.raid_disks
= sb
->raid_disks
;
196 info
->array
.level
= sb
->level
;
197 info
->array
.md_minor
= sb
->md_minor
;
198 info
->array
.ctime
= sb
->ctime
;
200 info
->disk
.state
= sb
->this_disk
.state
;
201 info
->disk
.major
= sb
->this_disk
.major
;
202 info
->disk
.minor
= sb
->this_disk
.minor
;
203 info
->disk
.raid_disk
= sb
->this_disk
.raid_disk
;
205 info
->events
= md_event(sb
);
207 uuid_from_super0(info
->uuid
, sbv
);
209 /* work_disks is calculated rather than read directly */
210 for (i
=0; i
< MD_SB_DISKS
; i
++)
211 if ((sb
->disks
[i
].state
& (1<<MD_DISK_SYNC
)) &&
212 (sb
->disks
[i
].state
& (1<<MD_DISK_ACTIVE
)) &&
213 !(sb
->disks
[i
].state
& (1<<MD_DISK_FAULTY
)))
215 info
->array
.working_disks
= working
;
/*
 * update_super0 - apply a named update to a 0.90 superblock in memory
 * and recompute its checksum.
 *
 * "update" is compared with strcmp() against each of the following
 * names; the matching section modifies the superblock:
 *
 *   "sparc2.2"    copy the tail of the superblock (from word
 *                 MD_SB_GENERIC_CONSTANT_WORDS+7+1 onwards) up by one
 *                 32-bit word and report it on stderr.
 *   "super-minor" set sb->md_minor from info->array.md_minor and report
 *                 the new minor on stderr.
 *   "summaries"   walk all MD_SB_DISKS slots; slots with a non-zero
 *                 major or minor are classified by their REMOVED /
 *                 ACTIVE / FAULTY bits, and slots at or beyond
 *                 raid_disks whose number is 0 get their state cleared.
 *   "force"       set events_hi/events_lo from info->events; for levels
 *                 4, 5 and 6 also set the MD_SB_CLEAN bit.
 *   "assemble"    set sb->disks[info->disk.number].state from
 *                 info->disk.state when the two differ.
 *   "newdev"      zero sb->disks[info->disk.number], fill it from
 *                 info->disk, and copy it to sb->this_disk.
 *   "grow"        copy raid_disks, nr_disks, active_disks and
 *                 working_disks from info->array, rebuild the slot
 *                 for info->disk.number, and refresh sb->this_disk when
 *                 it has that same number.
 *   "resync"      clear the MD_SB_CLEAN bit.
 *
 * After the update sections sb->sb_csum is set from calc_sb0_csum(sb).
 *
 * NOTE(review): in the "sparc2.2" section the memcpy() destination and
 * source are one 32-bit word apart inside the same buffer, so the two
 * regions overlap; memcpy() on overlapping regions is undefined
 * behaviour and memmove() is the function specified for that case.
 * NOTE(review): info->disk.number is used as an index into sb->disks[]
 * in "assemble", "newdev" and "grow" with no range check visible here -
 * confirm callers guarantee 0 <= number < MD_SB_DISKS.
 * NOTE(review): the "sparc2.2" message spells "compatability".
 * NOTE(review): the return value and the use of "verbose" are not
 * visible in this view.
 */
219 static int update_super0(struct mdinfo
*info
, void *sbv
, char *update
, char *devname
, int verbose
)
222 mdp_super_t
*sb
= sbv
;
223 if (strcmp(update
, "sparc2.2")==0 ) {
224 /* 2.2 sparc put the events in the wrong place
225 * So we copy the tail of the superblock
226 * up 4 bytes before continuing
228 __u32
*sb32
= (__u32
*)sb
;
229 memcpy(sb32
+MD_SB_GENERIC_CONSTANT_WORDS
+7,
230 sb32
+MD_SB_GENERIC_CONSTANT_WORDS
+7+1,
231 (MD_SB_WORDS
- (MD_SB_GENERIC_CONSTANT_WORDS
+7+1))*4);
232 fprintf (stderr
, Name
": adjusting superblock of %s for 2.2/sparc compatability.\n",
235 if (strcmp(update
, "super-minor") ==0) {
236 sb
->md_minor
= info
->array
.md_minor
;
238 fprintf(stderr
, Name
": updating superblock of %s with minor number %d\n",
239 devname
, info
->array
.md_minor
);
241 if (strcmp(update
, "summaries") == 0) {
243 /* set nr_disks, active_disks, working_disks,
244 * failed_disks, spare_disks based on disks[]
245 * array in superblock.
246 * Also make sure extra slots aren't 'failed'
248 sb
->nr_disks
= sb
->active_disks
=
249 sb
->working_disks
= sb
->failed_disks
=
251 for (i
=0; i
< MD_SB_DISKS
; i
++)
252 if (sb
->disks
[i
].major
||
253 sb
->disks
[i
].minor
) {
254 int state
= sb
->disks
[i
].state
;
255 if (state
& (1<<MD_DISK_REMOVED
))
258 if (state
& (1<<MD_DISK_ACTIVE
))
260 if (state
& (1<<MD_DISK_FAULTY
))
266 } else if (i
>= sb
->raid_disks
&& sb
->disks
[i
].number
== 0)
267 sb
->disks
[i
].state
= 0;
269 if (strcmp(update
, "force")==0) {
270 sb
->events_hi
= (info
->events
>>32) & 0xFFFFFFFF;
271 sb
->events_lo
= (info
->events
) & 0xFFFFFFFF;
272 if (sb
->level
== 5 || sb
->level
== 4 || sb
->level
== 6)
273 /* need to force clean */
274 sb
->state
|= (1 << MD_SB_CLEAN
);
276 if (strcmp(update
, "assemble")==0) {
277 int d
= info
->disk
.number
;
278 if (sb
->disks
[d
].state
!= info
->disk
.state
) {
279 sb
->disks
[d
].state
= info
->disk
.state
;
283 if (strcmp(update
, "newdev") == 0) {
284 int d
= info
->disk
.number
;
285 memset(&sb
->disks
[d
], 0, sizeof(sb
->disks
[d
]));
286 sb
->disks
[d
].number
= d
;
287 sb
->disks
[d
].major
= info
->disk
.major
;
288 sb
->disks
[d
].minor
= info
->disk
.minor
;
289 sb
->disks
[d
].raid_disk
= info
->disk
.raid_disk
;
290 sb
->disks
[d
].state
= info
->disk
.state
;
291 sb
->this_disk
= sb
->disks
[d
];
293 if (strcmp(update
, "grow") == 0) {
294 sb
->raid_disks
= info
->array
.raid_disks
;
295 sb
->nr_disks
= info
->array
.nr_disks
;
296 sb
->active_disks
= info
->array
.active_disks
;
297 sb
->working_disks
= info
->array
.working_disks
;
298 memset(&sb
->disks
[info
->disk
.number
], 0, sizeof(sb
->disks
[0]));
299 sb
->disks
[info
->disk
.number
].number
= info
->disk
.number
;
300 sb
->disks
[info
->disk
.number
].major
= info
->disk
.major
;
301 sb
->disks
[info
->disk
.number
].minor
= info
->disk
.minor
;
302 sb
->disks
[info
->disk
.number
].raid_disk
= info
->disk
.raid_disk
;
303 sb
->disks
[info
->disk
.number
].state
= info
->disk
.state
;
304 if (sb
->this_disk
.number
== info
->disk
.number
)
305 sb
->this_disk
= sb
->disks
[info
->disk
.number
];
307 if (strcmp(update
, "resync") == 0) {
308 /* make sure resync happens */
309 sb
->state
&= ~(1<<MD_SB_CLEAN
);
313 sb
->sb_csum
= calc_sb0_csum(sb
);
/*
 * event_super0 - event-counter accessor for a 0.90 superblock.
 *
 * sbv is used as an mdp_super_t pointer and the result type is __u64.
 *
 * NOTE(review): the statement producing the return value is not visible
 * in this view; presumably it returns the same 64-bit event count that
 * getinfo_super0() obtains from md_event() - confirm.
 */
317 static __u64
event_super0(void *sbv
)
319 mdp_super_t
*sb
= sbv
;
/*
 * init_super0 - allocate and initialise a new 0.90 superblock from the
 * array description in "info".
 *
 * MD_SB_BYTES are allocated with malloc() and zeroed.  A major_version
 * of -1 in info selects the "zeroing the superblock" case.  Otherwise
 * the number of spares is taken as working_disks - active_disks, and a
 * request where raid_disks + spares exceeds MD_SB_DISKS is reported on
 * stderr as too many devices.
 *
 * The superblock is then stamped with MD_SB_MAGIC and version 0.90.0,
 * the four UUID words are filled from random(), and level, size, disk
 * counts, md_minor, state, layout and chunk_size are copied from info.
 * utime is set equal to ctime.
 *
 * NOTE(review): the malloc() result is passed to memset() with no NULL
 * check visible here - confirm allocation failure is handled.
 * NOTE(review): how the new superblock is handed back through sbp, the
 * return values, and where ctime is set are not visible in this view.
 */
325 static int init_super0(void **sbp
, mdu_array_info_t
*info
)
327 mdp_super_t
*sb
= malloc(MD_SB_BYTES
);
329 memset(sb
, 0, MD_SB_BYTES
);
331 if (info
->major_version
== -1) {
332 /* zeroing the superblock */
336 spares
= info
->working_disks
- info
->active_disks
;
337 if (info
->raid_disks
+ spares
> MD_SB_DISKS
) {
338 fprintf(stderr
, Name
": too many devices requested: %d+%d > %d\n",
339 info
->raid_disks
, spares
, MD_SB_DISKS
);
343 sb
->md_magic
= MD_SB_MAGIC
;
344 sb
->major_version
= 0;
345 sb
->minor_version
= 90;
346 sb
->patch_version
= 0;
347 sb
->gvalid_words
= 0; /* ignored */
348 sb
->set_uuid0
= random();
350 sb
->level
= info
->level
;
351 sb
->size
= info
->size
;
352 sb
->nr_disks
= info
->nr_disks
;
353 sb
->raid_disks
= info
->raid_disks
;
354 sb
->md_minor
= info
->md_minor
;
355 sb
->not_persistent
= 0;
356 sb
->set_uuid1
= random();
357 sb
->set_uuid2
= random();
358 sb
->set_uuid3
= random();
360 sb
->utime
= sb
->ctime
;
361 sb
->state
= info
->state
;
362 sb
->active_disks
= info
->active_disks
;
363 sb
->working_disks
= info
->working_disks
;
364 sb
->failed_disks
= info
->failed_disks
;
368 sb
->layout
= info
->layout
;
369 sb
->chunk_size
= info
->chunk_size
;
375 /* Add a device to the superblock being created */
/*
 * The slot sb->disks[dinfo->number] is filled with the number, major,
 * minor, raid_disk and state fields of dinfo; nothing else in the
 * superblock is touched by the visible code.
 *
 * NOTE(review): dinfo->number is used as the array index with no range
 * check visible here - confirm callers keep it below MD_SB_DISKS.
 */
376 static void add_to_super0(void *sbv
, mdu_disk_info_t
*dinfo
)
378 mdp_super_t
*sb
= sbv
;
379 mdp_disk_t
*dk
= &sb
->disks
[dinfo
->number
];
381 dk
->number
= dinfo
->number
;
382 dk
->major
= dinfo
->major
;
383 dk
->minor
= dinfo
->minor
;
384 dk
->raid_disk
= dinfo
->raid_disk
;
385 dk
->state
= dinfo
->state
;
/*
 * store_super0 - write a 0.90 superblock to its location on the device
 * open on fd.
 *
 * The device size is queried with the BLKGETSIZE64 ioctl; when that
 * fails the BLKGETSIZE ioctl is tried and its result is shifted left by
 * 9 into dsize.  A device with dsize below MD_RESERVED_SECTORS*2 is
 * rejected.  The superblock position is derived from
 * MD_NEW_SIZE_SECTORS(dsize>>9), the file offset is moved there with
 * lseek64(), and sizeof(*super) bytes are written; a short write is
 * treated as failure.
 *
 * NOTE(review): dsize looks like a byte count (BLKGETSIZE result << 9)
 * yet it is compared with a value built from MD_RESERVED_SECTORS -
 * confirm the intended units of that check.
 * NOTE(review): MD_NEW_SIZE_SECTORS() is given a sector count; any
 * conversion of "offset" back to bytes before lseek64(), and the
 * individual return codes, are not visible in this view.
 */
388 static int store_super0(int fd
, void *sbv
)
391 unsigned long long dsize
;
392 unsigned long long offset
;
393 mdp_super_t
*super
= sbv
;
396 if (ioctl(fd
, BLKGETSIZE64
, &dsize
) != 0)
399 if (ioctl(fd
, BLKGETSIZE
, &size
))
402 dsize
= ((unsigned long long)size
)<<9;
405 if (dsize
< MD_RESERVED_SECTORS
*2)
408 offset
= MD_NEW_SIZE_SECTORS(dsize
>>9);
412 if (lseek64(fd
, offset
, 0)< 0LL)
415 if (write(fd
, super
, sizeof(*super
)) != sizeof(*super
))
/*
 * write_init_super0 - write a freshly initialised superblock to one
 * member device.
 *
 * devname is opened, sb->this_disk is set to the slot
 * sb->disks[dinfo->number], the checksum is recomputed with
 * calc_sb0_csum(), and the superblock is written through
 * store_super0().  Failure to open the device and failure to write the
 * superblock are each reported on stderr.
 *
 * NOTE(review): open() is called as open(devname, O_RDWR, O_EXCL), so
 * O_EXCL lands in the third (mode) argument, which open() only consults
 * when creating a file; the flags argument is O_RDWR alone.  If an
 * exclusive open was intended the flags would need to be
 * O_RDWR|O_EXCL - confirm intent.
 * NOTE(review): closing fd and the return value are not visible in this
 * view.
 */
421 static int write_init_super0(struct supertype
*st
, void *sbv
, mdu_disk_info_t
*dinfo
, char *devname
)
423 mdp_super_t
*sb
= sbv
;
424 int fd
= open(devname
, O_RDWR
, O_EXCL
);
428 fprintf(stderr
, Name
": Failed to open %s to write superblock\n", devname
);
432 sb
->this_disk
= sb
->disks
[dinfo
->number
];
433 sb
->sb_csum
= calc_sb0_csum(sb
);
434 rv
= store_super0(fd
, sb
);
437 fprintf(stderr
, Name
": failed to write superblock to %s\n", devname
);
/*
 * compare_super0 - decide whether two 0.90 superblocks describe the
 * same array.
 *
 * *firstp is the reference superblock and secondv the candidate.  The
 * candidate's md_magic is checked against MD_SB_MAGIC first.  On the
 * path where a reference has to be created, MD_SB_BYTES are allocated
 * and the candidate is copied into them.  Otherwise the UUIDs obtained
 * through uuid_from_super0() are compared with same_uuid(), followed by
 * the three version numbers, gvalid_words, ctime, level, size and
 * raid_disks.
 *
 * NOTE(review): the condition guarding the malloc()/memcpy() path, the
 * store back into *firstp, the NULL check on malloc(), and the value
 * returned from each test are not visible in this view - the original
 * comment fragment kept below lists only two of the result codes.
 */
441 static int compare_super0(void **firstp
, void *secondv
)
445 * 0 same, or first was empty, and second was copied
446 * 1 second had wrong number
450 mdp_super_t
*first
= *firstp
;
451 mdp_super_t
*second
= secondv
;
453 int uuid1
[4], uuid2
[4];
454 if (second
->md_magic
!= MD_SB_MAGIC
)
457 first
= malloc(MD_SB_BYTES
);
458 memcpy(first
, second
, MD_SB_BYTES
);
463 uuid_from_super0(uuid1
, first
);
464 uuid_from_super0(uuid2
, second
);
465 if (!same_uuid(uuid1
, uuid2
))
467 if (first
->major_version
!= second
->major_version
||
468 first
->minor_version
!= second
->minor_version
||
469 first
->patch_version
!= second
->patch_version
||
470 first
->gvalid_words
!= second
->gvalid_words
||
471 first
->ctime
!= second
->ctime
||
472 first
->level
!= second
->level
||
473 first
->size
!= second
->size
||
474 first
->raid_disks
!= second
->raid_disks
)
/*
 * load_super0 - read a 0.90 superblock from the device open on fd.
 *
 * The device size is taken from the BLKGETSIZE64 ioctl, falling back to
 * BLKGETSIZE.  Devices with dsize below MD_RESERVED_SECTORS*2 are
 * rejected as too small.  The superblock position is derived from
 * MD_NEW_SIZE_SECTORS(dsize>>9); BLKFLSBUF is issued so that current
 * data is read, the file offset is moved with lseek64(), MD_SB_BYTES
 * are allocated and the superblock is read into them.  The result is
 * then validated: md_magic must equal MD_SB_MAGIC and major_version
 * must be 0.  When st->ss is NULL, st->minor_version is set to 90.
 *
 * Each failure has an fprintf(stderr, ...) diagnostic naming devname.
 *
 * NOTE(review): read() is asked for sizeof(*super) bytes but its result
 * is compared with MD_SB_BYTES; presumably the two are equal - confirm.
 * NOTE(review): the "too small" message uses %ld; its argument is not
 * visible here - confirm the type matches (dsize is unsigned long long).
 * NOTE(review): the malloc() result is used with no NULL check visible,
 * and freeing "super" on the error paths, the store into *sbp, and any
 * conditions guarding the diagnostics are not visible in this view.
 */
481 static int load_super0(struct supertype
*st
, int fd
, void **sbp
, char *devname
)
483 /* try to read in the superblock
486 * 1 on cannot get superblock
487 * 2 on superblock meaningless
490 unsigned long long dsize
;
491 unsigned long long offset
;
495 if (ioctl(fd
, BLKGETSIZE64
, &dsize
) != 0)
498 if (ioctl(fd
, BLKGETSIZE
, &size
)) {
500 fprintf(stderr
, Name
": cannot find device size for %s: %s\n",
501 devname
, strerror(errno
));
507 if (dsize
< MD_RESERVED_SECTORS
*2) {
509 fprintf(stderr
, Name
": %s is too small for md: size is %ld sectors.\n",
514 offset
= MD_NEW_SIZE_SECTORS(dsize
>>9);
518 ioctl(fd
, BLKFLSBUF
, 0); /* make sure we read current data */
520 if (lseek64(fd
, offset
, 0)< 0LL) {
522 fprintf(stderr
, Name
": Cannot seek to superblock on %s: %s\n",
523 devname
, strerror(errno
));
527 super
= malloc(MD_SB_BYTES
);
529 if (read(fd
, super
, sizeof(*super
)) != MD_SB_BYTES
) {
531 fprintf(stderr
, Name
": Cannot read superblock on %s\n",
537 if (super
->md_magic
!= MD_SB_MAGIC
) {
539 fprintf(stderr
, Name
": No super block found on %s (Expected magic %08x, got %08x)\n",
540 devname
, MD_SB_MAGIC
, super
->md_magic
);
545 if (super
->major_version
!= 0) {
547 fprintf(stderr
, Name
": Cannot interpret superblock on %s - version is %d\n",
548 devname
, super
->major_version
);
553 if (st
->ss
== NULL
) {
555 st
->minor_version
= 90;
/*
 * match_metadata_desc0 - recognise a metadata description string that
 * selects the 0.90 superblock format.
 *
 * A struct supertype is allocated with malloc(), its minor_version is
 * set to 90, and arg is compared with "0", "0.90" and "default".
 *
 * NOTE(review): the NULL check on malloc(), the remaining supertype
 * fields, and what is returned (or freed) when arg does not match are
 * not visible in this view - confirm the no-match path does not leak.
 */
561 static struct supertype
*match_metadata_desc0(char *arg
)
563 struct supertype
*st
= malloc(sizeof(*st
));
567 st
->minor_version
= 90;
568 if (strcmp(arg
, "0") == 0 ||
569 strcmp(arg
, "0.90") == 0 ||
570 strcmp(arg
, "default") == 0
/*
 * avail_size0 - space left for data on a device of devsize once the
 * 0.90 superblock area is accounted for.
 *
 * Devices smaller than MD_RESERVED_SECTORS*2 take a separate path;
 * otherwise the result is MD_NEW_SIZE_SECTORS(devsize).
 *
 * NOTE(review): the value returned for too-small devices is not visible
 * here; devsize is presumably in sectors, matching the macro name -
 * confirm against callers.
 */
578 static __u64
avail_size0(__u64 devsize
)
580 if (devsize
< MD_RESERVED_SECTORS
*2)
582 return MD_NEW_SIZE_SECTORS(devsize
);
/*
 * super0 - the struct superswitch instance for the 0.90 superblock
 * format.  Each member is bound to the corresponding *0 function
 * defined in this file.
 */
585 struct superswitch super0
= {
586 .examine_super
= examine_super0
,
587 .brief_examine_super
= brief_examine_super0
,
588 .detail_super
= detail_super0
,
589 .brief_detail_super
= brief_detail_super0
,
590 .uuid_from_super
= uuid_from_super0
,
591 .getinfo_super
= getinfo_super0
,
592 .update_super
= update_super0
,
593 .event_super
= event_super0
,
594 .init_super
= init_super0
,
595 .add_to_super
= add_to_super0
,
596 .store_super
= store_super0
,
597 .write_init_super
= write_init_super0
,
598 .compare_super
= compare_super0
,
599 .load_super
= load_super0
,
600 .match_metadata_desc
= match_metadata_desc0
,
601 .avail_size
= avail_size0
,