]> git.ipfire.org Git - thirdparty/mdadm.git/blob - super1.c
Grow: Fix linear-growth when devices are not all the same size.
[thirdparty/mdadm.git] / super1.c
1 /*
2 * mdadm - manage Linux "md" devices aka RAID arrays.
3 *
4 * Copyright (C) 2001-2006 Neil Brown <neilb@suse.de>
5 *
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
11 *
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 *
21 * Author: Neil Brown
22 * Email: <neilb@cse.unsw.edu.au>
23 * Paper: Neil Brown
24 * School of Computer Science and Engineering
25 * The University of New South Wales
26 * Sydney, 2052
27 * Australia
28 */
29
30 #include "mdadm.h"
/*
 * The version-1 superblock :
 * All numeric fields are little-endian.
 *
 * total size: 256 bytes plus 2 per device.
 * 1K allows 384 devices.
 *
 * The structure is laid out in three fixed sections (128 + 64 + 64 bytes)
 * followed by a variable-length table of 16-bit device roles.
 * calc_sb_1_csum() checks at run time that data_offset sits at byte 128,
 * utime at byte 192 and that the fixed part is 256 bytes long.
 */
struct mdp_superblock_1 {
	/* constant array information - 128 bytes */
	__u32	magic;		/* MD_SB_MAGIC: 0xa92b4efc - little endian */
	__u32	major_version;	/* 1 */
	__u32	feature_map;	/* bit-set of the MD_FEATURE_* flags; 0 if none apply */
	__u32	pad0;		/* always set to 0 when writing */

	__u8	set_uuid[16];	/* user-space generated. */
	char	set_name[32];	/* set and interpreted by user-space;
				 * fixed width, printed with "%.32s" in this file
				 */

	__u64	ctime;		/* low 40 bits are seconds, top 24 are microseconds or 0 */
	__u32	level;		/* -4 (multipath), -1 (linear), 0,1,4,5
				 * (code in this file also handles 6 and 10)
				 */
	__u32	layout;		/* interpreted for raid5 and raid10 in this file */
	__u64	size;		/* used size of component devices, in 512byte sectors */

	__u32	chunksize;	/* in 512byte sectors */
	__u32	raid_disks;
	__u32	bitmap_offset;	/* sectors after start of superblock that bitmap starts
				 * NOTE: signed, so bitmap can be before superblock
				 * only meaningful if feature_map[0] is set.
				 */

	/* These are only valid with feature bit '4' */
	__u32	new_level;	/* new level we are reshaping to */
	__u64	reshape_position;	/* next address in array-space for reshape */
	__u32	delta_disks;	/* change in number of raid_disks */
	__u32	new_layout;	/* new layout */
	__u32	new_chunk;	/* new chunk size.
				 * NOTE(review): originally documented as bytes, but
				 * code in this file halves it to print K and shifts
				 * it left by 9, i.e. treats it as 512-byte sectors
				 * - confirm.
				 */
	__u8	pad1[128-124];	/* set to 0 when written */

	/* constant this-device information - 64 bytes */
	__u64	data_offset;	/* sector start of data, often 0 */
	__u64	data_size;	/* sectors in this device that can be used for data */
	__u64	super_offset;	/* sector start of this superblock */
	__u64	recovery_offset;/* sectors before this offset (from data_offset) have been recovered */
	__u32	dev_number;	/* permanent identifier of this device - not role in raid */
	__u32	cnt_corrected_read; /* number of read errors that were corrected by re-writing */
	__u8	device_uuid[16]; /* user-space settable, ignored by kernel */
	__u8	devflags;	/* per-device flags.  Only one defined...*/
#define	WriteMostly1	1	/* mask for writemostly flag in above */
	__u8	pad2[64-57];	/* set to 0 when writing */

	/* array state information - 64 bytes */
	__u64	utime;		/* 40 bits seconds, 24 bits microseconds */
	__u64	events;		/* incremented when superblock updated */
	__u64	resync_offset;	/* data before this offset (from data_offset) known to be in sync */
	__u32	sb_csum;	/* checksum up to devs[max_dev] */
	__u32	max_dev;	/* size of devs[] array to consider */
	__u8	pad3[64-32];	/* set to 0 when writing */

	/* device state information. Indexed by dev_number.
	 * 2 bytes per device
	 * Note there are no per-device state flags. State information is rolled
	 * into the 'roles' value.  If a device is spare or faulty, then it doesn't
	 * have a meaningful role.
	 */
	__u16	dev_roles[0];	/* role in array, or 0xffff for a spare, or 0xfffe for faulty */
};
96
/*
 * Extra per-device information kept in memory alongside the superblock.
 * update_super1() locates it in the superblock buffer at offset
 * 1024 + sizeof(struct bitmap_super_s).
 */
struct misc_dev_info {
	__u64 device_size;	/* update_super1() subtracts data_offset (sectors)
				 * from this, so presumably also in 512-byte
				 * sectors - confirm where it is filled in
				 */
};
100
/* Bits that may be set in mdp_superblock_1.feature_map */
#define	MD_FEATURE_BITMAP_OFFSET	1
/* recovery_offset is present and must be honoured */
#define	MD_FEATURE_RECOVERY_OFFSET	2
#define	MD_FEATURE_RESHAPE_ACTIVE	4

/* Union of every feature bit defined above */
#define	MD_FEATURE_ALL	(MD_FEATURE_BITMAP_OFFSET | \
			 MD_FEATURE_RECOVERY_OFFSET | \
			 MD_FEATURE_RESHAPE_ACTIVE)

/* Fallback for environments whose headers do not provide offsetof() */
#ifndef offsetof
#define offsetof(type, member) ((size_t)&(((type*)0)->member))
#endif
113 static unsigned int calc_sb_1_csum(struct mdp_superblock_1 * sb)
114 {
115 unsigned int disk_csum, csum;
116 unsigned long long newcsum;
117 int size = sizeof(*sb) + __le32_to_cpu(sb->max_dev)*2;
118 unsigned int *isuper = (unsigned int*)sb;
119 int i;
120
121 /* make sure I can count... */
122 if (offsetof(struct mdp_superblock_1,data_offset) != 128 ||
123 offsetof(struct mdp_superblock_1, utime) != 192 ||
124 sizeof(struct mdp_superblock_1) != 256) {
125 fprintf(stderr, "WARNING - superblock isn't sized correctly\n");
126 }
127
128 disk_csum = sb->sb_csum;
129 sb->sb_csum = 0;
130 newcsum = 0;
131 for (i=0; size>=4; size -= 4 ) {
132 newcsum += __le32_to_cpu(*isuper);
133 isuper++;
134 }
135
136 if (size == 2)
137 newcsum += __le16_to_cpu(*(unsigned short*) isuper);
138
139 csum = (newcsum & 0xffffffff) + (newcsum >> 32);
140 sb->sb_csum = disk_csum;
141 return __cpu_to_le32(csum);
142 }
143
144 #ifndef MDASSEMBLE
145 static void examine_super1(struct supertype *st, char *homehost)
146 {
147 struct mdp_superblock_1 *sb = st->sb;
148 time_t atime;
149 int d;
150 int faulty;
151 int i;
152 char *c;
153 int l = homehost ? strlen(homehost) : 0;
154 int layout;
155 unsigned long long sb_offset;
156
157 printf(" Magic : %08x\n", __le32_to_cpu(sb->magic));
158 printf(" Version : 1");
159 sb_offset = __le64_to_cpu(sb->super_offset);
160 if (sb_offset <= 4)
161 printf(".1\n");
162 else if (sb_offset <= 8)
163 printf(".2\n");
164 else
165 printf(".0\n");
166 printf(" Feature Map : 0x%x\n", __le32_to_cpu(sb->feature_map));
167 printf(" Array UUID : ");
168 for (i=0; i<16; i++) {
169 if ((i&3)==0 && i != 0) printf(":");
170 printf("%02x", sb->set_uuid[i]);
171 }
172 printf("\n");
173 printf(" Name : %.32s", sb->set_name);
174 if (l > 0 && l < 32 &&
175 sb->set_name[l] == ':' &&
176 strncmp(sb->set_name, homehost, l) == 0)
177 printf(" (local to host %s)", homehost);
178 printf("\n");
179 atime = __le64_to_cpu(sb->ctime) & 0xFFFFFFFFFFULL;
180 printf(" Creation Time : %.24s\n", ctime(&atime));
181 c=map_num(pers, __le32_to_cpu(sb->level));
182 printf(" Raid Level : %s\n", c?c:"-unknown-");
183 printf(" Raid Devices : %d\n", __le32_to_cpu(sb->raid_disks));
184 printf("\n");
185 printf(" Avail Dev Size : %llu%s\n",
186 (unsigned long long)__le64_to_cpu(sb->data_size),
187 human_size(__le64_to_cpu(sb->data_size)<<9));
188 if (__le32_to_cpu(sb->level) >= 0) {
189 int ddsks=0;
190 switch(__le32_to_cpu(sb->level)) {
191 case 1: ddsks=1;break;
192 case 4:
193 case 5: ddsks = __le32_to_cpu(sb->raid_disks)-1; break;
194 case 6: ddsks = __le32_to_cpu(sb->raid_disks)-2; break;
195 case 10:
196 layout = __le32_to_cpu(sb->layout);
197 ddsks = __le32_to_cpu(sb->raid_disks)
198 / (layout&255) / ((layout>>8)&255);
199 }
200 if (ddsks)
201 printf(" Array Size : %llu%s\n",
202 ddsks*(unsigned long long)__le64_to_cpu(sb->size),
203 human_size(ddsks*__le64_to_cpu(sb->size)<<9));
204 if (sb->size != sb->data_size)
205 printf(" Used Dev Size : %llu%s\n",
206 (unsigned long long)__le64_to_cpu(sb->size),
207 human_size(__le64_to_cpu(sb->size)<<9));
208 }
209 if (sb->data_offset)
210 printf(" Data Offset : %llu sectors\n",
211 (unsigned long long)__le64_to_cpu(sb->data_offset));
212 printf(" Super Offset : %llu sectors\n",
213 (unsigned long long)__le64_to_cpu(sb->super_offset));
214 if (__le32_to_cpu(sb->feature_map) & MD_FEATURE_RECOVERY_OFFSET)
215 printf("Recovery Offset : %llu sectors\n", (unsigned long long)__le64_to_cpu(sb->recovery_offset));
216 printf(" State : %s\n", (__le64_to_cpu(sb->resync_offset)+1)? "active":"clean");
217 printf(" Device UUID : ");
218 for (i=0; i<16; i++) {
219 if ((i&3)==0 && i != 0) printf(":");
220 printf("%02x", sb->device_uuid[i]);
221 }
222 printf("\n");
223 printf("\n");
224 if (sb->feature_map & __cpu_to_le32(MD_FEATURE_BITMAP_OFFSET)) {
225 printf("Internal Bitmap : %ld sectors from superblock\n",
226 (long)(int32_t)__le32_to_cpu(sb->bitmap_offset));
227 }
228 if (sb->feature_map & __le32_to_cpu(MD_FEATURE_RESHAPE_ACTIVE)) {
229 printf(" Reshape pos'n : %llu%s\n", (unsigned long long)__le64_to_cpu(sb->reshape_position)/2,
230 human_size(__le64_to_cpu(sb->reshape_position)<<9));
231 if (__le32_to_cpu(sb->delta_disks)) {
232 printf(" Delta Devices : %d", __le32_to_cpu(sb->delta_disks));
233 if (__le32_to_cpu(sb->delta_disks))
234 printf(" (%d->%d)\n",
235 __le32_to_cpu(sb->raid_disks)-__le32_to_cpu(sb->delta_disks),
236 __le32_to_cpu(sb->raid_disks));
237 else
238 printf(" (%d->%d)\n", __le32_to_cpu(sb->raid_disks),
239 __le32_to_cpu(sb->raid_disks)+__le32_to_cpu(sb->delta_disks));
240 }
241 if (__le32_to_cpu(sb->new_level) != __le32_to_cpu(sb->level)) {
242 c = map_num(pers, __le32_to_cpu(sb->new_level));
243 printf(" New Level : %s\n", c?c:"-unknown-");
244 }
245 if (__le32_to_cpu(sb->new_layout) != __le32_to_cpu(sb->layout)) {
246 if (__le32_to_cpu(sb->level) == 5) {
247 c = map_num(r5layout, __le32_to_cpu(sb->new_layout));
248 printf(" New Layout : %s\n", c?c:"-unknown-");
249 }
250 if (__le32_to_cpu(sb->level) == 10) {
251 printf(" New Layout :");
252 print_r10_layout(__le32_to_cpu(sb->new_layout));
253 printf("\n");
254 }
255 }
256 if (__le32_to_cpu(sb->new_chunk) != __le32_to_cpu(sb->chunksize))
257 printf(" New Chunksize : %dK\n", __le32_to_cpu(sb->new_chunk)/2);
258 printf("\n");
259 }
260 if (sb->devflags) {
261 printf(" Flags :");
262 if (sb->devflags & WriteMostly1)
263 printf(" write-mostly");
264 printf("\n");
265 }
266
267 atime = __le64_to_cpu(sb->utime) & 0xFFFFFFFFFFULL;
268 printf(" Update Time : %.24s\n", ctime(&atime));
269
270 if (calc_sb_1_csum(sb) == sb->sb_csum)
271 printf(" Checksum : %x - correct\n", __le32_to_cpu(sb->sb_csum));
272 else
273 printf(" Checksum : %x - expected %x\n", __le32_to_cpu(sb->sb_csum),
274 __le32_to_cpu(calc_sb_1_csum(sb)));
275 printf(" Events : %llu\n", (unsigned long long)__le64_to_cpu(sb->events));
276 printf("\n");
277 if (__le32_to_cpu(sb->level) == 5) {
278 c = map_num(r5layout, __le32_to_cpu(sb->layout));
279 printf(" Layout : %s\n", c?c:"-unknown-");
280 }
281 if (__le32_to_cpu(sb->level) == 10) {
282 int lo = __le32_to_cpu(sb->layout);
283 printf(" Layout :");
284 print_r10_layout(lo);
285 printf("\n");
286 }
287 switch(__le32_to_cpu(sb->level)) {
288 case 0:
289 case 4:
290 case 5:
291 case 6:
292 case 10:
293 printf(" Chunk Size : %dK\n", __le32_to_cpu(sb->chunksize)/2);
294 break;
295 case -1:
296 printf(" Rounding : %dK\n", __le32_to_cpu(sb->chunksize)/2);
297 break;
298 default: break;
299 }
300 printf("\n");
301 printf(" Array Slot : %d (", __le32_to_cpu(sb->dev_number));
302 for (i= __le32_to_cpu(sb->max_dev); i> 0 ; i--)
303 if (__le16_to_cpu(sb->dev_roles[i-1]) != 0xffff)
304 break;
305 for (d=0; d < i; d++) {
306 int role = __le16_to_cpu(sb->dev_roles[d]);
307 if (d) printf(", ");
308 if (role == 0xffff) printf("empty");
309 else if(role == 0xfffe) printf("failed");
310 else printf("%d", role);
311 }
312 printf(")\n");
313 printf(" Array State : ");
314 for (d=0; d<__le32_to_cpu(sb->raid_disks); d++) {
315 int cnt = 0;
316 int me = 0;
317 int i;
318 for (i=0; i< __le32_to_cpu(sb->max_dev); i++) {
319 int role = __le16_to_cpu(sb->dev_roles[i]);
320 if (role == d) {
321 if (i == __le32_to_cpu(sb->dev_number))
322 me = 1;
323 cnt++;
324 }
325 }
326 if (cnt > 1) printf("?");
327 else if (cnt == 1 && me) printf("U");
328 else if (cnt == 1) printf("u");
329 else printf ("_");
330 }
331 faulty = 0;
332 for (i=0; i< __le32_to_cpu(sb->max_dev); i++) {
333 int role = __le16_to_cpu(sb->dev_roles[i]);
334 if (role == 0xFFFE)
335 faulty++;
336 }
337 if (faulty) printf(" %d failed", faulty);
338 printf("\n");
339 }
340
341
342 static void brief_examine_super1(struct supertype *st)
343 {
344 struct mdp_superblock_1 *sb = st->sb;
345 int i;
346 unsigned long long sb_offset;
347 char *nm;
348 char *c=map_num(pers, __le32_to_cpu(sb->level));
349
350 nm = strchr(sb->set_name, ':');
351 if (nm)
352 nm++;
353 else if (sb->set_name[0])
354 nm = sb->set_name;
355 else
356 nm = "??";
357
358 printf("ARRAY /dev/md/%s level=%s ", nm, c?c:"-unknown-");
359 sb_offset = __le64_to_cpu(sb->super_offset);
360 if (sb_offset <= 4)
361 printf("metadata=1.1 ");
362 else if (sb_offset <= 8)
363 printf("metadata=1.2 ");
364 else
365 printf("metadata=1.0 ");
366 printf("num-devices=%d UUID=", __le32_to_cpu(sb->raid_disks));
367 for (i=0; i<16; i++) {
368 if ((i&3)==0 && i != 0) printf(":");
369 printf("%02x", sb->set_uuid[i]);
370 }
371 if (sb->set_name[0])
372 printf(" name=%.32s", sb->set_name);
373 printf("\n");
374 }
375
376 static void export_examine_super1(struct supertype *st)
377 {
378 struct mdp_superblock_1 *sb = st->sb;
379 int i;
380 int len = 32;
381
382 printf("MD_LEVEL=%s\n", map_num(pers, __le32_to_cpu(sb->level)));
383 printf("MD_DEVICES=%d\n", __le32_to_cpu(sb->raid_disks));
384 for (i=0; i<32; i++)
385 if (sb->set_name[i] == '\n' ||
386 sb->set_name[i] == '\0') {
387 len = i;
388 break;
389 }
390 if (len)
391 printf("MD_NAME=%.*s\n", len, sb->set_name);
392 printf("MD_UUID=");
393 for (i=0; i<16; i++) {
394 if ((i&3)==0 && i != 0) printf(":");
395 printf("%02x", sb->set_uuid[i]);
396 }
397 printf("\n");
398 printf("MD_UPDATE_TIME=%llu\n",
399 __le64_to_cpu(sb->utime) & 0xFFFFFFFFFFULL);
400 printf("MD_DEV_UUID=");
401 for (i=0; i<16; i++) {
402 if ((i&3)==0 && i != 0) printf(":");
403 printf("%02x", sb->device_uuid[i]);
404 }
405 printf("\n");
406 printf("MD_EVENTS=%llu\n",
407 (unsigned long long)__le64_to_cpu(sb->events));
408 }
409
410 static void detail_super1(struct supertype *st, char *homehost)
411 {
412 struct mdp_superblock_1 *sb = st->sb;
413 int i;
414 int l = homehost ? strlen(homehost) : 0;
415
416 printf(" Name : %.32s", sb->set_name);
417 if (l > 0 && l < 32 &&
418 sb->set_name[l] == ':' &&
419 strncmp(sb->set_name, homehost, l) == 0)
420 printf(" (local to host %s)", homehost);
421 printf("\n UUID : ");
422 for (i=0; i<16; i++) {
423 if ((i&3)==0 && i != 0) printf(":");
424 printf("%02x", sb->set_uuid[i]);
425 }
426 printf("\n Events : %llu\n\n", (unsigned long long)__le64_to_cpu(sb->events));
427 }
428
429 static void brief_detail_super1(struct supertype *st)
430 {
431 struct mdp_superblock_1 *sb = st->sb;
432 int i;
433
434 if (sb->set_name[0])
435 printf(" name=%.32s", sb->set_name);
436 printf(" UUID=");
437 for (i=0; i<16; i++) {
438 if ((i&3)==0 && i != 0) printf(":");
439 printf("%02x", sb->set_uuid[i]);
440 }
441 }
442
443 static void export_detail_super1(struct supertype *st)
444 {
445 struct mdp_superblock_1 *sb = st->sb;
446 int i;
447 int len = 32;
448
449 for (i=0; i<32; i++)
450 if (sb->set_name[i] == '\n' ||
451 sb->set_name[i] == '\0') {
452 len = i;
453 break;
454 }
455 if (len)
456 printf("MD_NAME=%.*s\n", len, sb->set_name);
457 printf("MD_UUID=");
458 for (i=0; i<16; i++) {
459 if ((i&3)==0 && i != 0) printf(":");
460 printf("%02x", sb->set_uuid[i]);
461 }
462 printf("\n");
463 }
464
465 #endif
466
467 static int match_home1(struct supertype *st, char *homehost)
468 {
469 struct mdp_superblock_1 *sb = st->sb;
470 int l = homehost ? strlen(homehost) : 0;
471
472 return (l > 0 && l < 32 &&
473 sb->set_name[l] == ':' &&
474 strncmp(sb->set_name, homehost, l) == 0);
475 }
476
477 static void uuid_from_super1(struct supertype *st, int uuid[4])
478 {
479 struct mdp_superblock_1 *super = st->sb;
480 char *cuuid = (char*)uuid;
481 int i;
482 for (i=0; i<16; i++)
483 cuuid[i] = super->set_uuid[i];
484 }
485
486 static void getinfo_super1(struct supertype *st, struct mdinfo *info)
487 {
488 struct mdp_superblock_1 *sb = st->sb;
489 int working = 0;
490 int i;
491 int role;
492
493 info->array.major_version = 1;
494 info->array.minor_version = __le32_to_cpu(sb->feature_map);
495 info->array.patch_version = 0;
496 info->array.raid_disks = __le32_to_cpu(sb->raid_disks);
497 info->array.level = __le32_to_cpu(sb->level);
498 info->array.layout = __le32_to_cpu(sb->layout);
499 info->array.md_minor = -1;
500 info->array.ctime = __le64_to_cpu(sb->ctime);
501 info->array.utime = __le64_to_cpu(sb->utime);
502 info->array.chunk_size = __le32_to_cpu(sb->chunksize)*512;
503 info->array.state =
504 (__le64_to_cpu(sb->resync_offset) >= __le64_to_cpu(sb->size))
505 ? 1 : 0;
506
507 info->data_offset = __le64_to_cpu(sb->data_offset);
508 info->component_size = __le64_to_cpu(sb->size);
509
510 info->disk.major = 0;
511 info->disk.minor = 0;
512 info->disk.number = __le32_to_cpu(sb->dev_number);
513 if (__le32_to_cpu(sb->dev_number) >= __le32_to_cpu(sb->max_dev) ||
514 __le32_to_cpu(sb->max_dev) > 512)
515 role = 0xfffe;
516 else
517 role = __le16_to_cpu(sb->dev_roles[__le32_to_cpu(sb->dev_number)]);
518
519 info->disk.raid_disk = -1;
520 switch(role) {
521 case 0xFFFF:
522 info->disk.state = 2; /* spare: ACTIVE, not sync, not faulty */
523 break;
524 case 0xFFFE:
525 info->disk.state = 1; /* faulty */
526 break;
527 default:
528 info->disk.state = 6; /* active and in sync */
529 info->disk.raid_disk = role;
530 }
531 info->events = __le64_to_cpu(sb->events);
532
533 memcpy(info->uuid, sb->set_uuid, 16);
534
535 strncpy(info->name, sb->set_name, 32);
536 info->name[32] = 0;
537
538 if (sb->feature_map & __le32_to_cpu(MD_FEATURE_RESHAPE_ACTIVE)) {
539 info->reshape_active = 1;
540 info->reshape_progress = __le64_to_cpu(sb->reshape_position);
541 info->new_level = __le32_to_cpu(sb->new_level);
542 info->delta_disks = __le32_to_cpu(sb->delta_disks);
543 info->new_layout = __le32_to_cpu(sb->new_layout);
544 info->new_chunk = __le32_to_cpu(sb->new_chunk)<<9;
545 } else
546 info->reshape_active = 0;
547
548 for (i=0; i< __le32_to_cpu(sb->max_dev); i++) {
549 role = __le16_to_cpu(sb->dev_roles[i]);
550 if (/*role == 0xFFFF || */role < info->array.raid_disks)
551 working++;
552 }
553
554 info->array.working_disks = working;
555 }
556
557 static int update_super1(struct supertype *st, struct mdinfo *info,
558 char *update,
559 char *devname, int verbose,
560 int uuid_set, char *homehost)
561 {
562 /* NOTE: for 'assemble' and 'force' we need to return non-zero if any change was made.
563 * For others, the return value is ignored.
564 */
565 int rv = 0;
566 struct mdp_superblock_1 *sb = st->sb;
567
568 if (strcmp(update, "force-one")==0) {
569 /* Not enough devices for a working array,
570 * so bring this one up-to-date
571 */
572 if (sb->events != __cpu_to_le64(info->events))
573 rv = 1;
574 sb->events = __cpu_to_le64(info->events);
575 }
576 if (strcmp(update, "force-array")==0) {
577 /* Degraded array and 'force' requests to
578 * maybe need to mark it 'clean'.
579 */
580 switch(__le32_to_cpu(sb->level)) {
581 case 5: case 4: case 6:
582 /* need to force clean */
583 if (sb->resync_offset != ~0ULL)
584 rv = 1;
585 sb->resync_offset = ~0ULL;
586 }
587 }
588 if (strcmp(update, "assemble")==0) {
589 int d = info->disk.number;
590 int want;
591 if (info->disk.state == 6)
592 want = __cpu_to_le32(info->disk.raid_disk);
593 else
594 want = 0xFFFF;
595 if (sb->dev_roles[d] != want) {
596 sb->dev_roles[d] = want;
597 rv = 1;
598 }
599 }
600 if (strcmp(update, "linear-grow-new") == 0) {
601 int i;
602 int rfd, fd;
603 int max = __le32_to_cpu(sb->max_dev);
604
605 for (i=0 ; i < max ; i++)
606 if (__le16_to_cpu(sb->dev_roles[i]) >= 0xfffe)
607 break;
608 sb->dev_number = __cpu_to_le32(i);
609 info->disk.number = i;
610 if (max >= __le32_to_cpu(sb->max_dev))
611 sb->max_dev = __cpu_to_le32(max+1);
612
613 if ((rfd = open("/dev/urandom", O_RDONLY)) < 0 ||
614 read(rfd, sb->device_uuid, 16) != 16) {
615 *(__u32*)(sb->device_uuid) = random();
616 *(__u32*)(sb->device_uuid+4) = random();
617 *(__u32*)(sb->device_uuid+8) = random();
618 *(__u32*)(sb->device_uuid+12) = random();
619 }
620
621 sb->dev_roles[i] =
622 __cpu_to_le16(info->disk.raid_disk);
623
624 fd = open(devname, O_RDONLY);
625 if (fd >= 0) {
626 unsigned long long ds;
627 get_dev_size(fd, devname, &ds);
628 close(fd);
629 ds >>= 9;
630 if (__le64_to_cpu(sb->super_offset) <
631 __le64_to_cpu(sb->data_offset)) {
632 sb->data_size = __cpu_to_le64(
633 ds - __le64_to_cpu(sb->data_offset));
634 } else {
635 ds -= 8*2;
636 ds &= ~(unsigned long long)(4*2-1);
637 sb->super_offset = __cpu_to_le64(ds);
638 sb->data_size = __cpu_to_le64(
639 ds - __le64_to_cpu(sb->data_offset));
640 }
641 }
642 }
643 if (strcmp(update, "linear-grow-update") == 0) {
644 sb->raid_disks = __cpu_to_le32(info->array.raid_disks);
645 sb->dev_roles[info->disk.number] =
646 __cpu_to_le16(info->disk.raid_disk);
647 }
648 if (strcmp(update, "resync") == 0) {
649 /* make sure resync happens */
650 sb->resync_offset = 0ULL;
651 }
652 if (strcmp(update, "uuid") == 0) {
653 copy_uuid(sb->set_uuid, info->uuid, super1.swapuuid);
654
655 if (__le32_to_cpu(sb->feature_map)&MD_FEATURE_BITMAP_OFFSET) {
656 struct bitmap_super_s *bm;
657 bm = (struct bitmap_super_s*)(st->sb+1024);
658 memcpy(bm->uuid, sb->set_uuid, 16);
659 }
660 }
661 if (strcmp(update, "homehost") == 0 &&
662 homehost) {
663 char *c;
664 update = "name";
665 c = strchr(sb->set_name, ':');
666 if (c)
667 strncpy(info->name, c+1, 31 - (c-sb->set_name));
668 else
669 strncpy(info->name, sb->set_name, 32);
670 info->name[32] = 0;
671 }
672 if (strcmp(update, "name") == 0) {
673 if (info->name[0] == 0)
674 sprintf(info->name, "%d", info->array.md_minor);
675 memset(sb->set_name, 0, sizeof(sb->set_name));
676 if (homehost &&
677 strchr(info->name, ':') == NULL &&
678 strlen(homehost)+1+strlen(info->name) < 32) {
679 strcpy(sb->set_name, homehost);
680 strcat(sb->set_name, ":");
681 strcat(sb->set_name, info->name);
682 } else
683 strcpy(sb->set_name, info->name);
684 }
685 if (strcmp(update, "devicesize") == 0 &&
686 __le64_to_cpu(sb->super_offset) <
687 __le64_to_cpu(sb->data_offset)) {
688 /* set data_size to device size less data_offset */
689 struct misc_dev_info *misc = (struct misc_dev_info*)
690 (st->sb + 1024 + sizeof(struct bitmap_super_s));
691 printf("Size was %llu\n", (unsigned long long)
692 __le64_to_cpu(sb->data_size));
693 sb->data_size = __cpu_to_le64(
694 misc->device_size - __le64_to_cpu(sb->data_offset));
695 printf("Size is %llu\n", (unsigned long long)
696 __le64_to_cpu(sb->data_size));
697 }
698 if (strcmp(update, "_reshape_progress")==0)
699 sb->reshape_position = __cpu_to_le64(info->reshape_progress);
700
701 sb->sb_csum = calc_sb_1_csum(sb);
702 return rv;
703 }
704
705 static int init_super1(struct supertype *st, mdu_array_info_t *info,
706 unsigned long long size, char *name, char *homehost, int *uuid)
707 {
708 struct mdp_superblock_1 *sb = malloc(1024 + sizeof(bitmap_super_t) +
709 sizeof(struct misc_dev_info));
710 int spares;
711 int rfd;
712 char defname[10];
713 memset(sb, 0, 1024);
714
715 st->sb = sb;
716 if (info->major_version == -1) {
717 /* zeroing superblock */
718 return 0;
719 }
720
721 spares = info->working_disks - info->active_disks;
722 if (info->raid_disks + spares > 384) {
723 fprintf(stderr, Name ": too many devices requested: %d+%d > %d\n",
724 info->raid_disks , spares, 384);
725 return 0;
726 }
727
728 sb->magic = __cpu_to_le32(MD_SB_MAGIC);
729 sb->major_version = __cpu_to_le32(1);
730 sb->feature_map = 0;
731 sb->pad0 = 0;
732
733 if (uuid)
734 copy_uuid(sb->set_uuid, uuid, super1.swapuuid);
735 else {
736 if ((rfd = open("/dev/urandom", O_RDONLY)) < 0 ||
737 read(rfd, sb->set_uuid, 16) != 16) {
738 *(__u32*)(sb->set_uuid) = random();
739 *(__u32*)(sb->set_uuid+4) = random();
740 *(__u32*)(sb->set_uuid+8) = random();
741 *(__u32*)(sb->set_uuid+12) = random();
742 }
743 if (rfd >= 0) close(rfd);
744 }
745
746 if (name == NULL || *name == 0) {
747 sprintf(defname, "%d", info->md_minor);
748 name = defname;
749 }
750 memset(sb->set_name, 0, 32);
751 if (homehost &&
752 strchr(name, ':')== NULL &&
753 strlen(homehost)+1+strlen(name) < 32) {
754 strcpy(sb->set_name, homehost);
755 strcat(sb->set_name, ":");
756 strcat(sb->set_name, name);
757 } else
758 strcpy(sb->set_name, name);
759
760 sb->ctime = __cpu_to_le64((unsigned long long)time(0));
761 sb->level = __cpu_to_le32(info->level);
762 sb->layout = __cpu_to_le32(info->layout);
763 sb->size = __cpu_to_le64(size*2ULL);
764 sb->chunksize = __cpu_to_le32(info->chunk_size>>9);
765 sb->raid_disks = __cpu_to_le32(info->raid_disks);
766
767 sb->data_offset = __cpu_to_le64(0);
768 sb->data_size = __cpu_to_le64(0);
769 sb->super_offset = __cpu_to_le64(0);
770 sb->recovery_offset = __cpu_to_le64(0);
771
772 sb->utime = sb->ctime;
773 sb->events = __cpu_to_le64(1);
774 if (info->state & (1<<MD_SB_CLEAN))
775 sb->resync_offset = ~0ULL;
776 else
777 sb->resync_offset = 0;
778 sb->max_dev = __cpu_to_le32((1024- sizeof(struct mdp_superblock_1))/
779 sizeof(sb->dev_roles[0]));
780 memset(sb->pad3, 0, sizeof(sb->pad3));
781
782 memset(sb->dev_roles, 0xff, 1024 - sizeof(struct mdp_superblock_1));
783
784 return 1;
785 }
786
787 /* Add a device to the superblock being created */
788 static void add_to_super1(struct supertype *st, mdu_disk_info_t *dk)
789 {
790 struct mdp_superblock_1 *sb = st->sb;
791 __u16 *rp = sb->dev_roles + dk->number;
792 if ((dk->state & 6) == 6) /* active, sync */
793 *rp = __cpu_to_le16(dk->raid_disk);
794 else if ((dk->state & ~2) == 0) /* active or idle -> spare */
795 *rp = 0xffff;
796 else
797 *rp = 0xfffe;
798 }
799
800 static void locate_bitmap1(struct supertype *st, int fd);
801
802 static int store_super1(struct supertype *st, int fd)
803 {
804 struct mdp_superblock_1 *sb = st->sb;
805 unsigned long long sb_offset;
806 int sbsize;
807 unsigned long long dsize;
808
809 if (!get_dev_size(fd, NULL, &dsize))
810 return 1;
811
812 dsize >>= 9;
813
814 if (dsize < 24)
815 return 2;
816
817 /*
818 * Calculate the position of the superblock.
819 * It is always aligned to a 4K boundary and
820 * depending on minor_version, it can be:
821 * 0: At least 8K, but less than 12K, from end of device
822 * 1: At start of device
823 * 2: 4K from start of device.
824 */
825 switch(st->minor_version) {
826 case 0:
827 sb_offset = dsize;
828 sb_offset -= 8*2;
829 sb_offset &= ~(4*2-1);
830 break;
831 case 1:
832 sb_offset = 0;
833 break;
834 case 2:
835 sb_offset = 4*2;
836 break;
837 default:
838 return -EINVAL;
839 }
840
841
842
843 if (sb_offset != __le64_to_cpu(sb->super_offset) &&
844 0 != __le64_to_cpu(sb->super_offset)
845 ) {
846 fprintf(stderr, Name ": internal error - sb_offset is wrong\n");
847 abort();
848 }
849
850 if (lseek64(fd, sb_offset << 9, 0)< 0LL)
851 return 3;
852
853 sbsize = sizeof(*sb) + 2 * __le32_to_cpu(sb->max_dev);
854
855 if (write(fd, sb, sbsize) != sbsize)
856 return 4;
857
858 if (sb->feature_map & __cpu_to_le32(MD_FEATURE_BITMAP_OFFSET)) {
859 struct bitmap_super_s *bm = (struct bitmap_super_s*)
860 (((char*)sb)+1024);
861 if (__le32_to_cpu(bm->magic) == BITMAP_MAGIC) {
862 locate_bitmap1(st, fd);
863 if (write(fd, bm, sizeof(*bm)) != sizeof(*bm))
864 return 5;
865 }
866 }
867 fsync(fd);
868 return 0;
869 }
870
871 static int load_super1(struct supertype *st, int fd, char *devname);
872
/*
 * Decide how much space to reserve for a bitmap.
 *
 * devsize is given in 512-byte sectors and so is the result:
 *   - under 64K:  reserve nothing
 *   - more than 200Gig (beyond the first 64K): reserve 128K
 *   - more than 8Gig (beyond the first 4K):    reserve 64K
 *   - otherwise:  reserve 4K
 */
static unsigned long choose_bm_space(unsigned long devsize)
{
	unsigned long reserve;

	if (devsize < 64*2)
		reserve = 0;
	else if (devsize - 64*2 >= 200*1024*1024*2)
		reserve = 128*2;
	else if (devsize - 4*2 > 8*1024*1024*2)
		reserve = 64*2;
	else
		reserve = 4*2;

	return reserve;
}
885
886 static int write_init_super1(struct supertype *st,
887 mdu_disk_info_t *dinfo, char *devname)
888 {
889 struct mdp_superblock_1 *sb = st->sb;
890 struct supertype refst;
891 int fd = open(devname, O_RDWR | O_EXCL);
892 int rfd;
893 int rv;
894 int bm_space;
895
896 unsigned long long dsize, array_size;
897 long long sb_offset;
898
899
900 if (fd < 0) {
901 fprintf(stderr, Name ": Failed to open %s to write superblock\n",
902 devname);
903 return -1;
904 }
905
906 sb->dev_number = __cpu_to_le32(dinfo->number);
907 if (dinfo->state & (1<<MD_DISK_WRITEMOSTLY))
908 sb->devflags |= __cpu_to_le32(WriteMostly1);
909
910 if ((rfd = open("/dev/urandom", O_RDONLY)) < 0 ||
911 read(rfd, sb->device_uuid, 16) != 16) {
912 *(__u32*)(sb->device_uuid) = random();
913 *(__u32*)(sb->device_uuid+4) = random();
914 *(__u32*)(sb->device_uuid+8) = random();
915 *(__u32*)(sb->device_uuid+12) = random();
916 }
917 if (rfd >= 0) close(rfd);
918 sb->events = 0;
919
920 refst =*st;
921 refst.sb = NULL;
922 if (load_super1(&refst, fd, NULL)==0) {
923 struct mdp_superblock_1 *refsb = refst.sb;
924
925 memcpy(sb->device_uuid, refsb->device_uuid, 16);
926 if (memcmp(sb->set_uuid, refsb->set_uuid, 16)==0) {
927 /* same array, so preserve events and dev_number */
928 sb->events = refsb->events;
929 /* bugs in 2.6.17 and earlier mean the dev_number
930 * chosen in Manage must be preserved
931 */
932 if (get_linux_version() >= 2006018)
933 sb->dev_number = refsb->dev_number;
934 }
935 free(refsb);
936 }
937
938 if (!get_dev_size(fd, NULL, &dsize))
939 return 1;
940 dsize >>= 9;
941
942 if (dsize < 24) {
943 close(fd);
944 return 2;
945 }
946
947
948 /*
949 * Calculate the position of the superblock.
950 * It is always aligned to a 4K boundary and
951 * depending on minor_version, it can be:
952 * 0: At least 8K, but less than 12K, from end of device
953 * 1: At start of device
954 * 2: 4K from start of device.
955 * Depending on the array size, we might leave extra space
956 * for a bitmap.
957 */
958 array_size = __le64_to_cpu(sb->size);
959 /* work out how much space we left for a bitmap */
960 bm_space = choose_bm_space(array_size);
961
962 switch(st->minor_version) {
963 case 0:
964 sb_offset = dsize;
965 sb_offset -= 8*2;
966 sb_offset &= ~(4*2-1);
967 sb->super_offset = __cpu_to_le64(sb_offset);
968 sb->data_offset = __cpu_to_le64(0);
969 if (sb_offset - bm_space < array_size)
970 bm_space = sb_offset - array_size;
971 sb->data_size = __cpu_to_le64(sb_offset - bm_space);
972 break;
973 case 1:
974 sb->super_offset = __cpu_to_le64(0);
975 if (4*2 + bm_space + __le64_to_cpu(sb->size) > dsize)
976 bm_space = dsize - __le64_to_cpu(sb->size) - 4*2;
977 sb->data_offset = __cpu_to_le64(bm_space + 4*2);
978 sb->data_size = __cpu_to_le64(dsize - bm_space - 4*2);
979 break;
980 case 2:
981 sb_offset = 4*2;
982 sb->super_offset = __cpu_to_le64(4*2);
983 if (4*2 + 4*2 + bm_space + __le64_to_cpu(sb->size) > dsize)
984 bm_space = dsize - __le64_to_cpu(sb->size) - 4*2 - 4*2;
985 sb->data_offset = __cpu_to_le64(4*2 + 4*2 + bm_space);
986 sb->data_size = __cpu_to_le64(dsize - 4*2 - 4*2 - bm_space );
987 break;
988 default:
989 return -EINVAL;
990 }
991
992
993 sb->sb_csum = calc_sb_1_csum(sb);
994 rv = store_super1(st, fd);
995 if (rv)
996 fprintf(stderr, Name ": failed to write superblock to %s\n", devname);
997
998 if (rv == 0 && (__le32_to_cpu(sb->feature_map) & 1))
999 rv = st->ss->write_bitmap(st, fd);
1000 close(fd);
1001 return rv;
1002 }
1003
1004 static int compare_super1(struct supertype *st, struct supertype *tst)
1005 {
1006 /*
1007 * return:
1008 * 0 same, or first was empty, and second was copied
1009 * 1 second had wrong number
1010 * 2 wrong uuid
1011 * 3 wrong other info
1012 */
1013 struct mdp_superblock_1 *first = st->sb;
1014 struct mdp_superblock_1 *second = tst->sb;
1015
1016 if (second->magic != __cpu_to_le32(MD_SB_MAGIC))
1017 return 1;
1018 if (second->major_version != __cpu_to_le32(1))
1019 return 1;
1020
1021 if (!first) {
1022 first = malloc(1024+sizeof(bitmap_super_t) +
1023 sizeof(struct misc_dev_info));
1024 memcpy(first, second, 1024+sizeof(bitmap_super_t) +
1025 sizeof(struct misc_dev_info));
1026 st->sb = first;
1027 return 0;
1028 }
1029 if (memcmp(first->set_uuid, second->set_uuid, 16)!= 0)
1030 return 2;
1031
1032 if (first->ctime != second->ctime ||
1033 first->level != second->level ||
1034 first->layout != second->layout ||
1035 first->size != second->size ||
1036 first->chunksize != second->chunksize ||
1037 first->raid_disks != second->raid_disks)
1038 return 3;
1039 return 0;
1040 }
1041
1042 static void free_super1(struct supertype *st);
1043
1044 static int load_super1(struct supertype *st, int fd, char *devname)
1045 {
1046 unsigned long long dsize;
1047 unsigned long long sb_offset;
1048 struct mdp_superblock_1 *super;
1049 int uuid[4];
1050 struct bitmap_super_s *bsb;
1051 struct misc_dev_info *misc;
1052
1053 free_super1(st);
1054
1055 if (st->ss == NULL || st->minor_version == -1) {
1056 int bestvers = -1;
1057 struct supertype tst;
1058 __u64 bestctime = 0;
1059 /* guess... choose latest ctime */
1060 tst.ss = &super1;
1061 tst.sb = NULL;
1062 for (tst.minor_version = 0; tst.minor_version <= 2 ; tst.minor_version++) {
1063 switch(load_super1(&tst, fd, devname)) {
1064 case 0: super = tst.sb;
1065 if (bestvers == -1 ||
1066 bestctime < __le64_to_cpu(super->ctime)) {
1067 bestvers = tst.minor_version;
1068 bestctime = __le64_to_cpu(super->ctime);
1069 }
1070 free(super);
1071 tst.sb = NULL;
1072 break;
1073 case 1: return 1; /*bad device */
1074 case 2: break; /* bad, try next */
1075 }
1076 }
1077 if (bestvers != -1) {
1078 int rv;
1079 tst.minor_version = bestvers;
1080 tst.ss = &super1;
1081 tst.max_devs = 384;
1082 rv = load_super1(&tst, fd, devname);
1083 if (rv == 0)
1084 *st = tst;
1085 return rv;
1086 }
1087 return 2;
1088 }
1089 if (!get_dev_size(fd, devname, &dsize))
1090 return 1;
1091 dsize >>= 9;
1092
1093 if (dsize < 24) {
1094 if (devname)
1095 fprintf(stderr, Name ": %s is too small for md: size is %llu sectors.\n",
1096 devname, dsize);
1097 return 1;
1098 }
1099
1100 /*
1101 * Calculate the position of the superblock.
1102 * It is always aligned to a 4K boundary and
1103 * depending on minor_version, it can be:
1104 * 0: At least 8K, but less than 12K, from end of device
1105 * 1: At start of device
1106 * 2: 4K from start of device.
1107 */
1108 switch(st->minor_version) {
1109 case 0:
1110 sb_offset = dsize;
1111 sb_offset -= 8*2;
1112 sb_offset &= ~(4*2-1);
1113 break;
1114 case 1:
1115 sb_offset = 0;
1116 break;
1117 case 2:
1118 sb_offset = 4*2;
1119 break;
1120 default:
1121 return -EINVAL;
1122 }
1123
1124 ioctl(fd, BLKFLSBUF, 0); /* make sure we read current data */
1125
1126
1127 if (lseek64(fd, sb_offset << 9, 0)< 0LL) {
1128 if (devname)
1129 fprintf(stderr, Name ": Cannot seek to superblock on %s: %s\n",
1130 devname, strerror(errno));
1131 return 1;
1132 }
1133
1134 super = malloc(1024 + sizeof(bitmap_super_t) +
1135 sizeof(struct misc_dev_info));
1136
1137 if (read(fd, super, 1024) != 1024) {
1138 if (devname)
1139 fprintf(stderr, Name ": Cannot read superblock on %s\n",
1140 devname);
1141 free(super);
1142 return 1;
1143 }
1144
1145 if (__le32_to_cpu(super->magic) != MD_SB_MAGIC) {
1146 if (devname)
1147 fprintf(stderr, Name ": No super block found on %s (Expected magic %08x, got %08x)\n",
1148 devname, MD_SB_MAGIC, __le32_to_cpu(super->magic));
1149 free(super);
1150 return 2;
1151 }
1152
1153 if (__le32_to_cpu(super->major_version) != 1) {
1154 if (devname)
1155 fprintf(stderr, Name ": Cannot interpret superblock on %s - version is %d\n",
1156 devname, __le32_to_cpu(super->major_version));
1157 free(super);
1158 return 2;
1159 }
1160 if (__le64_to_cpu(super->super_offset) != sb_offset) {
1161 if (devname)
1162 fprintf(stderr, Name ": No superblock found on %s (super_offset is wrong)\n",
1163 devname);
1164 free(super);
1165 return 2;
1166 }
1167 st->sb = super;
1168
1169 bsb = (struct bitmap_super_s *)(((char*)super)+1024);
1170
1171 misc = (struct misc_dev_info*) (bsb+1);
1172 misc->device_size = dsize;
1173
1174 /* Now check on the bitmap superblock */
1175 if ((__le32_to_cpu(super->feature_map)&MD_FEATURE_BITMAP_OFFSET) == 0)
1176 return 0;
1177 /* Read the bitmap superblock and make sure it looks
1178 * valid. If it doesn't clear the bit. An --assemble --force
1179 * should get that written out.
1180 */
1181 locate_bitmap1(st, fd);
1182 if (read(fd, ((char*)super)+1024, sizeof(struct bitmap_super_s))
1183 != sizeof(struct bitmap_super_s))
1184 goto no_bitmap;
1185
1186 uuid_from_super1(st, uuid);
1187 if (__le32_to_cpu(bsb->magic) != BITMAP_MAGIC ||
1188 memcmp(bsb->uuid, uuid, 16) != 0)
1189 goto no_bitmap;
1190 return 0;
1191
1192 no_bitmap:
1193 super->feature_map = __cpu_to_le32(__le32_to_cpu(super->feature_map) & ~1);
1194 return 0;
1195 }
1196
1197
1198 static struct supertype *match_metadata_desc1(char *arg)
1199 {
1200 struct supertype *st = malloc(sizeof(*st));
1201 if (!st) return st;
1202
1203 st->ss = &super1;
1204 st->max_devs = 384;
1205 st->sb = NULL;
1206 if (strcmp(arg, "1.0") == 0) {
1207 st->minor_version = 0;
1208 return st;
1209 }
1210 if (strcmp(arg, "1.1") == 0) {
1211 st->minor_version = 1;
1212 return st;
1213 }
1214 if (strcmp(arg, "1.2") == 0) {
1215 st->minor_version = 2;
1216 return st;
1217 }
1218 if (strcmp(arg, "1") == 0 ||
1219 strcmp(arg, "default/large") == 0) {
1220 st->minor_version = -1;
1221 return st;
1222 }
1223
1224 free(st);
1225 return NULL;
1226 }
1227
1228 /* find available size on device with this devsize, using
1229 * superblock type st, and reserving 'reserve' sectors for
1230 * a possible bitmap
1231 */
1232 static __u64 avail_size1(struct supertype *st, __u64 devsize)
1233 {
1234 struct mdp_superblock_1 *super = st->sb;
1235 if (devsize < 24)
1236 return 0;
1237
1238 if (super == NULL)
1239 /* creating: allow suitable space for bitmap */
1240 devsize -= choose_bm_space(devsize);
1241 #ifndef MDASSEMBLE
1242 else if (__le32_to_cpu(super->feature_map)&MD_FEATURE_BITMAP_OFFSET) {
1243 /* hot-add. allow for actual size of bitmap */
1244 struct bitmap_super_s *bsb;
1245 bsb = (struct bitmap_super_s *)(((char*)super)+1024);
1246 devsize -= bitmap_sectors(bsb);
1247 }
1248 #endif
1249
1250 switch(st->minor_version) {
1251 case -1: /* no specified. Now time to set default */
1252 st->minor_version = 0;
1253 /* FALL THROUGH */
1254 case 0:
1255 /* at end */
1256 return ((devsize - 8*2 ) & ~(4*2-1));
1257 case 1:
1258 /* at start, 4K for superblock and possible bitmap */
1259 return devsize - 4*2;
1260 case 2:
1261 /* 4k from start, 4K for superblock and possible bitmap */
1262 return devsize - (4+4)*2;
1263 }
1264 return 0;
1265 }
1266
1267 static int
1268 add_internal_bitmap1(struct supertype *st,
1269 int *chunkp, int delay, int write_behind,
1270 unsigned long long size,
1271 int may_change, int major)
1272 {
1273 /*
1274 * If not may_change, then this is a 'Grow', and the bitmap
1275 * must fit after the superblock.
1276 * If may_change, then this is create, and we can put the bitmap
1277 * before the superblock if we like, or may move the start.
1278 * If !may_change, the bitmap MUST live at offset of 1K, until
1279 * we get a sysfs interface.
1280 *
1281 * size is in sectors, chunk is in bytes !!!
1282 */
1283
1284 unsigned long long bits;
1285 unsigned long long max_bits;
1286 unsigned long long min_chunk;
1287 long offset;
1288 int chunk = *chunkp;
1289 int room = 0;
1290 struct mdp_superblock_1 *sb = st->sb;
1291 bitmap_super_t *bms = (bitmap_super_t*)(((char*)sb) + 1024);
1292
1293 switch(st->minor_version) {
1294 case 0:
1295 /* either 3K after the superblock, or some amount of space
1296 * before.
1297 */
1298 if (may_change) {
1299 /* We are creating array, so we *know* how much room has
1300 * been left.
1301 */
1302 offset = 0;
1303 room = choose_bm_space(__le64_to_cpu(sb->size));
1304 if (room == 4*2) {
1305 /* make it 3K after the superblock */
1306 room = 3*2;
1307 offset = 2;
1308 }
1309 } else {
1310 room = __le64_to_cpu(sb->super_offset)
1311 - __le64_to_cpu(sb->data_offset)
1312 - __le64_to_cpu(sb->data_size);
1313 /* remove '1 ||' when we can set offset via sysfs */
1314 if (1 || (room < 3*2 &&
1315 __le32_to_cpu(sb->max_dev) <= 384)) {
1316 room = 3*2;
1317 offset = 1*2;
1318 } else {
1319 offset = 0; /* means movable offset */
1320 }
1321 }
1322 break;
1323 case 1:
1324 case 2: /* between superblock and data */
1325 if (may_change) {
1326 offset = 4*2;
1327 room = choose_bm_space(__le64_to_cpu(sb->size));
1328 } else {
1329 room = __le64_to_cpu(sb->data_offset)
1330 - __le64_to_cpu(sb->super_offset);
1331 if (1 || __le32_to_cpu(sb->max_dev) <= 384) {
1332 room -= 2;
1333 offset = 2;
1334 } else {
1335 room -= 4*2;
1336 offset = 4*2;
1337 }
1338 }
1339 break;
1340 default:
1341 return 0;
1342 }
1343
1344 if (chunk == UnSet && room > 128*2)
1345 /* Limit to 128K of bitmap when chunk size not requested */
1346 room = 128*2;
1347
1348 max_bits = (room * 512 - sizeof(bitmap_super_t)) * 8;
1349
1350 min_chunk = 4096; /* sub-page chunks don't work yet.. */
1351 bits = (size*512)/min_chunk +1;
1352 while (bits > max_bits) {
1353 min_chunk *= 2;
1354 bits = (bits+1)/2;
1355 }
1356 if (chunk == UnSet)
1357 chunk = min_chunk;
1358 else if (chunk < min_chunk)
1359 return 0; /* chunk size too small */
1360 if (chunk == 0) /* rounding problem */
1361 return 0;
1362
1363 if (offset == 0) {
1364 bits = (size*512) / chunk + 1;
1365 room = ((bits+7)/8 + sizeof(bitmap_super_t) +511)/512;
1366 offset = -room;
1367 }
1368
1369 sb->bitmap_offset = __cpu_to_le32(offset);
1370
1371 sb->feature_map = __cpu_to_le32(__le32_to_cpu(sb->feature_map) | 1);
1372 memset(bms, 0, sizeof(*bms));
1373 bms->magic = __cpu_to_le32(BITMAP_MAGIC);
1374 bms->version = __cpu_to_le32(major);
1375 uuid_from_super1(st, (int*)bms->uuid);
1376 bms->chunksize = __cpu_to_le32(chunk);
1377 bms->daemon_sleep = __cpu_to_le32(delay);
1378 bms->sync_size = __cpu_to_le64(size);
1379 bms->write_behind = __cpu_to_le32(write_behind);
1380
1381 *chunkp = chunk;
1382 return 1;
1383 }
1384
1385
1386 static void locate_bitmap1(struct supertype *st, int fd)
1387 {
1388 unsigned long long offset;
1389 struct mdp_superblock_1 *sb;
1390 int mustfree = 0;
1391
1392 if (!st->sb) {
1393 if (st->ss->load_super(st, fd, NULL))
1394 return; /* no error I hope... */
1395 mustfree = 1;
1396 }
1397 sb = st->sb;
1398
1399 offset = __le64_to_cpu(sb->super_offset);
1400 offset += (int32_t) __le32_to_cpu(sb->bitmap_offset);
1401 if (mustfree)
1402 free(sb);
1403 lseek64(fd, offset<<9, 0);
1404 }
1405
1406 static int write_bitmap1(struct supertype *st, int fd)
1407 {
1408 struct mdp_superblock_1 *sb = st->sb;
1409 bitmap_super_t *bms = (bitmap_super_t*)(((char*)sb)+1024);
1410 int rv = 0;
1411
1412 int towrite, n;
1413 char buf[4096];
1414
1415 locate_bitmap1(st, fd);
1416
1417 if (write(fd, ((char*)sb)+1024, sizeof(bitmap_super_t)) !=
1418 sizeof(bitmap_super_t))
1419 return -2;
1420 towrite = __le64_to_cpu(bms->sync_size) / (__le32_to_cpu(bms->chunksize)>>9);
1421 towrite = (towrite+7) >> 3; /* bits to bytes */
1422 memset(buf, 0xff, sizeof(buf));
1423 while (towrite > 0) {
1424 n = towrite;
1425 if (n > sizeof(buf))
1426 n = sizeof(buf);
1427 n = write(fd, buf, n);
1428 if (n > 0)
1429 towrite -= n;
1430 else
1431 break;
1432 }
1433 fsync(fd);
1434 if (towrite)
1435 rv = -2;
1436
1437 return rv;
1438 }
1439
1440 static void free_super1(struct supertype *st)
1441 {
1442 if (st->sb)
1443 free(st->sb);
1444 st->sb = NULL;
1445 }
1446
1447 struct superswitch super1 = {
1448 #ifndef MDASSEMBLE
1449 .examine_super = examine_super1,
1450 .brief_examine_super = brief_examine_super1,
1451 .export_examine_super = export_examine_super1,
1452 .detail_super = detail_super1,
1453 .brief_detail_super = brief_detail_super1,
1454 .export_detail_super = export_detail_super1,
1455 #endif
1456 .match_home = match_home1,
1457 .uuid_from_super = uuid_from_super1,
1458 .getinfo_super = getinfo_super1,
1459 .update_super = update_super1,
1460 .init_super = init_super1,
1461 .add_to_super = add_to_super1,
1462 .store_super = store_super1,
1463 .write_init_super = write_init_super1,
1464 .compare_super = compare_super1,
1465 .load_super = load_super1,
1466 .match_metadata_desc = match_metadata_desc1,
1467 .avail_size = avail_size1,
1468 .add_internal_bitmap = add_internal_bitmap1,
1469 .locate_bitmap = locate_bitmap1,
1470 .write_bitmap = write_bitmap1,
1471 .free_super = free_super1,
1472 .major = 1,
1473 #if __BYTE_ORDER == BIG_ENDIAN
1474 .swapuuid = 0,
1475 #else
1476 .swapuuid = 1,
1477 #endif
1478 };