]> git.ipfire.org Git - thirdparty/mdadm.git/blame - mdstat.c
mdadm: load default sysfs attributes after assemblation
[thirdparty/mdadm.git] / mdstat.c
CommitLineData
e0d19036
NB
1/*
2 * mdstat - parse /proc/mdstat file. Part of:
3 * mdadm - manage Linux "md" devices aka RAID arrays.
4 *
e736b623 5 * Copyright (C) 2002-2009 Neil Brown <neilb@suse.de>
e0d19036
NB
6 *
7 *
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; either version 2 of the License, or
11 * (at your option) any later version.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to the Free Software
20 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 *
22 * Author: Neil Brown
e736b623 23 * Email: <neilb@suse.de>
e0d19036
NB
24 */
25
26/*
27 * The /proc/mdstat file comes in at least 3 flavours:
28 * In an unpatched 2.2 kernel (md 0.36.6):
29 * Personalities : [n raidx] ...
30 * read_ahead {not set|%d sectors}
31 * md0 : {in}active{ raidX /dev/hda... %d blocks{ maxfault=%d}}
32 * md1 : .....
33 *
34 * Normally only 4 md lines, but all are listed.
35 *
36 * In a patched 2.2 kernel (md 0.90.0)
37 * Personalities : [raidx] ...
38 * read_ahead {not set|%d sectors}
39 * mdN : {in}active {(readonly)} raidX dev[%d]{(F)} ... %d blocks STATUS RESYNC
40 * ... Only initialised arrays listed
8f21823f 41 * unused devices: {dev dev ... | <none>}
e0d19036
NB
42 *
43 * STATUS is personality dependent:
44 * linear: %dk rounding
45 * raid0: %dk chunks
46 * raid1: [%d/%d] [U_U] ( raid/working. operational or not)
47 * raid5: level 4/5, %dk chunk, algorithm %d [%d/%d] [U_U]
48 *
49 * RESYNC is empty or:
50 * {resync|recovery}=%u%% finish=%u.%umin
51 * or
52 * resync=DELAYED
53 *
54 * In a 2.4 kernel (md 0.90.0/2.4)
55 * Personalities : [raidX] ...
56 * read_ahead {not set|%d sectors}
57 * mdN : {in}active {(read-only)} raidX dev[%d]{(F)} ...
58 * %d blocks STATUS
59 * RESYNC
8f21823f 60 * unused devices: {dev dev .. | <none>}
e0d19036
NB
61 *
62 * STATUS matches 0.90.0/2.2
63 * RESYNC includes [===>....],
64 * adds a space after {resync|recovery} and before and after '='
65 * adds a decimal to the recovery percent.
66 * adds (%d/%d) resync amount and max_blocks, before finish.
67 * adds speed=%dK/sec after finish
68 *
69 *
70 *
71 * Out of this we want to extract:
72 * list of devices, active or not
73 * pattern of failed drives (so need number of drives)
74 * percent resync complete
75 *
76 * As continuation is indicated by leading space, we use
77 * conf_line from config.c to read logical lines
78 *
79 */
80
81#include "mdadm.h"
82#include "dlink.h"
dd0781e5 83#include <sys/select.h>
549e9569 84#include <ctype.h>
e0d19036 85
3b57c466
N
86static void free_member_devnames(struct dev_member *m)
87{
88 while(m) {
89 struct dev_member *t = m;
90
91 m = m->next;
92 free(t->name);
93 free(t);
94 }
95}
96
0ad6835c 97static int add_member_devname(struct dev_member **m, char *name)
3b57c466
N
98{
99 struct dev_member *new;
100 char *t;
101
102 if ((t = strchr(name, '[')) == NULL)
103 /* not a device */
0ad6835c 104 return 0;
3b57c466 105
503975b9 106 new = xmalloc(sizeof(*new));
3b57c466
N
107 new->name = strndup(name, t - name);
108 new->next = *m;
109 *m = new;
0ad6835c 110 return 1;
3b57c466
N
111}
112
e0d19036
NB
113void free_mdstat(struct mdstat_ent *ms)
114{
115 while (ms) {
116 struct mdstat_ent *t;
3b57c466
N
117 free(ms->level);
118 free(ms->pattern);
119 free(ms->metadata_version);
120 free_member_devnames(ms->members);
e0d19036
NB
121 t = ms;
122 ms = ms->next;
123 free(t);
124 }
125}
126
dd0781e5 127static int mdstat_fd = -1;
22a88995 128struct mdstat_ent *mdstat_read(int hold, int start)
e0d19036
NB
129{
130 FILE *f;
22a88995 131 struct mdstat_ent *all, *rv, **end, **insert_here;
e0d19036 132 char *line;
d94a4f62 133 int fd;
e0d19036 134
dd0781e5 135 if (hold && mdstat_fd != -1) {
52209d6e
TM
136 off_t offset = lseek(mdstat_fd, 0L, 0);
137 if (offset == (off_t)-1) {
138 mdstat_close();
139 return NULL;
140 }
d94a4f62
JS
141 fd = dup(mdstat_fd);
142 if (fd >= 0)
143 f = fdopen(fd, "r");
144 else
145 return NULL;
dd0781e5
NB
146 } else
147 f = fopen("/proc/mdstat", "r");
e0d19036
NB
148 if (f == NULL)
149 return NULL;
e4dc5106
DL
150 else
151 fcntl(fileno(f), F_SETFD, FD_CLOEXEC);
e0d19036
NB
152
153 all = NULL;
154 end = &all;
155 for (; (line = conf_line(f)) ; free_line(line)) {
156 struct mdstat_ent *ent;
157 char *w;
4dd2df09 158 char devnm[32];
22a88995 159 int in_devs = 0;
e0d19036 160
a9db8995 161 if (strcmp(line, "Personalities") == 0)
e0d19036 162 continue;
a9db8995 163 if (strcmp(line, "read_ahead") == 0)
e0d19036 164 continue;
a9db8995 165 if (strcmp(line, "unused") == 0)
e0d19036 166 continue;
22a88995 167 insert_here = NULL;
e0d19036 168 /* Better be an md line.. */
d7be7d87
JS
169 if (strncmp(line, "md", 2)!= 0 || strlen(line) >= 32 ||
170 (line[2] != '_' && !isdigit(line[2])))
98c6faba 171 continue;
4dd2df09 172 strcpy(devnm, line);
e0d19036 173
503975b9 174 ent = xmalloc(sizeof(*ent));
9581efb1 175 ent->level = ent->pattern= NULL;
e0d19036 176 ent->next = NULL;
9dad51d4 177 ent->percent = RESYNC_NONE;
e0d19036 178 ent->active = -1;
e5329c37 179 ent->resync = 0;
549e9569
NB
180 ent->metadata_version = NULL;
181 ent->raid_disks = 0;
549e9569 182 ent->devcnt = 0;
3b57c466 183 ent->members = NULL;
e0d19036 184
4dd2df09 185 strcpy(ent->devnm, devnm);
aba69144 186
e0d19036
NB
187 for (w=dl_next(line); w!= line ; w=dl_next(w)) {
188 int l = strlen(w);
189 char *eq;
a9db8995 190 if (strcmp(w, "active") == 0)
e0d19036 191 ent->active = 1;
a9db8995 192 else if (strcmp(w, "inactive") == 0) {
e0d19036 193 ent->active = 0;
b6d7a7fb
JD
194 in_devs = 1;
195 } else if (ent->active > 0 &&
e0d19036 196 ent->level == NULL &&
22a88995 197 w[0] != '(' /*readonly*/) {
503975b9 198 ent->level = xstrdup(w);
22a88995 199 in_devs = 1;
a9db8995 200 } else if (in_devs && strcmp(w, "blocks") == 0)
22a88995 201 in_devs = 0;
549e9569 202 else if (in_devs) {
4dd2df09 203 char *ep = strchr(w, '[');
0ad6835c
ML
204 ent->devcnt +=
205 add_member_devname(&ent->members, w);
a9db8995 206 if (ep && strncmp(w, "md", 2) == 0) {
549e9569
NB
207 /* This has an md device as a component.
208 * If that device is already in the
209 * list, make sure we insert before
210 * there.
211 */
212 struct mdstat_ent **ih;
549e9569
NB
213 ih = &all;
214 while (ih != insert_here && *ih &&
d7be7d87
JS
215 ((int)strlen((*ih)->devnm) !=
216 ep-w ||
217 strncmp((*ih)->devnm, w,
218 ep-w) != 0))
549e9569
NB
219 ih = & (*ih)->next;
220 insert_here = ih;
221 }
222 } else if (strcmp(w, "super") == 0 &&
223 dl_next(w) != line) {
224 w = dl_next(w);
503975b9 225 ent->metadata_version = xstrdup(w);
549e9569
NB
226 } else if (w[0] == '[' && isdigit(w[1])) {
227 ent->raid_disks = atoi(w+1);
22a88995 228 } else if (!ent->pattern &&
a9db8995
ZL
229 w[0] == '[' &&
230 (w[1] == 'U' || w[1] == '_')) {
503975b9 231 ent->pattern = xstrdup(w+1);
a9db8995 232 if (ent->pattern[l-2] == ']')
e0d19036 233 ent->pattern[l-2] = '\0';
9dad51d4 234 } else if (ent->percent == RESYNC_NONE &&
a9db8995 235 strncmp(w, "re", 2) == 0 &&
e0d19036 236 w[l-1] == '%' &&
a9db8995 237 (eq = strchr(w, '=')) != NULL ) {
e0d19036 238 ent->percent = atoi(eq+1);
a9db8995 239 if (strncmp(w,"resync", 6) == 0)
e5329c37 240 ent->resync = 1;
a9db8995 241 else if (strncmp(w, "reshape", 7) == 0)
f94c116f
N
242 ent->resync = 2;
243 else
244 ent->resync = 0;
9dad51d4 245 } else if (ent->percent == RESYNC_NONE &&
f94c116f 246 (w[0] == 'r' || w[0] == 'c')) {
35c34037 247 if (strncmp(w, "resync", 6) == 0)
f94c116f 248 ent->resync = 1;
a9db8995 249 if (strncmp(w, "reshape", 7) == 0)
f94c116f 250 ent->resync = 2;
a9db8995 251 if (strncmp(w, "recovery", 8) == 0)
aa8d7dc7 252 ent->resync = 0;
a9db8995 253 if (strncmp(w, "check", 5) == 0)
f94c116f
N
254 ent->resync = 3;
255
2d3603ba 256 if (l > 8 && strcmp(w+l-8, "=DELAYED") == 0)
9dad51d4 257 ent->percent = RESYNC_DELAYED;
2d3603ba 258 if (l > 8 && strcmp(w+l-8, "=PENDING") == 0)
9dad51d4
N
259 ent->percent = RESYNC_PENDING;
260 } else if (ent->percent == RESYNC_NONE &&
aba69144 261 w[0] >= '0' &&
e0d19036
NB
262 w[0] <= '9' &&
263 w[l-1] == '%') {
264 ent->percent = atoi(w);
265 }
266 }
22a88995
NB
267 if (insert_here && (*insert_here)) {
268 ent->next = *insert_here;
269 *insert_here = ent;
270 } else {
271 *end = ent;
272 end = &ent->next;
273 }
e0d19036 274 }
e4dc5106 275 if (hold && mdstat_fd == -1) {
dd0781e5 276 mdstat_fd = dup(fileno(f));
e4dc5106
DL
277 fcntl(mdstat_fd, F_SETFD, FD_CLOEXEC);
278 }
e0d19036 279 fclose(f);
22a88995
NB
280
281 /* If we might want to start array,
282 * reverse the order, so that components comes before composites
283 */
284 if (start) {
285 rv = NULL;
286 while (all) {
287 struct mdstat_ent *e = all;
288 all = all->next;
289 e->next = rv;
290 rv = e;
291 }
a9db8995
ZL
292 } else
293 rv = all;
22a88995 294 return rv;
e0d19036 295}
dd0781e5 296
a7a0d8a1
N
297void mdstat_close(void)
298{
299 if (mdstat_fd >= 0)
300 close(mdstat_fd);
301 mdstat_fd = -1;
302}
303
dd0781e5
NB
304void mdstat_wait(int seconds)
305{
306 fd_set fds;
307 struct timeval tm;
0b5ec75e 308 int maxfd = 0;
dd0781e5 309 FD_ZERO(&fds);
0b5ec75e 310 if (mdstat_fd >= 0) {
dd0781e5 311 FD_SET(mdstat_fd, &fds);
0b5ec75e
N
312 maxfd = mdstat_fd;
313 }
dd0781e5
NB
314 tm.tv_sec = seconds;
315 tm.tv_usec = 0;
0b5ec75e 316 select(maxfd + 1, NULL, NULL, &fds, &tm);
dd0781e5 317}
8382f19b 318
58a4ba2a 319void mdstat_wait_fd(int fd, const sigset_t *sigmask)
549e9569
NB
320{
321 fd_set fds, rfds;
5d4d1b26 322 int maxfd = 0;
549e9569
NB
323
324 FD_ZERO(&fds);
325 FD_ZERO(&rfds);
326 if (mdstat_fd >= 0)
327 FD_SET(mdstat_fd, &fds);
5d4d1b26 328
58a4ba2a 329 if (fd >= 0) {
28005287
N
330 struct stat stb;
331 fstat(fd, &stb);
332 if ((stb.st_mode & S_IFMT) == S_IFREG)
333 /* Must be a /proc or /sys fd, so expect
334 * POLLPRI
335 * i.e. an 'exceptional' event.
336 */
337 FD_SET(fd, &fds);
338 else
339 FD_SET(fd, &rfds);
5d4d1b26
N
340
341 if (fd > maxfd)
342 maxfd = fd;
343
28005287 344 }
0b5ec75e
N
345 if (mdstat_fd > maxfd)
346 maxfd = mdstat_fd;
549e9569 347
0b5ec75e 348 pselect(maxfd + 1, &rfds, NULL, &fds,
1ed3f387 349 NULL, sigmask);
549e9569
NB
350}
351
4dd2df09 352int mddev_busy(char *devnm)
8382f19b
NB
353{
354 struct mdstat_ent *mdstat = mdstat_read(0, 0);
355 struct mdstat_ent *me;
356
357 for (me = mdstat ; me ; me = me->next)
4dd2df09 358 if (strcmp(me->devnm, devnm) == 0)
8382f19b
NB
359 break;
360 free_mdstat(mdstat);
361 return me != NULL;
362}
3b57c466
N
363
364struct mdstat_ent *mdstat_by_component(char *name)
365{
366 struct mdstat_ent *mdstat = mdstat_read(0, 0);
367
368 while (mdstat) {
369 struct dev_member *m;
370 struct mdstat_ent *ent;
371 if (mdstat->metadata_version &&
372 strncmp(mdstat->metadata_version, "external:", 9) == 0 &&
373 is_subarray(mdstat->metadata_version+9))
374 /* don't return subarrays, only containers */
375 ;
376 else for (m = mdstat->members; m; m = m->next) {
377 if (strcmp(m->name, name) == 0) {
378 free_mdstat(mdstat->next);
379 mdstat->next = NULL;
380 return mdstat;
381 }
382 }
383 ent = mdstat;
384 mdstat = mdstat->next;
385 ent->next = NULL;
386 free_mdstat(ent);
387 }
388 return NULL;
389}
78b10e66 390
4dd2df09 391struct mdstat_ent *mdstat_by_subdev(char *subdev, char *container)
78b10e66
N
392{
393 struct mdstat_ent *mdstat = mdstat_read(0, 0);
4dd2df09 394 struct mdstat_ent *ent = NULL;
78b10e66
N
395
396 while (mdstat) {
78b10e66 397 /* metadata version must match:
4dd2df09
N
398 * external:[/-]%s/%s
399 * where first %s is 'container' and second %s is 'subdev'
78b10e66 400 */
4dd2df09
N
401 if (ent)
402 free_mdstat(ent);
78b10e66
N
403 ent = mdstat;
404 mdstat = mdstat->next;
405 ent->next = NULL;
4dd2df09
N
406
407 if (ent->metadata_version == NULL ||
408 strncmp(ent->metadata_version, "external:", 9) != 0)
409 continue;
410
411 if (!metadata_container_matches(ent->metadata_version+9,
412 container) ||
413 !metadata_subdev_matches(ent->metadata_version+9,
414 subdev))
415 continue;
416
417 free_mdstat(mdstat);
418 return ent;
78b10e66
N
419 }
420 return NULL;
421}