/*
* mdadm - manage Linux "md" devices aka RAID arrays.
*
- * Copyright (C) 2001-2006 Neil Brown <neilb@suse.de>
+ * Copyright (C) 2001-2009 Neil Brown <neilb@suse.de>
*
*
* This program is free software; you can redistribute it and/or modify
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*
* Author: Neil Brown
- * Email: <neilb@cse.unsw.edu.au>
- * Paper: Neil Brown
- * School of Computer Science and Engineering
- * The University of New South Wales
- * Sydney, 2052
- * Australia
+ * Email: <neilb@suse.de>
*/
#include "mdadm.h"
#include <ctype.h>
-void make_dev_symlink(char *dev)
-{
- char *new = strdup(dev);
-
- if (!new) return;
- /* /dev/md/0 -> /dev/md0
- * /dev/md/d0 -> /dev/md_d0
- */
- if (isdigit(new[8]))
- strcpy(new+7, new+8);
- else
- new[7] = '_';
- symlink(dev+5, new);
-}
-
-
void make_parts(char *dev, int cnt)
{
/* make 'cnt' partition devices for 'dev'
- * We use the major/minor from dev and add 1..cnt
+ * If dev is a device name we use the
+ * major/minor from dev and add 1..cnt
+ * If it is a symlink, we make similar symlinks.
* If dev ends with a digit, we add "p%d" else "%d"
* If the name exists, we use it's owner/mode,
* else that of dev
*/
struct stat stb;
- int major, minor;
+ int major_num;
+ int minor_num;
+ int odig;
int i;
int nlen = strlen(dev) + 20;
- char *name = malloc(nlen);
+ char *name;
int dig = isdigit(dev[strlen(dev)-1]);
+ char orig[1024];
+ char sym[1024];
+ int err;
if (cnt==0) cnt=4;
- if (stat(dev, &stb)!= 0)
+ if (lstat(dev, &stb)!= 0)
return;
- if (!S_ISBLK(stb.st_mode))
+
+ if (S_ISBLK(stb.st_mode)) {
+ major_num = major(stb.st_rdev);
+ minor_num = minor(stb.st_rdev);
+ odig = -1;
+ } else if (S_ISLNK(stb.st_mode)) {
+ int len = readlink(dev, orig, sizeof(orig));
+ if (len < 0 || len > 1000)
+ return;
+ orig[len] = 0;
+ odig = isdigit(orig[len-1]);
+ major_num = -1;
+ minor_num = -1;
+ } else
return;
- major = major(stb.st_rdev);
- minor = minor(stb.st_rdev);
+ name = malloc(nlen);
for (i=1; i <= cnt ; i++) {
struct stat stb2;
snprintf(name, nlen, "%s%s%d", dev, dig?"p":"", i);
if (stat(name, &stb2)==0) {
- if (!S_ISBLK(stb2.st_mode))
+ if (!S_ISBLK(stb2.st_mode) || !S_ISBLK(stb.st_mode))
continue;
- if (stb2.st_rdev == makedev(major, minor+i))
+ if (stb2.st_rdev == makedev(major_num, minor_num+i))
continue;
unlink(name);
} else {
stb2 = stb;
}
- if (mknod(name, S_IFBLK | 0600, makedev(major, minor+i)))
- perror("mknod");
- if (chown(name, stb2.st_uid, stb2.st_gid))
- perror("chown");
- if (chmod(name, stb2.st_mode & 07777))
- perror("chmod");
- if (strncmp(name, "/dev/md/", 8) == 0)
- make_dev_symlink(name);
- stat(name, &stb2);
- add_dev(name, &stb2, 0, NULL);
+ if (S_ISBLK(stb.st_mode)) {
+ if (mknod(name, S_IFBLK | 0600,
+ makedev(major_num, minor_num+i)))
+ perror("mknod");
+ if (chown(name, stb2.st_uid, stb2.st_gid))
+ perror("chown");
+ if (chmod(name, stb2.st_mode & 07777))
+ perror("chmod");
+ err = 0;
+ } else {
+ snprintf(sym, sizeof(sym), "%s%s%d", orig, odig?"p":"", i);
+ err = symlink(sym, name);
+ }
+
+ if (err == 0 && stat(name, &stb2) == 0)
+ add_dev(name, &stb2, 0, NULL);
}
+ free(name);
}
/*
- * Open a given md device, and check that it really is one.
- * If 'autof' is given, then we need to create, or recreate, the md device.
- * If the name already exists, and is not a block device, we fail.
- * If it exists and is not an md device, is not the right type (partitioned or not),
- * or is currently in-use, we remove the device, but remember the owner and mode.
- * If it now doesn't exist, we find a new md array and create the device.
- * Default ownership/mode comes from config file.
+ * We need a new md device to assemble/build/create an array.
+ * 'dev' is a name given us by the user (command line or mdadm.conf)
+ * It might start with /dev or /dev/md any might end with a digit
+ * string.
+ * If it starts with just /dev, it must be /dev/mdX or /dev/md_dX
+ * If it ends with a digit string, then it must be as above, or
+ * 'trustworthy' must be 'METADATA' and the 'dev' must be
+ * /dev/md/'name'NN or 'name'NN
+ * If it doesn't end with a digit string, it must be /dev/md/'name'
+ * or 'name' or must be NULL.
+ * If the digit string is present, it gives the minor number to use
+ * If not, we choose a high, unused minor number.
+ * If the 'dev' is a standard name, it devices whether 'md' or 'mdp'.
+ * else if the name is 'd[0-9]+' then we use mdp
+ * else if trustworthy is 'METADATA' we use md
+ * else the choice depends on 'autof'.
+ * If name is NULL it is assumed to match whatever dev provides.
+ * If both name and dev are NULL, we choose a name 'mdXX' or 'mdpXX'
+ *
+ * If 'name' is given, and 'trustworthy' is 'foreign' and name is not
+ * supported by 'dev', we add a "_%d" suffix based on the minor number
+ * use that.
+ *
+ * If udev is configured, we create a temporary device, open it, and
+ * unlink it.
+ * If not, we create the /dev/mdXX device, and is name is usable,
+ * /dev/md/name
+ * In any case we return /dev/md/name or (if that isn't available)
+ * /dev/mdXX in 'chosen'.
+ *
+ * When we create devices, we use uid/gid/umask from config file.
*/
-int open_mddev(char *dev, int autof)
+
+int create_mddev(char *dev, char *name, int autof, int trustworthy,
+ char *chosen)
{
int mdfd;
struct stat stb;
- int major = MD_MAJOR;
- int minor = 0;
- int must_remove = 0;
- struct mdstat_ent *mdlist;
- int num;
+ int num = -1;
+ int use_mdp = -1;
struct createinfo *ci = conf_get_create_info();
int parts;
+ char *cname;
+ char devname[20];
+ char cbuf[400];
+ if (chosen == NULL)
+ chosen = cbuf;
+
if (autof == 0)
autof = ci->autof;
parts = autof >> 3;
autof &= 7;
- if (autof && autof != 1) {
- /* autof is set, so we need to check that the name is ok,
- * and possibly create one if not
+ strcpy(chosen, "/dev/md/");
+ cname = chosen + strlen(chosen);
+
+
+ if (dev) {
+ if (strncmp(dev, "/dev/md/", 8) == 0) {
+ strcpy(cname, dev+8);
+ } else if (strncmp(dev, "/dev/", 5) == 0) {
+ char *e = dev + strlen(dev);
+ while (e > dev && isdigit(e[-1]))
+ e--;
+ if (e[0])
+ num = strtoul(e, NULL, 10);
+ strcpy(cname, dev+5);
+ cname[e-(dev+5)] = 0;
+ /* name *must* be mdXX or md_dXX in this context */
+ if (num < 0 ||
+ (strcmp(cname, "md") != 0 && strcmp(cname, "md_d") != 0)) {
+ fprintf(stderr, Name ": %s is an invalid name "
+ "for an md device. Try /dev/md/%s\n",
+ dev, dev+5);
+ return -1;
+ }
+ if (strcmp(cname, "md") == 0)
+ use_mdp = 0;
+ else
+ use_mdp = 1;
+ /* recreate name: /dev/md/0 or /dev/md/d0 */
+ sprintf(cname, "%s%d", use_mdp?"d":"", num);
+ } else
+ strcpy(cname, dev);
+
+ /* 'cname' must not contain a slash, and may not be
+ * empty.
*/
- int std;
- stb.st_mode = 0;
- if (stat(dev, &stb)==0 && ! S_ISBLK(stb.st_mode)) {
- fprintf(stderr, Name ": %s is not a block device.\n",
- dev);
+ if (strchr(cname, '/') != NULL) {
+ fprintf(stderr, Name ": %s is an invalid name "
+ "for an md device.\n", dev);
return -1;
}
- if (autof == 2 && stb.st_mode == 0 && !is_standard(dev, NULL)) {
- fprintf(stderr, Name ": --auto=yes requires a 'standard' md device name, not %s\n", dev);
+ if (cname[0] == 0) {
+ fprintf(stderr, Name ": %s is an invalid name "
+ "for an md device (empty!).", dev);
return -1;
}
- /* check major number is correct */
- num = -1;
- std = is_standard(dev, &num);
- if (std>0) major = get_mdp_major();
- switch(autof) {
- case 2: /* only create is_standard names */
- if (!std && !stb.st_mode) {
- fprintf(stderr, Name ": --auto=yes requires a 'standard' md device name, not %s\n", dev);
- return -1;
- }
- break;
- case 3: /* create md, reject std>0 */
- if (std > 0) {
- fprintf(stderr, Name ": that --auto option not compatable with device named %s\n", dev);
- return -1;
- }
- break;
- case 4: /* create mdp, reject std<0 */
- if (std < 0) {
- fprintf(stderr, Name ": that --auto option not compatable with device named %s\n", dev);
- return -1;
- }
- break;
- case 5: /* default to md if not standard */
- break;
- case 6: /* default to mdp if not standard */
- if (std == 0) major = get_mdp_major();
- break;
- }
- /* major is final. num is -1 if not standard */
- if (stb.st_mode && major(stb.st_rdev) != major)
- must_remove = 1;
- if (stb.st_mode && !must_remove) {
- mdu_array_info_t array;
- /* looks ok, see if it is available */
- mdfd = open(dev, O_RDWR, 0);
- if (mdfd < 0) {
- fprintf(stderr, Name ": error opening %s: %s\n",
- dev, strerror(errno));
- return -1;
- } else if (md_get_version(mdfd) <= 0) {
- fprintf(stderr, Name ": %s does not appear to be an md device\n",
- dev);
- close(mdfd);
- return -1;
- }
- if (ioctl(mdfd, GET_ARRAY_INFO, &array)==0) {
- /* already active */
- close(mdfd);
- fprintf(stderr, Name ": %s is already active.\n",
- dev);
- return -1;
- } else {
- if (major != MD_MAJOR && parts > 0)
- make_parts(dev, parts);
- return mdfd;
- }
- }
- /* Ok, need to find a minor that is not in use.
- * If the device name is in a 'standard' format,
- * intuit the minor from that, else
- * easiest to read /proc/mdstat, and hunt through for
- * an unused number
- */
if (num < 0) {
- /* need to pick an unused number */
- mdlist = mdstat_read(0, 0);
- /* Choose a large number. Start from 127 and search down,
- * but if nothing is found, start really big
+ /* If cname is 'N' or 'dN', we get dev number
+ * from there.
*/
- for (num = 127 ; num != 128 ; num = num ? num-1 : (1<<22)-1) {
- struct mdstat_ent *me;
- int devnum = num;
- if (major != MD_MAJOR)
- devnum = -1-num;
+ char *sp = cname;
+ char *ep;
+ if (cname[0] == 'd')
+ sp++;
+ num = strtoul(sp, &ep, 10);
+ if (ep == sp || *ep || num < 0)
+ num = -1;
+ else if (cname[0] == 'd')
+ use_mdp = 1;
+ else
+ use_mdp = 0;
+ }
+ }
- for (me=mdlist; me; me=me->next)
- if (me->devnum == devnum)
- break;
- if (!me) {
- /* doesn't exist in mdstat.
- * make sure it is new to /dev too
- */
- char *dn;
- if (major != MD_MAJOR)
- minor = num << MdpMinorShift;
- else
- minor = num;
- dn = map_dev(major,minor, 0);
- if (dn==NULL || is_standard(dn, NULL)) {
- /* this number only used by a 'standard' name,
- * so it is safe to use
- */
- break;
- }
- }
- }
- } else if (major == MD_MAJOR)
- minor = num;
+ /* Now determine device number */
+ /* named 'METADATA' cannot use 'mdp'. */
+ if (name && name[0] == 0)
+ name = NULL;
+ if (name && trustworthy == METADATA && use_mdp == 1) {
+ fprintf(stderr, Name ": %s is not allowed for a %s container. "
+ "Consider /dev/md%d.\n", dev, name, num);
+ return -1;
+ }
+ if (name && trustworthy == METADATA)
+ use_mdp = 0;
+ if (use_mdp == -1) {
+ if (autof == 4 || autof == 6)
+ use_mdp = 1;
else
- minor = num << MdpMinorShift;
- /* major and minor have been chosen */
+ use_mdp = 0;
+ }
+ if (num < 0 && trustworthy == LOCAL && name) {
+ /* if name is numeric, possibly prefixed by
+ * 'md' or '/dev/md', use that for num
+ * if it is not already in use */
+ char *ep;
+ char *n2 = name;
+ if (strncmp(n2, "/dev/", 5) == 0)
+ n2 += 5;
+ if (strncmp(n2, "md", 2) == 0)
+ n2 += 2;
+ if (*n2 == '/')
+ n2++;
+ num = strtoul(n2, &ep, 10);
+ if (ep == n2 || *ep)
+ num = -1;
+ else if (mddev_busy(use_mdp ? (-1-num) : num))
+ num = -1;
+ }
- /* If it was a 'standard' name and it is in-use, then
- * the device could already be correct
+ if (num < 0) {
+ /* need to choose a free number. */
+ num = find_free_devnum(use_mdp);
+ if (num == NoMdDev) {
+ fprintf(stderr, Name ": No avail md devices - aborting\n");
+ return -1;
+ }
+ } else {
+ num = use_mdp ? (-1-num) : num;
+ if (mddev_busy(num)) {
+ fprintf(stderr, Name ": %s is already in use.\n",
+ dev);
+ return -1;
+ }
+ }
+
+ if (num < 0)
+ sprintf(devname, "/dev/md_d%d", -1-num);
+ else
+ sprintf(devname, "/dev/md%d", num);
+
+ if (cname[0] == 0 && name) {
+ /* Need to find a name if we can
+ * We don't completely trust 'name'. Truncate to
+ * reasonable length and remove '/'
*/
- if (stb.st_mode && major(stb.st_rdev) == major &&
- minor(stb.st_rdev) == minor)
- ;
- else {
- if (major(makedev(major,minor)) != major ||
- minor(makedev(major,minor)) != minor) {
- fprintf(stderr, Name ": Need newer C library to use more than 4 partitionable md devices, sorry\n");
- return -1;
- }
- if (must_remove)
- unlink(dev);
+ char *cp;
+ struct map_ent *map = NULL;
+ int conflict = 1;
+ int unum = 0;
+ int cnlen;
+ strncpy(cname, name, 200);
+ cname[200] = 0;
+ while ((cp = strchr(cname, '/')) != NULL)
+ *cp = '-';
+ if (trustworthy == LOCAL ||
+ (trustworthy == FOREIGN && strchr(cname, ':') != NULL)) {
+ /* Only need suffix if there is a conflict */
+ if (map_by_name(&map, cname) == NULL)
+ conflict = 0;
+ }
+ cnlen = strlen(cname);
+ while (conflict) {
+ if (trustworthy == METADATA && !isdigit(cname[cnlen-1]))
+ sprintf(cname+cnlen, "%d", unum);
+ else
+ /* add _%d to FOREIGN array that don't
+ * a 'host:' prefix
+ */
+ sprintf(cname+cnlen, "_%d", unum);
+ unum++;
+ if (map_by_name(&map, cname) == NULL)
+ conflict = 0;
+ }
+ }
- if (strncmp(dev, "/dev/md/", 8) == 0) {
- if (mkdir("/dev/md",0700)==0) {
- chown("/dev/md", ci->uid, ci->gid);
- chmod("/dev/md", ci->mode| ((ci->mode>>2) & 0111));
- }
+ if (dev && dev[0] == '/')
+ strcpy(chosen, dev);
+ else if (cname[0] == 0)
+ strcpy(chosen, devname);
+
+ /* We have a device number and name.
+ * If we cannot detect udev, we need to make
+ * devices and links ourselves.
+ */
+ if (stat("/dev/.udev", &stb) != 0 ||
+ check_env("MDADM_NO_UDEV")) {
+ /* Make sure 'devname' exists and 'chosen' is a symlink to it */
+ if (lstat(devname, &stb) == 0) {
+ /* Must be the correct device, else error */
+ if ((stb.st_mode&S_IFMT) != S_IFBLK ||
+ stb.st_rdev != makedev(dev2major(num),dev2minor(num))) {
+ fprintf(stderr, Name ": %s exists but looks wrong, please fix\n",
+ devname);
+ return -1;
}
- if (mknod(dev, S_IFBLK|0600, makedev(major, minor))!= 0) {
- fprintf(stderr, Name ": failed to create %s\n", dev);
+ } else {
+ if (mknod(devname, S_IFBLK|0600,
+ makedev(dev2major(num),dev2minor(num))) != 0) {
+ fprintf(stderr, Name ": failed to create %s\n",
+ devname);
return -1;
}
- if (must_remove) {
- if (chown(dev, stb.st_uid, stb.st_gid))
- perror("chown");
- if (chmod(dev, stb.st_mode & 07777))
- perror("chmod");
- } else {
- if (chown(dev, ci->uid, ci->gid))
- perror("chown");
- if (chmod(dev, ci->mode))
- perror("chmod");
+ if (chown(devname, ci->uid, ci->gid))
+ perror("chown");
+ if (chmod(devname, ci->mode))
+ perror("chmod");
+ stat(devname, &stb);
+ add_dev(devname, &stb, 0, NULL);
+ }
+ if (use_mdp == 1)
+ make_parts(devname, parts);
+ if (strcmp(chosen, devname) != 0) {
+
+ if (mkdir("/dev/md",0700)==0) {
+ if (chown("/dev/md", ci->uid, ci->gid))
+ perror("chown /dev/md");
+ if (chmod("/dev/md", ci->mode| ((ci->mode>>2) & 0111)))
+ perror("chmod /dev/md");
}
- stat(dev, &stb);
- add_dev(dev, &stb, 0, NULL);
- if (strncmp(dev, "/dev/md/", 8) == 0)
- make_dev_symlink(dev);
- if (major != MD_MAJOR)
- make_parts(dev,parts);
+
+ if (dev && strcmp(chosen, dev) == 0)
+ /* We know we are allowed to use this name */
+ unlink(chosen);
+
+ if (lstat(chosen, &stb) == 0) {
+ char buf[300];
+ ssize_t link_len = readlink(chosen, buf, sizeof(buf)-1);
+ if (link_len >= 0)
+ buf[link_len] = '\0';
+
+ if ((stb.st_mode & S_IFMT) != S_IFLNK ||
+ link_len < 0 ||
+ strcmp(buf, devname) != 0) {
+ fprintf(stderr, Name ": %s exists - ignoring\n",
+ chosen);
+ strcpy(chosen, devname);
+ }
+ } else if (symlink(devname, chosen) != 0)
+ fprintf(stderr, Name ": failed to create %s: %s\n",
+ chosen, strerror(errno));
+ if (use_mdp && strcmp(chosen, devname) != 0)
+ make_parts(chosen, parts);
}
}
- mdfd = open(dev, O_RDWR, 0);
+ mdfd = open_dev_excl(num);
if (mdfd < 0)
- fprintf(stderr, Name ": error opening %s: %s\n",
- dev, strerror(errno));
- else if (md_get_version(mdfd) <= 0) {
- fprintf(stderr, Name ": %s does not appear to be an md device\n",
- dev);
+ fprintf(stderr, Name ": unexpected failure opening %s\n",
+ devname);
+ return mdfd;
+}
+
+
+/* Open this and check that it is an md device.
+ * On success, return filedescriptor.
+ * On failure, return -1 if it doesn't exist,
+ * or -2 if it exists but is not an md device.
+ */
+int open_mddev(char *dev, int report_errors)
+{
+ int mdfd = open(dev, O_RDWR);
+ if (mdfd < 0 && errno == EACCES)
+ mdfd = open(dev, O_RDONLY);
+ if (mdfd < 0) {
+ if (report_errors)
+ fprintf(stderr, Name ": error opening %s: %s\n",
+ dev, strerror(errno));
+ return -1;
+ }
+ if (md_get_version(mdfd) <= 0) {
close(mdfd);
- mdfd = -1;
+ if (report_errors)
+ fprintf(stderr, Name ": %s does not appear to be "
+ "an md device\n", dev);
+ return -2;
}
return mdfd;
}
-