summary | refs | log | tree | commit | diff | stats
path: root/mdadm.c
diff options
context:
space:
mode:
Diffstat (limited to '')
-rw-r--r-- mdadm.c 2078
-rw-r--r-- mdadm.conf-example 65
-rw-r--r-- mdadm.conf.5 706
3 files changed, 2849 insertions, 0 deletions
diff --git a/mdadm.c b/mdadm.c
new file mode 100644
index 0000000..26299b2
--- /dev/null
+++ b/mdadm.c
@@ -0,0 +1,2078 @@
+/*
+ * mdadm - manage Linux "md" devices aka RAID arrays.
+ *
+ * Copyright (C) 2001-2013 Neil Brown <neilb@suse.de>
+ *
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+ *
+ * Author: Neil Brown
+ * Email: <neilb@suse.de>
+ *
+ * Additions for bitmap and write-behind RAID options, Copyright (C) 2003-2004,
+ * Paul Clements, SteelEye Technology, Inc.
+ */
+
+#include "mdadm.h"
+#include "md_p.h"
+#include <ctype.h>
+
+/* Prototypes for file-local (static) helpers that are defined outside this part of the file. */
+static int scan_assemble(struct supertype *ss, struct context *c,
+			  struct mddev_ident *ident);
+static int misc_scan(char devmode, struct context *c);
+static int stop_scan(int verbose);
+static int misc_list(struct mddev_dev *devlist, struct mddev_ident *ident,
+		      char *dump_directory, struct supertype *ss,
+		      struct context *c);
+/* Program name; main() prints it as the "<name>: " prefix of its --update messages. */
+const char Name[] = "mdadm";
+
+int main(int argc, char *argv[])
+{
+ int mode = 0;
+ int opt;
+ int option_index;
+ int rv;
+ int i;
+
+ unsigned long long array_size = 0;
+ unsigned long long data_offset = INVALID_SECTORS;
+ struct mddev_ident ident;
+ char *configfile = NULL;
+ int devmode = 0;
+ int bitmap_fd = -1;
+ struct mddev_dev *devlist = NULL;
+ struct mddev_dev **devlistend = & devlist;
+ struct mddev_dev *dv;
+ mdu_array_info_t array;
+ int devs_found = 0;
+ char *symlinks = NULL;
+ int grow_continue = 0;
+ /* autof indicates whether and how to create device node.
+ * bottom 3 bits are style. Rest (when shifted) are number of parts
+ * 0 - unset
+ * 1 - don't create (no)
+ * 2 - if is_standard, then create (yes)
+ * 3 - create as 'md' - reject is_standard mdp (md)
+ * 4 - create as 'mdp' - reject is_standard md (mdp)
+ * 5 - default to md if not is_standard (md in config file)
+ * 6 - default to mdp if not is_standard (part, or mdp in config file)
+ */
+ struct context c = {
+ .require_homehost = 1,
+ };
+ struct shape s = {
+ .journaldisks = 0,
+ .level = UnSet,
+ .layout = UnSet,
+ .bitmap_chunk = UnSet,
+ .consistency_policy = CONSISTENCY_POLICY_UNKNOWN,
+ };
+
+ char sys_hostname[256];
+ char *mailaddr = NULL;
+ char *program = NULL;
+ int increments = 20;
+ int daemonise = 0;
+ char *pidfile = NULL;
+ int oneshot = 0;
+ int spare_sharing = 1;
+ struct supertype *ss = NULL;
+ enum flag_mode writemostly = FlagDefault;
+ enum flag_mode failfast = FlagDefault;
+ char *shortopt = short_options;
+ int dosyslog = 0;
+ int rebuild_map = 0;
+ char *remove_path = NULL;
+ char *udev_filename = NULL;
+ char *dump_directory = NULL;
+
+ int print_help = 0;
+ FILE *outf;
+
+ int mdfd = -1;
+ int locked = 0;
+
+ srandom(time(0) ^ getpid());
+
+ ident.uuid_set = 0;
+ ident.level = UnSet;
+ ident.raid_disks = UnSet;
+ ident.super_minor = UnSet;
+ ident.devices = 0;
+ ident.spare_group = NULL;
+ ident.autof = 0;
+ ident.st = NULL;
+ ident.bitmap_fd = -1;
+ ident.bitmap_file = NULL;
+ ident.name[0] = 0;
+ ident.container = NULL;
+ ident.member = NULL;
+
+ if (get_linux_version() < 2006015) {
+ pr_err("This version of mdadm does not support kernels older than 2.6.15\n");
+ exit(1);
+ }
+
+ while ((option_index = -1),
+ (opt = getopt_long(argc, argv, shortopt, long_options,
+ &option_index)) != -1) {
+ int newmode = mode;
+ /* firstly, some mode-independent options */
+ switch(opt) {
+ case HelpOptions:
+ print_help = 2;
+ continue;
+ case 'h':
+ print_help = 1;
+ continue;
+
+ case 'V':
+ fputs(Version, stderr);
+ exit(0);
+
+ case 'v': c.verbose++;
+ continue;
+
+ case 'q': c.verbose--;
+ continue;
+
+ case 'b':
+ if (mode == ASSEMBLE || mode == BUILD ||
+ mode == CREATE || mode == GROW ||
+ mode == INCREMENTAL || mode == MANAGE)
+ break; /* b means bitmap */
+ case Brief:
+ c.brief = 1;
+ continue;
+
+ case NoDevices:
+ c.no_devices = 1;
+ continue;
+
+ case 'Y': c.export++;
+ continue;
+
+ case HomeHost:
+ if (strcasecmp(optarg, "<ignore>") == 0)
+ c.require_homehost = 0;
+ else
+ c.homehost = optarg;
+ continue;
+
+ case OffRootOpt:
+ /* Silently ignore old option */
+ continue;
+
+ case Prefer:
+ if (c.prefer)
+ free(c.prefer);
+ if (asprintf(&c.prefer, "/%s/", optarg) <= 0)
+ c.prefer = NULL;
+ continue;
+
+ case ':':
+ case '?':
+ fputs(Usage, stderr);
+ exit(2);
+ }
+ /* second, figure out the mode.
+ * Some options force the mode. Others
+ * set the mode if it isn't already
+ */
+
+ switch(opt) {
+ case ManageOpt:
+ newmode = MANAGE;
+ shortopt = short_bitmap_options;
+ break;
+ case 'a':
+ case Add:
+ case AddSpare:
+ case AddJournal:
+ case 'r':
+ case Remove:
+ case Replace:
+ case With:
+ case 'f':
+ case Fail:
+ case ReAdd: /* re-add */
+ case ClusterConfirm:
+ if (!mode) {
+ newmode = MANAGE;
+ shortopt = short_bitmap_options;
+ }
+ break;
+
+ case 'A': newmode = ASSEMBLE;
+ shortopt = short_bitmap_auto_options;
+ break;
+ case 'B': newmode = BUILD;
+ shortopt = short_bitmap_auto_options;
+ break;
+ case 'C': newmode = CREATE;
+ shortopt = short_bitmap_auto_options;
+ break;
+ case 'F': newmode = MONITOR;
+ break;
+ case 'G': newmode = GROW;
+ shortopt = short_bitmap_options;
+ break;
+ case 'I': newmode = INCREMENTAL;
+ shortopt = short_bitmap_auto_options;
+ break;
+ case AutoDetect:
+ newmode = AUTODETECT;
+ break;
+
+ case MiscOpt:
+ case 'D':
+ case 'E':
+ case 'X':
+ case 'Q':
+ case ExamineBB:
+ case Dump:
+ case Restore:
+ case Action:
+ newmode = MISC;
+ break;
+
+ case 'R':
+ case 'S':
+ case 'o':
+ case 'w':
+ case 'W':
+ case WaitOpt:
+ case Waitclean:
+ case DetailPlatform:
+ case KillSubarray:
+ case UpdateSubarray:
+ case UdevRules:
+ case KillOpt:
+ if (!mode)
+ newmode = MISC;
+ break;
+
+ case NoSharing:
+ newmode = MONITOR;
+ break;
+ }
+ if (mode && newmode == mode) {
+ /* everybody happy ! */
+ } else if (mode && newmode != mode) {
+ /* not allowed.. */
+ pr_err("");
+ if (option_index >= 0)
+ fprintf(stderr, "--%s", long_options[option_index].name);
+ else
+ fprintf(stderr, "-%c", opt);
+ fprintf(stderr, " would set mdadm mode to \"%s\", but it is already set to \"%s\".\n",
+ map_num(modes, newmode),
+ map_num(modes, mode));
+ exit(2);
+ } else if (!mode && newmode) {
+ mode = newmode;
+ if (mode == MISC && devs_found) {
+ pr_err("No action given for %s in --misc mode\n",
+ devlist->devname);
+ cont_err("Action options must come before device names\n");
+ exit(2);
+ }
+ } else {
+ /* special case of -c --help */
+ if ((opt == 'c' || opt == ConfigFile) &&
+ (strncmp(optarg, "--h", 3) == 0 ||
+ strncmp(optarg, "-h", 2) == 0)) {
+ fputs(Help_config, stdout);
+ exit(0);
+ }
+
+ /* If first option is a device, don't force the mode yet */
+ if (opt == 1) {
+ if (devs_found == 0) {
+ dv = xmalloc(sizeof(*dv));
+ dv->devname = optarg;
+ dv->disposition = devmode;
+ dv->writemostly = writemostly;
+ dv->failfast = failfast;
+ dv->used = 0;
+ dv->next = NULL;
+ *devlistend = dv;
+ devlistend = &dv->next;
+
+ devs_found++;
+ continue;
+ }
+ /* No mode yet, and this is the second device ... */
+ pr_err("An option must be given to set the mode before a second device\n"
+ " (%s) is listed\n", optarg);
+ exit(2);
+ }
+ if (option_index >= 0)
+ pr_err("--%s", long_options[option_index].name);
+ else
+ pr_err("-%c", opt);
+ fprintf(stderr, " does not set the mode, and so cannot be the first option.\n");
+ exit(2);
+ }
+
+ /* if we just set the mode, then done */
+ switch(opt) {
+ case ManageOpt:
+ case MiscOpt:
+ case 'A':
+ case 'B':
+ case 'C':
+ case 'F':
+ case 'G':
+ case 'I':
+ case AutoDetect:
+ continue;
+ }
+ if (opt == 1) {
+ /* an undecorated option - must be a device name.
+ */
+
+ if (devs_found > 0 && devmode == DetailPlatform) {
+ pr_err("controller may only be specified once. %s ignored\n",
+ optarg);
+ continue;
+ }
+
+ if (devs_found > 0 && mode == MANAGE && !devmode) {
+ pr_err("Must give one of -a/-r/-f for subsequent devices at %s\n", optarg);
+ exit(2);
+ }
+ if (devs_found > 0 && mode == GROW && !devmode) {
+ pr_err("Must give -a/--add for devices to add: %s\n", optarg);
+ exit(2);
+ }
+ dv = xmalloc(sizeof(*dv));
+ dv->devname = optarg;
+ dv->disposition = devmode;
+ dv->writemostly = writemostly;
+ dv->failfast = failfast;
+ dv->used = 0;
+ dv->next = NULL;
+ *devlistend = dv;
+ devlistend = &dv->next;
+
+ devs_found++;
+ continue;
+ }
+
+ /* We've got a mode, and opt is now something else which
+ * could depend on the mode */
+#define O(a,b) ((a<<16)|b)
+ switch (O(mode,opt)) {
+ case O(GROW,'c'):
+ case O(GROW,ChunkSize):
+ case O(CREATE,'c'):
+ case O(CREATE,ChunkSize):
+ case O(BUILD,'c'): /* chunk or rounding */
+ case O(BUILD,ChunkSize): /* chunk or rounding */
+ if (s.chunk) {
+ pr_err("chunk/rounding may only be specified once. Second value is %s.\n", optarg);
+ exit(2);
+ }
+ s.chunk = parse_size(optarg);
+ if (s.chunk == INVALID_SECTORS ||
+ s.chunk < 8 || (s.chunk&1)) {
+ pr_err("invalid chunk/rounding value: %s\n",
+ optarg);
+ exit(2);
+ }
+ /* Convert sectors to K */
+ s.chunk /= 2;
+ continue;
+
+ case O(INCREMENTAL, 'e'):
+ case O(CREATE,'e'):
+ case O(ASSEMBLE,'e'):
+ case O(MISC,'e'): /* set metadata (superblock) information */
+ if (ss) {
+ pr_err("metadata information already given\n");
+ exit(2);
+ }
+ for(i = 0; !ss && superlist[i]; i++)
+ ss = superlist[i]->match_metadata_desc(optarg);
+
+ if (!ss) {
+ pr_err("unrecognised metadata identifier: %s\n", optarg);
+ exit(2);
+ }
+ continue;
+
+ case O(MANAGE,'W'):
+ case O(MANAGE,WriteMostly):
+ case O(BUILD,'W'):
+ case O(BUILD,WriteMostly):
+ case O(CREATE,'W'):
+ case O(CREATE,WriteMostly):
+ /* set write-mostly for following devices */
+ writemostly = FlagSet;
+ continue;
+
+ case O(MANAGE,'w'):
+ /* clear write-mostly for following devices */
+ writemostly = FlagClear;
+ continue;
+
+ case O(MANAGE,FailFast):
+ case O(CREATE,FailFast):
+ failfast = FlagSet;
+ continue;
+ case O(MANAGE,NoFailFast):
+ failfast = FlagClear;
+ continue;
+
+ case O(GROW,'z'):
+ case O(CREATE,'z'):
+ case O(BUILD,'z'): /* size */
+ if (s.size > 0) {
+ pr_err("size may only be specified once. Second value is %s.\n", optarg);
+ exit(2);
+ }
+ if (strcmp(optarg, "max") == 0)
+ s.size = MAX_SIZE;
+ else {
+ s.size = parse_size(optarg);
+ if (s.size == INVALID_SECTORS || s.size < 8) {
+ pr_err("invalid size: %s\n", optarg);
+ exit(2);
+ }
+ /* convert sectors to K */
+ s.size /= 2;
+ }
+ continue;
+
+ case O(GROW,'Z'): /* array size */
+ if (array_size > 0) {
+ pr_err("array-size may only be specified once. Second value is %s.\n", optarg);
+ exit(2);
+ }
+ if (strcmp(optarg, "max") == 0)
+ array_size = MAX_SIZE;
+ else {
+ array_size = parse_size(optarg);
+ if (array_size == 0 ||
+ array_size == INVALID_SECTORS) {
+ pr_err("invalid array size: %s\n",
+ optarg);
+ exit(2);
+ }
+ }
+ continue;
+
+ case O(CREATE,DataOffset):
+ case O(GROW,DataOffset):
+ if (data_offset != INVALID_SECTORS) {
+ pr_err("data-offset may only be specified one. Second value is %s.\n", optarg);
+ exit(2);
+ }
+ if (mode == CREATE && strcmp(optarg, "variable") == 0)
+ data_offset = VARIABLE_OFFSET;
+ else
+ data_offset = parse_size(optarg);
+ if (data_offset == INVALID_SECTORS) {
+ pr_err("invalid data-offset: %s\n",
+ optarg);
+ exit(2);
+ }
+ continue;
+
+ case O(GROW,'l'):
+ case O(CREATE,'l'):
+ case O(BUILD,'l'): /* set raid level*/
+ if (s.level != UnSet) {
+ pr_err("raid level may only be set once. Second value is %s.\n", optarg);
+ exit(2);
+ }
+ s.level = map_name(pers, optarg);
+ if (s.level == UnSet) {
+ pr_err("invalid raid level: %s\n",
+ optarg);
+ exit(2);
+ }
+ if (s.level != 0 && s.level != LEVEL_LINEAR &&
+ s.level != 1 && s.level != LEVEL_MULTIPATH &&
+ s.level != LEVEL_FAULTY && s.level != 10 &&
+ mode == BUILD) {
+ pr_err("Raid level %s not permitted with --build.\n",
+ optarg);
+ exit(2);
+ }
+ if (s.sparedisks > 0 && s.level < 1 && s.level >= -1) {
+ pr_err("raid level %s is incompatible with spare-devices setting.\n",
+ optarg);
+ exit(2);
+ }
+ ident.level = s.level;
+ continue;
+
+ case O(GROW, 'p'): /* new layout */
+ case O(GROW, Layout):
+ if (s.layout_str) {
+ pr_err("layout may only be sent once. Second value was %s\n", optarg);
+ exit(2);
+ }
+ s.layout_str = optarg;
+ /* 'Grow' will parse the value */
+ continue;
+
+ case O(CREATE,'p'): /* raid5 layout */
+ case O(CREATE,Layout):
+ case O(BUILD,'p'): /* faulty layout */
+ case O(BUILD,Layout):
+ if (s.layout != UnSet) {
+ pr_err("layout may only be sent once. Second value was %s\n", optarg);
+ exit(2);
+ }
+ switch(s.level) {
+ default:
+ pr_err("layout not meaningful for %s arrays.\n",
+ map_num(pers, s.level));
+ exit(2);
+ case UnSet:
+ pr_err("raid level must be given before layout.\n");
+ exit(2);
+
+ case 0:
+ s.layout = map_name(r0layout, optarg);
+ if (s.layout == UnSet) {
+ pr_err("layout %s not understood for raid0.\n",
+ optarg);
+ exit(2);
+ }
+ break;
+ case 5:
+ s.layout = map_name(r5layout, optarg);
+ if (s.layout == UnSet) {
+ pr_err("layout %s not understood for raid5.\n",
+ optarg);
+ exit(2);
+ }
+ break;
+ case 6:
+ s.layout = map_name(r6layout, optarg);
+ if (s.layout == UnSet) {
+ pr_err("layout %s not understood for raid6.\n",
+ optarg);
+ exit(2);
+ }
+ break;
+
+ case 10:
+ s.layout = parse_layout_10(optarg);
+ if (s.layout < 0) {
+ pr_err("layout for raid10 must be 'nNN', 'oNN' or 'fNN' where NN is a number, not %s\n", optarg);
+ exit(2);
+ }
+ break;
+ case LEVEL_FAULTY:
+ /* Faulty
+ * modeNNN
+ */
+ s.layout = parse_layout_faulty(optarg);
+ if (s.layout == -1) {
+ pr_err("layout %s not understood for faulty.\n",
+ optarg);
+ exit(2);
+ }
+ break;
+ }
+ continue;
+
+ case O(CREATE,AssumeClean):
+ case O(BUILD,AssumeClean): /* assume clean */
+ case O(GROW,AssumeClean):
+ s.assume_clean = 1;
+ continue;
+
+ case O(GROW,'n'):
+ case O(CREATE,'n'):
+ case O(BUILD,'n'): /* number of raid disks */
+ if (s.raiddisks) {
+ pr_err("raid-devices set twice: %d and %s\n",
+ s.raiddisks, optarg);
+ exit(2);
+ }
+ if (parse_num(&s.raiddisks, optarg) != 0 || s.raiddisks <= 0) {
+ pr_err("invalid number of raid devices: %s\n",
+ optarg);
+ exit(2);
+ }
+ ident.raid_disks = s.raiddisks;
+ continue;
+ case O(ASSEMBLE, Nodes):
+ case O(GROW, Nodes):
+ case O(CREATE, Nodes):
+ if (parse_num(&c.nodes, optarg) != 0 || c.nodes < 2) {
+ pr_err("clustered array needs two nodes at least: %s\n",
+ optarg);
+ exit(2);
+ }
+ continue;
+ case O(CREATE, ClusterName):
+ case O(ASSEMBLE, ClusterName):
+ c.homecluster = optarg;
+ if (strlen(c.homecluster) > 64) {
+ pr_err("Cluster name too big.\n");
+ exit(2);
+ }
+ continue;
+ case O(CREATE,'x'): /* number of spare (eXtra) disks */
+ if (s.sparedisks) {
+ pr_err("spare-devices set twice: %d and %s\n",
+ s.sparedisks, optarg);
+ exit(2);
+ }
+ if (s.level != UnSet && s.level <= 0 && s.level >= -1) {
+ pr_err("spare-devices setting is incompatible with raid level %d\n",
+ s.level);
+ exit(2);
+ }
+ if (parse_num(&s.sparedisks, optarg) != 0 || s.sparedisks < 0) {
+ pr_err("invalid number of spare-devices: %s\n",
+ optarg);
+ exit(2);
+ }
+ continue;
+
+ case O(CREATE,'a'):
+ case O(CREATE,Auto):
+ case O(BUILD,'a'):
+ case O(BUILD,Auto):
+ case O(INCREMENTAL,'a'):
+ case O(INCREMENTAL,Auto):
+ case O(ASSEMBLE,'a'):
+ case O(ASSEMBLE,Auto): /* auto-creation of device node */
+ c.autof = parse_auto(optarg, "--auto flag", 0);
+ continue;
+
+ case O(CREATE,Symlinks):
+ case O(BUILD,Symlinks):
+ case O(ASSEMBLE,Symlinks): /* auto creation of symlinks in /dev to /dev/md */
+ symlinks = optarg;
+ continue;
+
+ case O(BUILD,'f'): /* force honouring '-n 1' */
+ case O(BUILD,Force): /* force honouring '-n 1' */
+ case O(GROW,'f'): /* ditto */
+ case O(GROW,Force): /* ditto */
+ case O(CREATE,'f'): /* force honouring of device list */
+ case O(CREATE,Force): /* force honouring of device list */
+ case O(ASSEMBLE,'f'): /* force assembly */
+ case O(ASSEMBLE,Force): /* force assembly */
+ case O(MISC,'f'): /* force zero */
+ case O(MISC,Force): /* force zero */
+ case O(MANAGE,Force): /* add device which is too large */
+ c.force = 1;
+ continue;
+ /* now for the Assemble options */
+ case O(ASSEMBLE, FreezeReshape): /* Freeze reshape during
+ * initrd phase */
+ case O(INCREMENTAL, FreezeReshape):
+ c.freeze_reshape = 1;
+ continue;
+ case O(CREATE,'u'): /* uuid of array */
+ case O(ASSEMBLE,'u'): /* uuid of array */
+ if (ident.uuid_set) {
+ pr_err("uuid cannot be set twice. Second value %s.\n", optarg);
+ exit(2);
+ }
+ if (parse_uuid(optarg, ident.uuid))
+ ident.uuid_set = 1;
+ else {
+ pr_err("Bad uuid: %s\n", optarg);
+ exit(2);
+ }
+ continue;
+
+ case O(CREATE,'N'):
+ case O(ASSEMBLE,'N'):
+ case O(MISC,'N'):
+ if (ident.name[0]) {
+ pr_err("name cannot be set twice. Second value %s.\n", optarg);
+ exit(2);
+ }
+ if (mode == MISC && !c.subarray) {
+ pr_err("-N/--name only valid with --update-subarray in misc mode\n");
+ exit(2);
+ }
+ if (strlen(optarg) > 32) {
+ pr_err("name '%s' is too long, 32 chars max.\n",
+ optarg);
+ exit(2);
+ }
+ strcpy(ident.name, optarg);
+ continue;
+
+ case O(ASSEMBLE,'m'): /* super-minor for array */
+ case O(ASSEMBLE,SuperMinor):
+ if (ident.super_minor != UnSet) {
+ pr_err("super-minor cannot be set twice. Second value: %s.\n", optarg);
+ exit(2);
+ }
+ if (strcmp(optarg, "dev") == 0)
+ ident.super_minor = -2;
+ else if (parse_num(&ident.super_minor, optarg) != 0 || ident.super_minor < 0) {
+ pr_err("Bad super-minor number: %s.\n", optarg);
+ exit(2);
+ }
+ continue;
+
+ case O(ASSEMBLE,'o'):
+ case O(MANAGE,'o'):
+ case O(CREATE,'o'):
+ c.readonly = 1;
+ continue;
+
+ case O(ASSEMBLE,'U'): /* update the superblock */
+ case O(MISC,'U'):
+ if (c.update) {
+ pr_err("Can only update one aspect of superblock, both %s and %s given.\n",
+ c.update, optarg);
+ exit(2);
+ }
+ if (mode == MISC && !c.subarray) {
+ pr_err("Only subarrays can be updated in misc mode\n");
+ exit(2);
+ }
+ c.update = optarg;
+ if (strcmp(c.update, "sparc2.2") == 0)
+ continue;
+ if (strcmp(c.update, "super-minor") == 0)
+ continue;
+ if (strcmp(c.update, "summaries") == 0)
+ continue;
+ if (strcmp(c.update, "resync") == 0)
+ continue;
+ if (strcmp(c.update, "uuid") == 0)
+ continue;
+ if (strcmp(c.update, "name") == 0)
+ continue;
+ if (strcmp(c.update, "homehost") == 0)
+ continue;
+ if (strcmp(c.update, "home-cluster") == 0)
+ continue;
+ if (strcmp(c.update, "nodes") == 0)
+ continue;
+ if (strcmp(c.update, "devicesize") == 0)
+ continue;
+ if (strcmp(c.update, "bitmap") == 0)
+ continue;
+ if (strcmp(c.update, "no-bitmap") == 0)
+ continue;
+ if (strcmp(c.update, "bbl") == 0)
+ continue;
+ if (strcmp(c.update, "no-bbl") == 0)
+ continue;
+ if (strcmp(c.update, "force-no-bbl") == 0)
+ continue;
+ if (strcmp(c.update, "ppl") == 0)
+ continue;
+ if (strcmp(c.update, "no-ppl") == 0)
+ continue;
+ if (strcmp(c.update, "metadata") == 0)
+ continue;
+ if (strcmp(c.update, "revert-reshape") == 0)
+ continue;
+ if (strcmp(c.update, "layout-original") == 0 ||
+ strcmp(c.update, "layout-alternate") == 0 ||
+ strcmp(c.update, "layout-unspecified") == 0)
+ continue;
+ if (strcmp(c.update, "byteorder") == 0) {
+ if (ss) {
+ pr_err("must not set metadata type with --update=byteorder.\n");
+ exit(2);
+ }
+ for(i = 0; !ss && superlist[i]; i++)
+ ss = superlist[i]->match_metadata_desc(
+ "0.swap");
+ if (!ss) {
+ pr_err("INTERNAL ERROR cannot find 0.swap\n");
+ exit(2);
+ }
+
+ continue;
+ }
+ if (strcmp(c.update,"?") == 0 ||
+ strcmp(c.update, "help") == 0) {
+ outf = stdout;
+ fprintf(outf, "%s: ", Name);
+ } else {
+ outf = stderr;
+ fprintf(outf,
+ "%s: '--update=%s' is invalid. ",
+ Name, c.update);
+ }
+ fprintf(outf, "Valid --update options are:\n"
+ " 'sparc2.2', 'super-minor', 'uuid', 'name', 'nodes', 'resync',\n"
+ " 'summaries', 'homehost', 'home-cluster', 'byteorder', 'devicesize',\n"
+ " 'bitmap', 'no-bitmap', 'metadata', 'revert-reshape'\n"
+ " 'bbl', 'no-bbl', 'force-no-bbl', 'ppl', 'no-ppl'\n"
+ " 'layout-original', 'layout-alternate', 'layout-unspecified'\n"
+ );
+ exit(outf == stdout ? 0 : 2);
+
+ case O(MANAGE,'U'):
+ /* update=devicesize is allowed with --re-add */
+ if (devmode != 'A') {
+ pr_err("--update in Manage mode only allowed with --re-add.\n");
+ exit(1);
+ }
+ if (c.update) {
+ pr_err("Can only update one aspect of superblock, both %s and %s given.\n",
+ c.update, optarg);
+ exit(2);
+ }
+ c.update = optarg;
+ if (strcmp(c.update, "devicesize") != 0 &&
+ strcmp(c.update, "bbl") != 0 &&
+ strcmp(c.update, "force-no-bbl") != 0 &&
+ strcmp(c.update, "no-bbl") != 0) {
+ pr_err("only 'devicesize', 'bbl', 'no-bbl', and 'force-no-bbl' can be updated with --re-add\n");
+ exit(2);
+ }
+ continue;
+
+ case O(INCREMENTAL,NoDegraded):
+ pr_err("--no-degraded is deprecated in Incremental mode\n");
+ case O(ASSEMBLE,NoDegraded): /* --no-degraded */
+ c.runstop = -1; /* --stop isn't allowed for --assemble,
+ * so we overload slightly */
+ continue;
+
+ case O(ASSEMBLE,'c'):
+ case O(ASSEMBLE,ConfigFile):
+ case O(INCREMENTAL, 'c'):
+ case O(INCREMENTAL, ConfigFile):
+ case O(MISC, 'c'):
+ case O(MISC, ConfigFile):
+ case O(MONITOR,'c'):
+ case O(MONITOR,ConfigFile):
+ case O(CREATE,ConfigFile):
+ if (configfile) {
+ pr_err("configfile cannot be set twice. Second value is %s.\n", optarg);
+ exit(2);
+ }
+ configfile = optarg;
+ set_conffile(configfile);
+ /* FIXME possibly check that config file exists. Even parse it */
+ continue;
+ case O(ASSEMBLE,'s'): /* scan */
+ case O(MISC,'s'):
+ case O(MONITOR,'s'):
+ case O(INCREMENTAL,'s'):
+ c.scan = 1;
+ continue;
+
+ case O(MONITOR,'m'): /* mail address */
+ case O(MONITOR,EMail):
+ if (mailaddr)
+ pr_err("only specify one mailaddress. %s ignored.\n",
+ optarg);
+ else
+ mailaddr = optarg;
+ continue;
+
+ case O(MONITOR,'p'): /* alert program */
+ case O(MONITOR,ProgramOpt): /* alert program */
+ if (program)
+ pr_err("only specify one alter program. %s ignored.\n",
+ optarg);
+ else
+ program = optarg;
+ continue;
+
+ case O(MONITOR,'r'): /* rebuild increments */
+ case O(MONITOR,Increment):
+ if (parse_num(&increments, optarg) != 0
+ || increments > 99 || increments < 1) {
+ pr_err("please specify positive integer between 1 and 99 as rebuild increments.\n");
+ exit(2);
+ }
+ continue;
+
+ case O(MONITOR,'d'): /* delay in seconds */
+ case O(GROW, 'd'):
+ case O(BUILD,'d'): /* delay for bitmap updates */
+ case O(CREATE,'d'):
+ if (c.delay)
+ pr_err("only specify delay once. %s ignored.\n", optarg);
+ else if (parse_num(&c.delay, optarg) != 0 || c.delay < 1) {
+ pr_err("invalid delay: %s\n", optarg);
+ exit(2);
+ }
+ continue;
+ case O(MONITOR,'f'): /* daemonise */
+ case O(MONITOR,Fork):
+ daemonise = 1;
+ continue;
+ case O(MONITOR,'i'): /* pid */
+ if (pidfile)
+ pr_err("only specify one pid file. %s ignored.\n",
+ optarg);
+ else
+ pidfile = optarg;
+ continue;
+ case O(MONITOR,'1'): /* oneshot */
+ oneshot = 1;
+ spare_sharing = 0;
+ continue;
+ case O(MONITOR,'t'): /* test */
+ c.test = 1;
+ continue;
+ case O(MONITOR,'y'): /* log messages to syslog */
+ openlog("mdadm", LOG_PID, SYSLOG_FACILITY);
+ dosyslog = 1;
+ continue;
+ case O(MONITOR, NoSharing):
+ spare_sharing = 0;
+ continue;
+
+ /* now the general management options. Some are applicable
+ * to other modes. None have arguments.
+ */
+ case O(GROW,'a'):
+ case O(GROW,Add):
+ case O(MANAGE,'a'):
+ case O(MANAGE,Add): /* add a drive */
+ devmode = 'a';
+ continue;
+ case O(MANAGE,AddSpare): /* add drive - never re-add */
+ devmode = 'S';
+ continue;
+ case O(MANAGE,AddJournal): /* add journal */
+ if (s.journaldisks && (s.level < 4 || s.level > 6)) {
+ pr_err("--add-journal is only supported for RAID level 4/5/6.\n");
+ exit(2);
+ }
+ devmode = 'j';
+ continue;
+ case O(MANAGE,ReAdd):
+ devmode = 'A';
+ continue;
+ case O(MANAGE,'r'): /* remove a drive */
+ case O(MANAGE,Remove):
+ devmode = 'r';
+ continue;
+ case O(MANAGE,'f'): /* set faulty */
+ case O(MANAGE,Fail):
+ case O(INCREMENTAL,'f'):
+ case O(INCREMENTAL,Remove):
+ case O(INCREMENTAL,Fail): /* r for incremental is taken, use f
+ * even though we will both fail and
+ * remove the device */
+ devmode = 'f';
+ continue;
+ case O(MANAGE, ClusterConfirm):
+ devmode = 'c';
+ continue;
+ case O(MANAGE,Replace):
+ /* Mark these devices for replacement */
+ devmode = 'R';
+ continue;
+ case O(MANAGE,With):
+ /* These are the replacements to use */
+ if (devmode != 'R') {
+ pr_err("--with must follow --replace\n");
+ exit(2);
+ }
+ devmode = 'W';
+ continue;
+ case O(INCREMENTAL,'R'):
+ case O(MANAGE,'R'):
+ case O(ASSEMBLE,'R'):
+ case O(BUILD,'R'):
+ case O(CREATE,'R'): /* Run the array */
+ if (c.runstop < 0) {
+ pr_err("Cannot both Stop and Run an array\n");
+ exit(2);
+ }
+ c.runstop = 1;
+ continue;
+ case O(MANAGE,'S'):
+ if (c.runstop > 0) {
+ pr_err("Cannot both Run and Stop an array\n");
+ exit(2);
+ }
+ c.runstop = -1;
+ continue;
+ case O(MANAGE,'t'):
+ c.test = 1;
+ continue;
+
+ case O(MISC,'Q'):
+ case O(MISC,'D'):
+ case O(MISC,'E'):
+ case O(MISC,KillOpt):
+ case O(MISC,'R'):
+ case O(MISC,'S'):
+ case O(MISC,'X'):
+ case O(MISC, ExamineBB):
+ case O(MISC,'o'):
+ case O(MISC,'w'):
+ case O(MISC,'W'):
+ case O(MISC, WaitOpt):
+ case O(MISC, Waitclean):
+ case O(MISC, DetailPlatform):
+ case O(MISC, KillSubarray):
+ case O(MISC, UpdateSubarray):
+ case O(MISC, Dump):
+ case O(MISC, Restore):
+ case O(MISC ,Action):
+ if (opt == KillSubarray || opt == UpdateSubarray) {
+ if (c.subarray) {
+ pr_err("subarray can only be specified once\n");
+ exit(2);
+ }
+ c.subarray = optarg;
+ }
+ if (opt == Action) {
+ if (c.action) {
+ pr_err("Only one --action can be specified\n");
+ exit(2);
+ }
+ if (strcmp(optarg, "idle") == 0 ||
+ strcmp(optarg, "frozen") == 0 ||
+ strcmp(optarg, "check") == 0 ||
+ strcmp(optarg, "repair") == 0)
+ c.action = optarg;
+ else {
+ pr_err("action must be one of idle, frozen, check, repair\n");
+ exit(2);
+ }
+ }
+ if (devmode && devmode != opt &&
+ (devmode == 'E' ||
+ (opt == 'E' && devmode != 'Q'))) {
+ pr_err("--examine/-E cannot be given with ");
+ if (devmode == 'E') {
+ if (option_index >= 0)
+ fprintf(stderr, "--%s\n",
+ long_options[option_index].name);
+ else
+ fprintf(stderr, "-%c\n", opt);
+ } else if (isalpha(devmode))
+ fprintf(stderr, "-%c\n", devmode);
+ else
+ fprintf(stderr, "previous option\n");
+ exit(2);
+ }
+ devmode = opt;
+ if (opt == Dump || opt == Restore) {
+ if (dump_directory != NULL) {
+ pr_err("dump/restore directory specified twice: %s and %s\n",
+ dump_directory, optarg);
+ exit(2);
+ }
+ dump_directory = optarg;
+ }
+ continue;
+ case O(MISC, UdevRules):
+ if (devmode && devmode != opt) {
+ pr_err("--udev-rules must be the only option.\n");
+ } else {
+ if (udev_filename)
+ pr_err("only specify one udev rule filename. %s ignored.\n",
+ optarg);
+ else
+ udev_filename = optarg;
+ }
+ devmode = opt;
+ continue;
+ case O(MISC,'t'):
+ c.test = 1;
+ continue;
+
+ case O(MISC, Sparc22):
+ if (devmode != 'E') {
+ pr_err("--sparc2.2 only allowed with --examine\n");
+ exit(2);
+ }
+ c.SparcAdjust = 1;
+ continue;
+
+ case O(ASSEMBLE,'b'): /* here we simply set the bitmap file */
+ case O(ASSEMBLE,Bitmap):
+ if (!optarg) {
+ pr_err("bitmap file needed with -b in --assemble mode\n");
+ exit(2);
+ }
+ if (strcmp(optarg, "internal") == 0 ||
+ strcmp(optarg, "clustered") == 0) {
+ pr_err("no need to specify --bitmap when assembling"
+ " arrays with internal or clustered bitmap\n");
+ continue;
+ }
+ bitmap_fd = open(optarg, O_RDWR);
+ if (!*optarg || bitmap_fd < 0) {
+ pr_err("cannot open bitmap file %s: %s\n", optarg, strerror(errno));
+ exit(2);
+ }
+ ident.bitmap_fd = bitmap_fd; /* for Assemble */
+ continue;
+
+ case O(ASSEMBLE, BackupFile):
+ case O(GROW, BackupFile):
+ /* Specify a file into which grow might place a backup,
+ * or from which assemble might recover a backup
+ */
+ if (c.backup_file) {
+ pr_err("backup file already specified, rejecting %s\n", optarg);
+ exit(2);
+ }
+ c.backup_file = optarg;
+ continue;
+
+ case O(GROW, Continue):
+ /* Continue interrupted grow
+ */
+ grow_continue = 1;
+ continue;
+ case O(ASSEMBLE, InvalidBackup):
+ /* Acknowledge that the backupfile is invalid, but ask
+ * to continue anyway
+ */
+ c.invalid_backup = 1;
+ continue;
+
+ case O(BUILD,'b'):
+ case O(BUILD,Bitmap):
+ case O(CREATE,'b'):
+ case O(CREATE,Bitmap): /* here we create the bitmap */
+ case O(GROW,'b'):
+ case O(GROW,Bitmap):
+ if (s.bitmap_file) {
+ pr_err("bitmap cannot be set twice. Second value: %s.\n", optarg);
+ exit(2);
+ }
+ if (strcmp(optarg, "internal") == 0 ||
+ strcmp(optarg, "none") == 0 ||
+ strchr(optarg, '/') != NULL) {
+ s.bitmap_file = optarg;
+ continue;
+ }
+ if (strcmp(optarg, "clustered") == 0) {
+ s.bitmap_file = optarg;
+ /* Set the default number of cluster nodes
+ * to 4 if not already set by user
+ */
+ if (c.nodes < 1)
+ c.nodes = 4;
+ continue;
+ }
+ /* probable typo */
+ pr_err("bitmap file must contain a '/', or be 'internal', or be 'clustered', or 'none'\n"
+ " not '%s'\n", optarg);
+ exit(2);
+
+ case O(GROW,BitmapChunk):
+ case O(BUILD,BitmapChunk):
+ case O(CREATE,BitmapChunk): /* bitmap chunksize */
+ s.bitmap_chunk = parse_size(optarg);
+ if (s.bitmap_chunk == 0 ||
+ s.bitmap_chunk == INVALID_SECTORS ||
+ s.bitmap_chunk & (s.bitmap_chunk - 1)) {
+ pr_err("invalid bitmap chunksize: %s\n",
+ optarg);
+ exit(2);
+ }
+ s.bitmap_chunk = s.bitmap_chunk * 512;
+ continue;
+
+ case O(GROW, WriteBehind):
+ case O(BUILD, WriteBehind):
+ case O(CREATE, WriteBehind):
+ s.write_behind = DEFAULT_MAX_WRITE_BEHIND;
+ if (parse_num(&s.write_behind, optarg) != 0 ||
+ s.write_behind < 0 || s.write_behind > 16383) {
+ pr_err("Invalid value for maximum outstanding write-behind writes: %s.\n\tMust be between 0 and 16383.\n",
+ optarg);
+ exit(2);
+ }
+ continue;
+ case O(INCREMENTAL, 'r'):
+ case O(INCREMENTAL, RebuildMapOpt):
+ rebuild_map = 1;
+ continue;
+ case O(INCREMENTAL, IncrementalPath):
+ remove_path = optarg;
+ continue;
+ case O(CREATE, WriteJournal):
+ if (s.journaldisks) {
+ pr_err("Please specify only one journal device for the array.\n");
+ pr_err("Ignoring --write-journal %s...\n", optarg);
+ continue;
+ }
+ dv = xmalloc(sizeof(*dv));
+ dv->devname = optarg;
+ dv->disposition = 'j'; /* WriteJournal */
+ dv->used = 0;
+ dv->next = NULL;
+ *devlistend = dv;
+ devlistend = &dv->next;
+ devs_found++;
+
+ s.journaldisks = 1;
+ continue;
+ case O(CREATE, 'k'):
+ case O(GROW, 'k'):
+ s.consistency_policy = map_name(consistency_policies,
+ optarg);
+ if (s.consistency_policy < CONSISTENCY_POLICY_RESYNC) {
+ pr_err("Invalid consistency policy: %s\n",
+ optarg);
+ exit(2);
+ }
+ continue;
+ }
+ /* We have now processed all the valid options. Anything else is
+ * an error
+ */
+ if (option_index > 0)
+ pr_err(":option --%s not valid in %s mode\n",
+ long_options[option_index].name,
+ map_num(modes, mode));
+ else
+ pr_err("option -%c not valid in %s mode\n",
+ opt, map_num(modes, mode));
+ exit(2);
+
+ }
+
+ if (print_help) {
+ char *help_text;
+ if (print_help == 2)
+ help_text = OptionHelp;
+ else
+ help_text = mode_help[mode];
+ if (help_text == NULL)
+ help_text = Help;
+ fputs(help_text,stdout);
+ exit(0);
+ }
+
+ if (s.journaldisks) {
+ if (s.level < 4 || s.level > 6) {
+ pr_err("--write-journal is only supported for RAID level 4/5/6.\n");
+ exit(2);
+ }
+ if (s.consistency_policy != CONSISTENCY_POLICY_UNKNOWN &&
+ s.consistency_policy != CONSISTENCY_POLICY_JOURNAL) {
+ pr_err("--write-journal is not supported with consistency policy: %s\n",
+ map_num(consistency_policies, s.consistency_policy));
+ exit(2);
+ }
+ }
+
+ if (mode == CREATE &&
+ s.consistency_policy != CONSISTENCY_POLICY_UNKNOWN) {
+ if (s.level <= 0) {
+ pr_err("--consistency-policy not meaningful with level %s.\n",
+ map_num(pers, s.level));
+ exit(2);
+ } else if (s.consistency_policy == CONSISTENCY_POLICY_JOURNAL &&
+ !s.journaldisks) {
+ pr_err("--write-journal is required for consistency policy: %s\n",
+ map_num(consistency_policies, s.consistency_policy));
+ exit(2);
+ } else if (s.consistency_policy == CONSISTENCY_POLICY_PPL &&
+ s.level != 5) {
+ pr_err("PPL consistency policy is only supported for RAID level 5.\n");
+ exit(2);
+ } else if (s.consistency_policy == CONSISTENCY_POLICY_BITMAP &&
+ (!s.bitmap_file ||
+ strcmp(s.bitmap_file, "none") == 0)) {
+ pr_err("--bitmap is required for consistency policy: %s\n",
+ map_num(consistency_policies, s.consistency_policy));
+ exit(2);
+ } else if (s.bitmap_file &&
+ strcmp(s.bitmap_file, "none") != 0 &&
+ s.consistency_policy != CONSISTENCY_POLICY_BITMAP &&
+ s.consistency_policy != CONSISTENCY_POLICY_JOURNAL) {
+ pr_err("--bitmap is not compatible with consistency policy: %s\n",
+ map_num(consistency_policies, s.consistency_policy));
+ exit(2);
+ }
+ }
+
+ if (!mode && devs_found) {
+ mode = MISC;
+ devmode = 'Q';
+ if (devlist->disposition == 0)
+ devlist->disposition = devmode;
+ }
+ if (!mode) {
+ fputs(Usage, stderr);
+ exit(2);
+ }
+
+ if (symlinks) {
+ struct createinfo *ci = conf_get_create_info();
+
+ if (strcasecmp(symlinks, "yes") == 0)
+ ci->symlinks = 1;
+ else if (strcasecmp(symlinks, "no") == 0)
+ ci->symlinks = 0;
+ else {
+ pr_err("option --symlinks must be 'no' or 'yes'\n");
+ exit(2);
+ }
+ }
+ /* Ok, got the option parsing out of the way
+ * hopefully it's mostly right but there might be some stuff
+ * missing
+ *
+ * That is mostly checked in the per-mode stuff but...
+ *
+ * For @,B,C and A without -s, the first device listed must be
+ * an md device. We check that here and open it.
+ */
+
+ if (mode == MANAGE || mode == BUILD || mode == CREATE ||
+ mode == GROW || (mode == ASSEMBLE && ! c.scan)) {
+ if (devs_found < 1) {
+ pr_err("an md device must be given in this mode\n");
+ exit(2);
+ }
+ if ((int)ident.super_minor == -2 && c.autof) {
+ pr_err("--super-minor=dev is incompatible with --auto\n");
+ exit(2);
+ }
+ if (mode == MANAGE || mode == GROW) {
+ mdfd = open_mddev(devlist->devname, 1);
+ if (mdfd < 0)
+ exit(1);
+ } else {
+ char *bname = basename(devlist->devname);
+
+ if (strlen(bname) > MD_NAME_MAX) {
+ pr_err("Name %s is too long.\n", devlist->devname);
+ exit(1);
+ }
+ /* non-existent device is OK */
+ mdfd = open_mddev(devlist->devname, 0);
+ }
+ if (mdfd == -2) {
+ pr_err("device %s exists but is not an md array.\n", devlist->devname);
+ exit(1);
+ }
+ if ((int)ident.super_minor == -2) {
+ struct stat stb;
+ if (mdfd < 0) {
+ pr_err("--super-minor=dev given, and listed device %s doesn't exist.\n",
+ devlist->devname);
+ exit(1);
+ }
+ fstat(mdfd, &stb);
+ ident.super_minor = minor(stb.st_rdev);
+ }
+ if (mdfd >= 0 && mode != MANAGE && mode != GROW) {
+ /* We don't really want this open yet, we just might
+ * have wanted to check some things
+ */
+ close(mdfd);
+ mdfd = -1;
+ }
+ }
+
+ if (s.raiddisks) {
+ if (s.raiddisks == 1 && !c.force && s.level != LEVEL_FAULTY) {
+ pr_err("'1' is an unusual number of drives for an array, so it is probably\n"
+ " a mistake. If you really mean it you will need to specify --force before\n"
+ " setting the number of drives.\n");
+ exit(2);
+ }
+ }
+
+ if (c.homehost == NULL && c.require_homehost)
+ c.homehost = conf_get_homehost(&c.require_homehost);
+ if (c.homehost == NULL || strcasecmp(c.homehost, "<system>") == 0) {
+ if (gethostname(sys_hostname, sizeof(sys_hostname)) == 0) {
+ sys_hostname[sizeof(sys_hostname)-1] = 0;
+ c.homehost = sys_hostname;
+ }
+ }
+ if (c.homehost &&
+ (!c.homehost[0] || strcasecmp(c.homehost, "<none>") == 0)) {
+ c.homehost = NULL;
+ c.require_homehost = 0;
+ }
+
+ rv = 0;
+
+ set_hooks(); /* set hooks from libs */
+
+ if (c.homecluster == NULL && (c.nodes > 0)) {
+ c.homecluster = conf_get_homecluster();
+ if (c.homecluster == NULL)
+ rv = get_cluster_name(&c.homecluster);
+ if (rv) {
+ pr_err("The md can't get cluster name\n");
+ exit(1);
+ }
+ }
+
+ if (c.update && strcmp(c.update, "nodes") == 0 && c.nodes == 0) {
+ pr_err("Please specify nodes number with --nodes\n");
+ exit(1);
+ }
+
+ if (c.backup_file && data_offset != INVALID_SECTORS) {
+ pr_err("--backup-file and --data-offset are incompatible\n");
+ exit(2);
+ }
+
+ if ((mode == MISC && devmode == 'E') ||
+ (mode == MONITOR && spare_sharing == 0))
+ /* Anyone may try this */;
+ else if (geteuid() != 0) {
+ pr_err("must be super-user to perform this action\n");
+ exit(1);
+ }
+
+ ident.autof = c.autof;
+
+ if (c.scan && c.verbose < 2)
+ /* --scan implied --brief unless -vv */
+ c.brief = 1;
+
+ if (mode == CREATE) {
+ if (s.bitmap_file && strcmp(s.bitmap_file, "clustered") == 0) {
+ locked = cluster_get_dlmlock();
+ if (locked != 1)
+ exit(1);
+ }
+ } else if (mode == MANAGE || mode == GROW || mode == INCREMENTAL) {
+ if (!md_get_array_info(mdfd, &array) && (devmode != 'c')) {
+ if (array.state & (1 << MD_SB_CLUSTERED)) {
+ locked = cluster_get_dlmlock();
+ if (locked != 1)
+ exit(1);
+ }
+ }
+ }
+
+ switch(mode) {
+ case MANAGE:
+ /* readonly, add/remove, readwrite, runstop */
+ if (c.readonly > 0)
+ rv = Manage_ro(devlist->devname, mdfd, c.readonly);
+ if (!rv && devs_found>1)
+ rv = Manage_subdevs(devlist->devname, mdfd,
+ devlist->next, c.verbose, c.test,
+ c.update, c.force);
+ if (!rv && c.readonly < 0)
+ rv = Manage_ro(devlist->devname, mdfd, c.readonly);
+ if (!rv && c.runstop > 0)
+ rv = Manage_run(devlist->devname, mdfd, &c);
+ if (!rv && c.runstop < 0)
+ rv = Manage_stop(devlist->devname, mdfd, c.verbose, 0);
+ break;
+ case ASSEMBLE:
+ if (!c.scan && c.runstop == -1) {
+ pr_err("--no-degraded not meaningful without a --scan assembly.\n");
+ exit(1);
+ } else if (devs_found == 1 && ident.uuid_set == 0 &&
+ ident.super_minor == UnSet && ident.name[0] == 0 &&
+ !c.scan) {
+ /* Only a device has been given, so get details from config file */
+ struct mddev_ident *array_ident = conf_get_ident(devlist->devname);
+ if (array_ident == NULL) {
+ pr_err("%s not identified in config file.\n",
+ devlist->devname);
+ rv |= 1;
+ if (mdfd >= 0)
+ close(mdfd);
+ } else {
+ if (array_ident->autof == 0)
+ array_ident->autof = c.autof;
+ rv |= Assemble(ss, devlist->devname, array_ident,
+ NULL, &c);
+ }
+ } else if (!c.scan)
+ rv = Assemble(ss, devlist->devname, &ident,
+ devlist->next, &c);
+ else if (devs_found > 0) {
+ if (c.update && devs_found > 1) {
+ pr_err("can only update a single array at a time\n");
+ exit(1);
+ }
+ if (c.backup_file && devs_found > 1) {
+ pr_err("can only assemble a single array when providing a backup file.\n");
+ exit(1);
+ }
+ for (dv = devlist; dv; dv = dv->next) {
+ struct mddev_ident *array_ident = conf_get_ident(dv->devname);
+ if (array_ident == NULL) {
+ pr_err("%s not identified in config file.\n",
+ dv->devname);
+ rv |= 1;
+ continue;
+ }
+ if (array_ident->autof == 0)
+ array_ident->autof = c.autof;
+ rv |= Assemble(ss, dv->devname, array_ident,
+ NULL, &c);
+ }
+ } else {
+ if (c.update) {
+ pr_err("--update not meaningful with a --scan assembly.\n");
+ exit(1);
+ }
+ if (c.backup_file) {
+ pr_err("--backup_file not meaningful with a --scan assembly.\n");
+ exit(1);
+ }
+ rv = scan_assemble(ss, &c, &ident);
+ }
+
+ break;
+ case BUILD:
+ if (c.delay == 0)
+ c.delay = DEFAULT_BITMAP_DELAY;
+ if (s.write_behind && !s.bitmap_file) {
+ pr_err("write-behind mode requires a bitmap.\n");
+ rv = 1;
+ break;
+ }
+ if (s.raiddisks == 0) {
+ pr_err("no raid-devices specified.\n");
+ rv = 1;
+ break;
+ }
+
+ if (s.bitmap_file) {
+ if (strcmp(s.bitmap_file, "internal") == 0 ||
+ strcmp(s.bitmap_file, "clustered") == 0) {
+ pr_err("'internal' and 'clustered' bitmaps not supported with --build\n");
+ rv |= 1;
+ break;
+ }
+ }
+ rv = Build(devlist->devname, devlist->next, &s, &c);
+ break;
+ case CREATE:
+ if (c.delay == 0)
+ c.delay = DEFAULT_BITMAP_DELAY;
+
+ if (c.nodes) {
+ if (!s.bitmap_file ||
+ strcmp(s.bitmap_file, "clustered") != 0) {
+ pr_err("--nodes argument only compatible with --bitmap=clustered\n");
+ rv = 1;
+ break;
+ }
+
+ if (s.level != 1 && s.level != 10) {
+ pr_err("--bitmap=clustered is currently supported with raid1/10 only\n");
+ rv = 1;
+ break;
+ }
+ if (s.level == 10 && !(is_near_layout_10(s.layout) || s.layout == UnSet)) {
+ pr_err("only near layout is supported with clustered raid10\n");
+ rv = 1;
+ break;
+ }
+ }
+
+ if (s.write_behind && !s.bitmap_file) {
+ pr_err("write-behind mode requires a bitmap.\n");
+ rv = 1;
+ break;
+ }
+ if (s.raiddisks == 0) {
+ pr_err("no raid-devices specified.\n");
+ rv = 1;
+ break;
+ }
+
+ rv = Create(ss, devlist->devname,
+ ident.name, ident.uuid_set ? ident.uuid : NULL,
+ devs_found-1, devlist->next,
+ &s, &c, data_offset);
+ break;
+ case MISC:
+ if (devmode == 'E') {
+ if (devlist == NULL && !c.scan) {
+ pr_err("No devices to examine\n");
+ exit(2);
+ }
+ if (devlist == NULL)
+ devlist = conf_get_devs();
+ if (devlist == NULL) {
+ pr_err("No devices listed in %s\n", configfile?configfile:DefaultConfFile);
+ exit(1);
+ }
+ rv = Examine(devlist, &c, ss);
+ } else if (devmode == DetailPlatform) {
+ rv = Detail_Platform(ss ? ss->ss : NULL, ss ? c.scan : 1,
+ c.verbose, c.export,
+ devlist ? devlist->devname : NULL);
+ } else if (devlist == NULL) {
+ if (devmode == 'S' && c.scan)
+ rv = stop_scan(c.verbose);
+ else if ((devmode == 'D' || devmode == Waitclean) &&
+ c.scan)
+ rv = misc_scan(devmode, &c);
+ else if (devmode == UdevRules)
+ rv = Write_rules(udev_filename);
+ else {
+ pr_err("No devices given.\n");
+ exit(2);
+ }
+ } else
+ rv = misc_list(devlist, &ident, dump_directory, ss, &c);
+ break;
+ case MONITOR:
+ if (!devlist && !c.scan) {
+ pr_err("Cannot monitor: need --scan or at least one device\n");
+ rv = 1;
+ break;
+ }
+ if (pidfile && !daemonise) {
+ pr_err("Cannot write a pid file when not in daemon mode\n");
+ rv = 1;
+ break;
+ }
+ if (c.delay == 0) {
+ c.delay = conf_get_monitor_delay();
+ if (!c.delay)
+ c.delay = 60;
+ }
+ rv = Monitor(devlist, mailaddr, program,
+ &c, daemonise, oneshot,
+ dosyslog, pidfile, increments,
+ spare_sharing);
+ break;
+
+ case GROW:
+ if (array_size > 0) {
+ /* alway impose array size first, independent of
+ * anything else
+ * Do not allow level or raid_disks changes at the
+ * same time as that can be irreversibly destructive.
+ */
+ struct mdinfo sra;
+ int err;
+ if (s.raiddisks || s.level != UnSet) {
+ pr_err("cannot change array size in same operation as changing raiddisks or level.\n"
+ " Change size first, then check that data is still intact.\n");
+ rv = 1;
+ break;
+ }
+ if (sysfs_init(&sra, mdfd, NULL)) {
+ rv = 1;
+ break;
+ }
+ if (array_size == MAX_SIZE)
+ err = sysfs_set_str(&sra, NULL, "array_size", "default");
+ else
+ err = sysfs_set_num(&sra, NULL, "array_size", array_size / 2);
+ if (err < 0) {
+ if (errno == E2BIG)
+ pr_err("--array-size setting is too large.\n");
+ else
+ pr_err("current kernel does not support setting --array-size\n");
+ rv = 1;
+ break;
+ }
+ }
+ if (devs_found > 1 && s.raiddisks == 0 && s.level == UnSet) {
+ /* must be '-a'. */
+ if (s.size > 0 || s.chunk ||
+ s.layout_str || s.bitmap_file) {
+ pr_err("--add cannot be used with other geometry changes in --grow mode\n");
+ rv = 1;
+ break;
+ }
+ for (dv = devlist->next; dv; dv = dv->next) {
+ rv = Grow_Add_device(devlist->devname, mdfd,
+ dv->devname);
+ if (rv)
+ break;
+ }
+ } else if (s.bitmap_file) {
+ if (s.size > 0 || s.raiddisks || s.chunk ||
+ s.layout_str || devs_found > 1) {
+ pr_err("--bitmap changes cannot be used with other geometry changes in --grow mode\n");
+ rv = 1;
+ break;
+ }
+ if (c.delay == 0)
+ c.delay = DEFAULT_BITMAP_DELAY;
+ rv = Grow_addbitmap(devlist->devname, mdfd, &c, &s);
+ } else if (grow_continue)
+ rv = Grow_continue_command(devlist->devname,
+ mdfd, c.backup_file,
+ c.verbose);
+ else if (s.size > 0 || s.raiddisks || s.layout_str ||
+ s.chunk != 0 || s.level != UnSet ||
+ data_offset != INVALID_SECTORS) {
+ rv = Grow_reshape(devlist->devname, mdfd,
+ devlist->next,
+ data_offset, &c, &s);
+ } else if (s.consistency_policy != CONSISTENCY_POLICY_UNKNOWN) {
+ rv = Grow_consistency_policy(devlist->devname, mdfd, &c, &s);
+ } else if (array_size == 0)
+ pr_err("no changes to --grow\n");
+ break;
+ case INCREMENTAL:
+ if (rebuild_map) {
+ RebuildMap();
+ }
+ if (c.scan) {
+ rv = 1;
+ if (devlist) {
+ pr_err("In --incremental mode, a device cannot be given with --scan.\n");
+ break;
+ }
+ if (c.runstop <= 0) {
+ pr_err("--incremental --scan meaningless without --run.\n");
+ break;
+ }
+ if (devmode == 'f') {
+ pr_err("--incremental --scan --fail not supported.\n");
+ break;
+ }
+ rv = IncrementalScan(&c, NULL);
+ }
+ if (!devlist) {
+ if (!rebuild_map && !c.scan) {
+ pr_err("--incremental requires a device.\n");
+ rv = 1;
+ }
+ break;
+ }
+ if (devmode == 'f') {
+ if (devlist->next) {
+ pr_err("'--incremental --fail' can only handle one device.\n");
+ rv = 1;
+ break;
+ }
+ rv = IncrementalRemove(devlist->devname, remove_path,
+ c.verbose);
+ } else
+ rv = Incremental(devlist, &c, ss);
+ break;
+ case AUTODETECT:
+ autodetect();
+ break;
+ }
+ if (locked)
+ cluster_release_dlmlock();
+ close_fd(&mdfd);
+ exit(rv);
+}
+
+/*
+ * Assemble the arrays described by the configuration file.
+ *
+ * Every configured array whose device name is not "<ignore>" is handed to
+ * Assemble(); the list is walked again for as long as a pass produces both
+ * successes and failures.  When no array was attempted at all and a
+ * homehost is set, Assemble() is then called repeatedly in auto-assemble
+ * mode.
+ *
+ * Returns 0 on success, 1 when the configuration is unusable or nothing was
+ * found, otherwise the OR of the Assemble() results of the final pass.
+ */
+static int scan_assemble(struct supertype *ss,
+			 struct context *c,
+			 struct mddev_ident *ident)
+{
+	struct mddev_ident *configured = conf_get_ident(NULL);
+	struct mddev_dev *conf_devs = conf_get_devs();
+	struct mddev_ident *entry;
+	struct map_ent *map = NULL;
+	int attempts = 0;
+	int status = 0;
+	int nfail, nok;
+
+	if (conf_verify_devnames(configured)) {
+		pr_err("Duplicate MD device names in conf file were found.\n");
+		return 1;
+	}
+	if (!conf_devs) {
+		pr_err("No devices listed in conf file were found.\n");
+		return 1;
+	}
+
+	/* Reset per-array state; arrays without their own "auto" setting
+	 * inherit the one from the command line context.
+	 */
+	entry = configured;
+	while (entry) {
+		entry->assembled = 0;
+		if (!entry->autof)
+			entry->autof = c->autof;
+		entry = entry->next;
+	}
+
+	/* A failed lock is reported but does not stop the assembly */
+	if (map_lock(&map) != 0)
+		pr_err("failed to get exclusive lock on mapfile\n");
+
+	do {
+		nfail = 0;
+		nok = 0;
+		status = 0;
+		for (entry = configured; entry; entry = entry->next) {
+			int r;
+
+			if (entry->assembled)
+				continue;
+			if (entry->devname &&
+			    strcasecmp(entry->devname, "<ignore>") == 0)
+				continue;
+
+			r = Assemble(ss, entry->devname,
+				     entry, NULL, c);
+			status |= r;
+			attempts++;
+			if (r) {
+				nfail++;
+			} else {
+				entry->assembled = 1;
+				nok++;
+			}
+		}
+		/* Go around again only while a pass both assembled
+		 * something and left something unassembled.
+		 */
+	} while (nfail > 0 && nok > 0);
+
+	if (attempts != 0 || !c->homehost) {
+		if (attempts == 0 && status == 0) {
+			pr_err("No arrays found in config file\n");
+			status = 1;
+		}
+	} else {
+		/* Nothing was attempted from the config file: keep calling
+		 * Assemble in auto-assemble mode until it returns 2.
+		 */
+		int r;
+		int found;
+
+		ident->autof = c->autof;
+		do {
+			struct mddev_dev *candidates = conf_get_devs();
+
+			found = 0;
+			do {
+				r = Assemble(ss, NULL,
+					     ident,
+					     candidates, c);
+				if (r == 0) {
+					attempts++;
+					found++;
+				}
+			} while (r != 2);
+			/* Stacked devices may only become visible after the
+			 * previous round, so repeat while anything was found.
+			 */
+		} while (found);
+
+		if (attempts) {
+			status = 0;
+		} else if (status == 0) {
+			pr_err("No arrays found in config file or automatically\n");
+			status = 1;
+		}
+	}
+
+	map_unlock(&map);
+	return status;
+}
+
+/*
+ * Apply --detail (devmode 'D') or --wait-clean (any other devmode) to
+ * every array listed by mdstat_read().
+ *
+ * Two passes are made over the list: the first handles arrays whose
+ * metadata_version does not start with "external:/", the second handles
+ * those where it does.
+ *
+ * Returns the OR of the Detail()/WaitClean() results; an array for which
+ * no device file can be found is reported but does not change the result.
+ */
+static int misc_scan(char devmode, struct context *c)
+{
+	struct mdstat_ent *ms = mdstat_read(0, 1);
+	struct mdstat_ent *e;
+	struct map_ent *map = NULL;
+	int members;
+	int rv = 0;
+
+	for (members = 0; members <= 1; members++) {
+		for (e = ms; e; e = e->next) {
+			char *name = NULL;
+			struct map_ent *me;
+			struct stat stb;
+			int member = e->metadata_version &&
+				strncmp(e->metadata_version,
+					"external:/", 10) == 0;
+
+			if (members != member)
+				continue;
+
+			/* Prefer the path recorded in the map, but fall back
+			 * to get_md_name() if it is missing, "/unknown", or
+			 * cannot be stat()ed.
+			 */
+			me = map_by_devnm(&map, e->devnm);
+			if (me && me->path && strcmp(me->path, "/unknown") != 0)
+				name = me->path;
+			if (name == NULL || stat(name, &stb) != 0)
+				name = get_md_name(e->devnm);
+
+			if (!name) {
+				pr_err("cannot find device file for %s\n",
+				       e->devnm);
+			} else {
+				if (devmode == 'D')
+					rv |= Detail(name, c);
+				else
+					rv |= WaitClean(name, c->verbose);
+				put_md_name(name);
+			}
+
+			/* Drop the map on every path, including the
+			 * "no device file" one, so it is not left
+			 * allocated when the scan ends.  'name' may point
+			 * at me->path, so this must come after its last use.
+			 */
+			map_free(map);
+			map = NULL;
+		}
+	}
+	free_mdstat(ms);
+	return rv;
+}
+
+/*
+ * Apply --stop to every array listed by mdstat_read().
+ *
+ * Because arrays may be stacked, the list is re-read and walked again
+ * for as long as a pass had failures.  The first pass that stops nothing
+ * is followed by one final pass, in which Manage_stop() is called with
+ * its last argument set to 0 instead of 1.
+ *
+ * Returns 1 if the last pass had any Manage_stop() failure, else 0.
+ */
+static int stop_scan(int verbose)
+{
+	int made_progress = 1;
+	int final_pass = 0;
+	int failed;
+
+	do {
+		struct mdstat_ent *list = mdstat_read(0, 0);
+		struct mdstat_ent *ent;
+
+		/* The previous pass stopped nothing: this is the last try */
+		if (made_progress == 0)
+			final_pass = 1;
+		made_progress = 0;
+		failed = 0;
+
+		for (ent = list; ent != NULL; ent = ent->next) {
+			char *path = get_md_name(ent->devnm);
+			int fd;
+
+			if (path == NULL) {
+				pr_err("cannot find device file for %s\n",
+				       ent->devnm);
+				continue;
+			}
+
+			fd = open_mddev(path, 1);
+			if (fd < 0) {
+				/* Could not open: counts neither way */
+				put_md_name(path);
+				continue;
+			}
+
+			if (Manage_stop(path, fd, verbose, !final_pass) == 0)
+				made_progress = 1;
+			else
+				failed = 1;
+			close(fd);
+			put_md_name(path);
+		}
+		free_mdstat(list);
+	} while (!final_pass && failed);
+
+	return failed ? 1 : 0;
+}
+
+/*
+ * Run the per-device MISC-mode operation selected by each entry's
+ * 'disposition' over the given device list.
+ *
+ * Operations that work from the device name alone are dispatched first.
+ * The remaining ones ('R', 'S', 'o', 'w') need the array opened, so the
+ * device is opened and the operation is applied to the descriptor.
+ *
+ * Returns the OR of all individual results.  Once bit 16 is set in that
+ * accumulated value, the remaining devices are not processed.
+ */
+static int misc_list(struct mddev_dev *devlist,
+		     struct mddev_ident *ident,
+		     char *dump_directory,
+		     struct supertype *ss, struct context *c)
+{
+	struct mddev_dev *cur;
+	int status = 0;
+
+	for (cur = devlist; cur; cur = (status & 16) ? NULL : cur->next) {
+		int fd;
+
+		switch(cur->disposition) {
+		case 'D':
+			status |= Detail(cur->devname, c);
+			continue;
+		case KillOpt: /* Zero superblock */
+			if (!ss) {
+				/* No metadata type given: call Kill until the
+				 * accumulated status is non-zero, passing -1
+				 * as verbosity after the first call, then
+				 * clear bit 4 of the status.
+				 */
+				int verbosity = c->verbose;
+
+				do {
+					status |= Kill(cur->devname, NULL, c->force, verbosity, 0);
+					verbosity = -1;
+				} while (status == 0);
+				status &= ~4;
+			} else {
+				status |= Kill(cur->devname, ss, c->force, c->verbose,0);
+			}
+			continue;
+		case 'Q':
+			status |= Query(cur->devname);
+			continue;
+		case 'X':
+			status |= ExamineBitmap(cur->devname, c->brief, ss);
+			continue;
+		case ExamineBB:
+			status |= ExamineBadblocks(cur->devname, c->brief, ss);
+			continue;
+		case 'W':
+		case WaitOpt:
+			status |= Wait(cur->devname);
+			continue;
+		case Waitclean:
+			status |= WaitClean(cur->devname, c->verbose);
+			continue;
+		case KillSubarray:
+			status |= Kill_subarray(cur->devname, c->subarray, c->verbose);
+			continue;
+		case UpdateSubarray:
+			if (c->update != NULL) {
+				status |= Update_subarray(cur->devname, c->subarray,
+							  c->update, ident, c->verbose);
+			} else {
+				pr_err("-U/--update must be specified with --update-subarray\n");
+				status |= 1;
+			}
+			continue;
+		case Dump:
+			status |= Dump_metadata(cur->devname, dump_directory, c, ss);
+			continue;
+		case Restore:
+			/* Last argument is true only when exactly one
+			 * device was listed.
+			 */
+			status |= Restore_metadata(cur->devname, dump_directory, c, ss,
+						   (cur == devlist && cur->next == NULL));
+			continue;
+		case Action:
+			status |= SetAction(cur->devname, c->action);
+			continue;
+		}
+
+		/* Names that do not start with '/' are tried with open_dev()
+		 * first; everything else, and any failure, goes through
+		 * open_mddev().
+		 */
+		fd = (cur->devname[0] == '/') ? -1 : open_dev(cur->devname);
+		if (fd < 0)
+			fd = open_mddev(cur->devname, 1);
+
+		if (fd < 0) {
+			status |= 1;
+			continue;
+		}
+
+		switch(cur->disposition) {
+		case 'R':
+			c->runstop = 1;
+			status |= Manage_run(cur->devname, fd, c);
+			break;
+		case 'S':
+			if (!c->scan) {
+				status |= Manage_stop(cur->devname, fd, c->verbose, 0);
+			} else {
+				pr_err("--stop not meaningful with both a --scan assembly and a device name.\n");
+				status |= 1;
+			}
+			break;
+		case 'o':
+			status |= Manage_ro(cur->devname, fd, 1);
+			break;
+		case 'w':
+			status |= Manage_ro(cur->devname, fd, -1);
+			break;
+		}
+		close(fd);
+	}
+	return status;
+}
+
+/*
+ * Write 'action' to the "sync_action" sysfs attribute of the array
+ * behind 'dev'.
+ *
+ * The device is opened read-only just long enough for sysfs_init() to
+ * fill in the array information; the descriptor is closed again before
+ * the attribute is written.
+ *
+ * Returns 0 on success, 1 (after printing an error) if the device cannot
+ * be opened, sysfs_init() fails, or the attribute cannot be set.
+ */
+int SetAction(char *dev, char *action)
+{
+	int fd = open(dev, O_RDONLY);
+	struct mdinfo mdi;
+	int retval;
+
+	if (fd < 0) {
+		pr_err("Couldn't open %s: %s\n", dev, strerror(errno));
+		return 1;
+	}
+	retval = sysfs_init(&mdi, fd, NULL);
+	close(fd);
+	if (retval) {
+		pr_err("%s is not an md array\n", dev);
+		return 1;
+	}
+
+	if (sysfs_set_str(&mdi, NULL, "sync_action", action) < 0) {
+		pr_err("Could not set action for %s to %s: %s\n",
+		       dev, action, strerror(errno));
+		return 1;
+	}
+	return 0;
+}
diff --git a/mdadm.conf-example b/mdadm.conf-example
new file mode 100644
index 0000000..35a75d1
--- /dev/null
+++ b/mdadm.conf-example
@@ -0,0 +1,65 @@
+# mdadm configuration file
+#
+# mdadm will function properly without the use of a configuration file,
+# but this file is useful for keeping track of arrays and member disks.
+# In general, a mdadm.conf file is created, and updated, after arrays
+# are created. This is the opposite behavior of /etc/raidtab which is
+# created prior to array construction.
+#
+#
+# the config file takes two types of lines:
+#
+# DEVICE lines specify a list of devices in which to look for
+# potential member disks
+#
+# ARRAY lines specify information about how to identify arrays
+# so that they can be activated
+#
+# You can have more than one device line and use wild cards. The first
+# example includes the first partition of SCSI disks /dev/sdb,
+# /dev/sdc, /dev/sdd, /dev/sdj, /dev/sdk, and /dev/sdl. The second
+# line looks for array slices on IDE disks.
+#
+#DEVICE /dev/sd[bcdjkl]1
+#DEVICE /dev/hda1 /dev/hdb1
+#
+# If you mount devfs on /dev, then a suitable way to list all devices is:
+#DEVICE /dev/discs/*/*
+#
+#
+# The AUTO line can control which arrays get assembled by auto-assembly,
+# meaning either "mdadm -As" when there are no 'ARRAY' lines in this file,
+# or "mdadm --incremental" when the array found is not listed in this file.
+# By default, all arrays that are found are assembled.
+# If you want to ignore all DDF arrays (maybe they are managed by dmraid),
+# and only assemble 1.x arrays which are marked for 'this' homehost,
+# but assemble all others, then use
+#AUTO -ddf homehost -1.x +all
+#
+# ARRAY lines specify an array to assemble and a method of identification.
+# Arrays can currently be identified by using a UUID, superblock minor number,
+# or a listing of devices.
+#
+# super-minor is usually the minor number of the metadevice
+# UUID is the Universally Unique Identifier for the array
+# Each can be obtained using
+#
+# mdadm -D <md>
+#
+#ARRAY /dev/md0 UUID=3aaa0122:29827cfa:5331ad66:ca767371
+#ARRAY /dev/md1 super-minor=1
+#ARRAY /dev/md2 devices=/dev/hda1,/dev/hdb1
+#
+# ARRAY lines can also specify a "spare-group" for each array. mdadm --monitor
+# will then move a spare between arrays in a spare-group if one array has a failed
+# drive but no spare
+#ARRAY /dev/md4 uuid=b23f3c6d:aec43a9f:fd65db85:369432df spare-group=group1
+#ARRAY /dev/md5 uuid=19464854:03f71b1b:e0df2edd:246cc977 spare-group=group1
+#
+# When used in --follow (aka --monitor) mode, mdadm needs a
+# mail address and/or a program. This can be given with "mailaddr"
+# and "program" lines so that monitoring can be started using
+# mdadm --follow --scan & echo $! > /run/mdadm/mon.pid
+# If the lines are not found, mdadm will exit quietly
+#MAILADDR root@mydomain.tld
+#PROGRAM /usr/sbin/handle-mdadm-events
diff --git a/mdadm.conf.5 b/mdadm.conf.5
new file mode 100644
index 0000000..74a21c5
--- /dev/null
+++ b/mdadm.conf.5
@@ -0,0 +1,706 @@
+.\" Copyright Neil Brown and others.
+.\" This program is free software; you can redistribute it and/or modify
+.\" it under the terms of the GNU General Public License as published by
+.\" the Free Software Foundation; either version 2 of the License, or
+.\" (at your option) any later version.
+.\" See file COPYING in distribution for details.
+.TH MDADM.CONF 5
+.SH NAME
+mdadm.conf \- configuration for management of Software RAID with mdadm
+.SH SYNOPSIS
+/etc/mdadm.conf
+.SH DESCRIPTION
+.PP
+.I mdadm
+is a tool for creating, managing, and monitoring RAID devices using the
+.B md
+driver in Linux.
+.PP
+Some common tasks, such as assembling all arrays, can be simplified
+by describing the devices and arrays in this configuration file.
+
+.SS SYNTAX
+The file should be seen as a collection of words separated by white
+space (space, tab, or newline).
+Any word that begins with a hash sign (#) starts a comment and that
+word together with the remainder of the line is ignored.
+
+Spaces can be included in a word using quotation characters. Either
+single quotes
+.RB ( ' )
+or double quotes (\fB"\fP)
+may be used. All the characters from one quotation character to the
+next identical character are protected and will not be used to
+separate words or to start new quoted strings. To include a single quote
+it must be between double quotes. To include a double quote it must
+be between single quotes.
+
+Any line that starts with white space (space or tab) is treated as
+though it were a continuation of the previous line.
+
+Empty lines are ignored, but otherwise each (non continuation) line
+must start with a keyword as listed below. The keywords are case
+insensitive and can be abbreviated to 3 characters.
+
+The keywords are:
+.TP
+.B DEVICE
+A
+.B device
+line lists the devices (whole devices or partitions) that might contain
+a component of an MD array. When looking for the components of an
+array,
+.I mdadm
+will scan these devices (or any devices listed on the command line).
+
+The
+.B device
+line may contain a number of different devices (separated by spaces)
+and each device name can contain wild cards as defined by
+.BR glob (7).
+
+Also, there may be several device lines present in the file.
+
+Alternatively, a
+.B device
+line can contain either or both of the words
+.B containers
+and
+.BR partitions .
+The word
+.B containers
+will cause
+.I mdadm
+to look for assembled CONTAINER arrays and include them as a source
+for assembling further arrays.
+
+The word
+.I partitions
+will cause
+.I mdadm
+to read
+.I /proc/partitions
+and include all devices and partitions found therein.
+.I mdadm
+does not use the names from
+.I /proc/partitions
+but only the major and minor device numbers. It scans
+.I /dev
+to find the name that matches the numbers.
+
+If no DEVICE line is present, then "DEVICE partitions containers" is assumed.
+
+For example:
+.IP
+DEVICE /dev/hda* /dev/hdc*
+.br
+DEV /dev/sd*
+.br
+DEVICE /dev/disk/by-path/pci*
+.br
+DEVICE partitions
+
+.TP
+.B ARRAY
+The ARRAY lines identify actual arrays. The second word on the line
+may be the name of the device where the array is normally
+assembled, such as
+.B /dev/md1
+or
+.BR /dev/md/backup .
+If the name does not start with a slash
+.RB (' / '),
+it is treated as being in
+.BR /dev/md/ .
+Alternately the word
+.B <ignore>
+(complete with angle brackets) can be given in which case any array
+which matches the rest of the line will never be automatically assembled.
+If no device name is given,
+.I mdadm
+will use various heuristics to determine an appropriate name.
+
+Subsequent words identify the array, or identify the array as a member
+of a group. If multiple identities are given,
+then a component device must match ALL identities to be considered a
+match. Each identity word has a tag, an equals sign, and some value.
+The tags are:
+.RS 4
+.TP
+.B uuid=
+The value should be a 128 bit uuid in hexadecimal, with punctuation
+interspersed if desired. This must match the uuid stored in the
+superblock.
+.TP
+.B name=
+The value should be a simple textual name as was given to
+.I mdadm
+when the array was created. This must match the name stored in the
+superblock on a device for that device to be included in the array.
+Not all superblock formats support names.
+.TP
+.B super\-minor=
+The value is an integer which indicates the minor number that was
+stored in the superblock when the array was created. When an array is
+created as /dev/mdX, then the minor number X is stored.
+.TP
+.B devices=
+The value is a comma separated list of device names or device name
+patterns.
+Only devices with names which match one entry in the list will be used
+to assemble the array. Note that the devices
+listed there must also be listed on a DEVICE line.
+.TP
+.B level=
+The value is a RAID level. This is not normally used to
+identify an array, but is supported so that the output of
+
+.B "mdadm \-\-examine \-\-scan"
+
+can be used directly in the configuration file.
+.TP
+.B num\-devices=
+The value is the number of devices in a complete active array. As with
+.B level=
+this is mainly for compatibility with the output of
+
+.BR "mdadm \-\-examine \-\-scan" .
+
+.TP
+.B spares=
+The value is a number of spare devices to expect the array to have.
+The sole use of this keyword and value is as follows:
+.B mdadm \-\-monitor
+will report an array if it is found to have fewer than this number of
+spares when
+.B \-\-monitor
+starts or when
+.B \-\-oneshot
+is used.
+
+.TP
+.B spare\-group=
+The value is a textual name for a group of arrays. All arrays with
+the same
+.B spare\-group
+name are considered to be part of the same group. The significance of
+a group of arrays is that
+.I mdadm
+will, when monitoring the arrays, move a spare drive from one array in
+a group to another array in that group if the first array had a failed
+or missing drive but no spare.
+
+.TP
+.B auto=
+This option is rarely needed with mdadm-3.0, particularly if used with
+the Linux kernel v2.6.28 or later.
+It tells
+.I mdadm
+whether to use partitionable arrays or non-partitionable arrays and,
+in the absence of
+.IR udev ,
+how many partition devices to create. From 2.6.28 all md array
+devices are partitionable, hence this option is not needed.
+
+The value of this option can be "yes" or "md" to indicate that a
+traditional, non-partitionable md array should be created, or "mdp",
+"part" or "partition" to indicate that a partitionable md array (only
+available in linux 2.6 and later) should be used. This latter set can
+also have a number appended to indicate how many partitions to create
+device files for, e.g.
+.BR auto=mdp5 .
+The default is 4.
+
+.TP
+.B bitmap=
+The option specifies a file in which a write-intent bitmap should be
+found. When assembling the array,
+.I mdadm
+will provide this file to the
+.B md
+driver as the bitmap file. This has the same function as the
+.B \-\-bitmap\-file
+option to
+.BR \-\-assemble .
+
+.TP
+.B metadata=
+Specify the metadata format that the array has. This is mainly
+recognised for compatibility with the output of
+.BR "mdadm \-Es" .
+
+.TP
+.B container=
+Specify that this array is a member array of some container. The
+value given can be either a path name in /dev, or a UUID of the
+container array.
+
+.TP
+.B member=
+Specify that this array is a member array of some container. Each
+type of container has some way to enumerate member arrays, often a
+simple sequence number. The value identifies which member of a
+container the array is. It will usually accompany a "container=" word.
+.RE
+
+.TP
+.B MAILADDR
+The
+.B mailaddr
+line gives an E-mail address that alerts should be
+sent to when
+.I mdadm
+is running in
+.B \-\-monitor
+mode (and was given the
+.B \-\-scan
+option). There should only be one
+.B MAILADDR
+line and it should have only one address. Any subsequent addresses
+are silently ignored.
+
+.TP
+.B MAILFROM
+The
+.B mailfrom
+line (which can only be abbreviated to at least 5 characters) gives an
+address to appear in the "From" address for alert mails. This can be
+useful if you want to explicitly set a domain, as the default from
+address is "root" with no domain. All words on this line are
+catenated with spaces to form the address.
+
+Note that this value cannot be set via the
+.I mdadm
+commandline. It is only settable via the config file.
+
+.TP
+.B PROGRAM
+The
+.B program
+line gives the name of a program to be run when
+.B "mdadm \-\-monitor"
+detects potentially interesting events on any of the arrays that it
+is monitoring. This program gets run with two or three arguments, they
+being the Event, the md device, and possibly the related component
+device.
+
+There should only be one
+.B program
+line and it should be given only one program.
+
+
+.TP
+.B CREATE
+The
+.B create
+line gives default values to be used when creating arrays, new members
+of arrays, and device entries for arrays.
+These include:
+
+.RS 4
+.TP
+.B owner=
+.TP
+.B group=
+These can give user/group ids or names to use instead of system
+defaults (root/wheel or root/disk).
+.TP
+.B mode=
+An octal file mode such as 0660 can be given to override the default
+of 0600.
+.TP
+.B auto=
+This corresponds to the
+.B \-\-auto
+flag to mdadm. Give
+.BR yes ,
+.BR md ,
+.BR mdp ,
+.B part
+\(em possibly followed by a number of partitions \(em to indicate how
+missing device entries should be created.
+
+.TP
+.B metadata=
+The name of the metadata format to use if none is explicitly given.
+This can be useful to impose a system-wide default of version-1 superblocks.
+
+.TP
+.B symlinks=no
+Normally when creating devices in
+.B /dev/md/
+.I mdadm
+will create a matching symlink from
+.B /dev/
+with a name starting
+.B md
+or
+.BR md_ .
+Give
+.B symlinks=no
+to suppress this symlink creation.
+
+.TP
+.B names=yes
+Since Linux 2.6.29 it has been possible to create
+.B md
+devices with a name like
+.B md_home
+rather than just a number, like
+.BR md3 .
+.I mdadm
+will use the numeric alternative by default as other tools that interact
+with md arrays may expect only numbers.
+If
+.B names=yes
+is given in
+.I mdadm.conf
+then
+.I mdadm
+will use a name when appropriate.
+If
+.B names=no
+is given, then non-numeric
+.I md
+device names will not be used even if the default changes in a future
+release of
+.IR mdadm .
+
+.TP
+.B bbl=no
+By default,
+.I mdadm
+will reserve space for a bad block list (bbl) on all devices
+included in or added to any array that supports them. Setting
+.B bbl=no
+will prevent this, so newly added devices will not have a bad
+block log.
+.RE
+
+.TP
+.B HOMEHOST
+The
+.B homehost
+line gives a default value for the
+.B \-\-homehost=
+option to mdadm. There should normally be only one other word on the line.
+It should either be a host name, or one of the special words
+.BR <system> ,
+.B <none>
+and
+.BR <ignore> .
+If
+.B <system>
+is given, then the
+.BR gethostname ( 2 )
+system call is used to get the host name. This is the default.
+
+If
+.B <ignore>
+is given, then a flag is set so that when arrays are being
+auto-assembled the checking of the recorded
+.I homehost
+is disabled.
+If
+.B <ignore>
+is given it is also possible to give an explicit name which will be
+used when creating arrays. This is the only case when there can be
+more than one other word on the
+.B HOMEHOST
+line. If there are other words, or other
+.B HOMEHOST
+lines, they are silently ignored.
+
+If
+.B <none>
+is given, then the default of using
+.BR gethostname ( 2 )
+is over-ridden and no homehost name is assumed.
+
+When arrays are created, this host name will be stored in the
+metadata. When arrays are assembled using auto-assembly, arrays which
+do not record the correct homehost name in their metadata will be
+assembled using a "foreign" name. A "foreign" name always ends with a
+digit string preceded by an underscore to differentiate it
+from any possible local name. e.g.
+.B /dev/md/1_1
+or
+.BR /dev/md/home_0 .
+.TP
+.B AUTO
+A list of names of metadata formats can be given, each preceded by a
+plus or minus sign. Also the word
+.I homehost
+is allowed as is
+.I all
+preceded by plus or minus sign.
+.I all
+is usually last.
+
+When
+.I mdadm
+is auto-assembling an array, either via
+.I \-\-assemble
+or
+.I \-\-incremental
+and it finds metadata of a given type, it checks that metadata type
+against those listed in this line. The first match wins, where
+.I all
+matches anything.
+If a match is found that was preceded by a plus sign, the auto
+assembly is allowed. If the match was preceded by a minus sign, the
+auto assembly is disallowed. If no match is found, the auto assembly
+is allowed.
+
+If the metadata indicates that the array was created for
+.I this
+host, and the word
+.I homehost
+appears before any other match, then the array is treated as a valid
+candidate for auto-assembly.
+
+This can be used to disable all auto-assembly (so that only arrays
+explicitly listed in mdadm.conf or on the command line are assembled),
+or to disable assembly of certain metadata types which might be
+handled by other software. It can also be used to disable assembly of
+all foreign arrays - normally such arrays are assembled but given a
+non-deterministic name in
+.BR /dev/md/ .
+
+The known metadata types are
+.BR 0.90 ,
+.BR 1.x ,
+.BR ddf ,
+.BR imsm .
+
+.B AUTO
+should be given at most once. Subsequent lines are silently ignored.
+Thus an earlier config file in a config directory will over-ride
+the setting in a later config file.
+
+.TP
+.B POLICY
+This is used to specify what automatic behavior is allowed on devices
+newly appearing in the system and provides a way of marking spares that can
+be moved to other arrays as well as the migration domains.
+.I Domain
+can be defined through a
+.I policy
+line by specifying a domain name for a number of paths from
+.BR /dev/disk/by-path/ .
+A device may belong to several domains. The domain of an array is a union
+of domains of all devices in that array. A spare can be automatically
+moved from one array to another if the set of the destination array's
+.I domains
+contains all the
+.I domains
+of the new disk or if both arrays have the same
+.IR spare-group .
+
+To update hot plug configuration it is necessary to execute
+.B mdadm \-\-udev\-rules
+command after changing the config file.
+
+Keywords used in the
+.I POLICY
+line and supported values are:
+
+.RS 4
+.TP
+.B domain=
+any arbitrary string
+.TP
+.B metadata=
+0.9 1.x ddf or imsm
+.TP
+.B path=
+file glob matching anything from
+.B /dev/disk/by-path
+.TP
+.B type=
+either
+.B disk
+or
+.BR part .
+.TP
+.B action=
+include, re-add, spare, spare-same-slot, or force-spare
+.TP
+.B auto=
+yes, no, or homehost.
+
+.P
+The
+.I action
+item determines the automatic behavior allowed for devices matching the
+.I path
+and
+.I type
+in the same line. If a device matches several lines with different
+.I actions
+then the most permissive will apply. The ordering of policy lines
+is irrelevant to the end result.
+.TP
+.B include
+allows adding a disk to an array if metadata on that disk matches that array
+.TP
+.B re\-add
+will include the device in the array if it appears to be a current member
+or a member that was recently removed and the array has a
+write-intent-bitmap to allow the
+.B re\-add
+functionality.
+.TP
+.B spare
+as above and additionally: if the device is bare it can
+become a spare if there is any array that it is a candidate for based
+on domains and metadata.
+.TP
+.B spare\-same\-slot
+as above and additionally if given slot was used by an array that went
+degraded recently and the device plugged in has no metadata then it will
+be automatically added to that array (or its container)
+.TP
+.B force\-spare
+as above and the disk will become a spare in remaining cases
+.RE
+
+.TP
+.B PART-POLICY
+This is similar to
+.B POLICY
+and accepts the same keyword assignments. It allows a consistent set
+of policies to be applied to each of the partitions of a device.
+
+A
+.B PART-POLICY
+line should set
+.I type=disk
+and identify the path to one or more disk devices. Each partition on
+these disks will be treated according to the
+.I action=
+setting from this line. If a
+.I domain
+is set in the line, then the domain associated with each partition will
+be based on the domain, but with
+.RB \(dq -part N\(dq
+appended, where N is the partition number for the partition that was
+found.
+
+.TP
+.B SYSFS
+The
+.B SYSFS
+line lists custom values of MD device's sysfs attributes which will be
+stored in sysfs after the array is assembled. Multiple lines are allowed and each
+line has to contain the uuid or the name of the device to which it relates.
+.RS 4
+.TP
+.B uuid=
+hexadecimal identifier of MD device. This has to match the uuid stored in the
+superblock.
+.TP
+.B name=
+name of the MD device as was given to
+.I mdadm
+when the array was created. It will be ignored if
+.B uuid
+is not empty.
+.RE
+
+.TP
+.B MONITORDELAY
+The
+.B monitordelay
+line gives a delay in seconds
+.I mdadm
+shall wait before polling md arrays
+when
+.I mdadm
+is running in
+.B \-\-monitor
+mode.
+.B \-d/\-\-delay
+command line argument takes precedence over the config file.
+
+.SH EXAMPLE
+DEVICE /dev/sd[bcdjkl]1
+.br
+DEVICE /dev/hda1 /dev/hdb1
+
+# /dev/md0 is known by its UUID.
+.br
+ARRAY /dev/md0 UUID=3aaa0122:29827cfa:5331ad66:ca767371
+.br
+# /dev/md1 contains all devices with a minor number of
+.br
+# 1 in the superblock.
+.br
+ARRAY /dev/md1 superminor=1
+.br
+# /dev/md2 is made from precisely these two devices
+.br
+ARRAY /dev/md2 devices=/dev/hda1,/dev/hdb1
+
+# /dev/md4 and /dev/md5 are a spare-group and spares
+.br
+# can be moved between them
+.br
+ARRAY /dev/md4 uuid=b23f3c6d:aec43a9f:fd65db85:369432df
+.br
+ spare\-group=group1
+.br
+ARRAY /dev/md5 uuid=19464854:03f71b1b:e0df2edd:246cc977
+.br
+ spare\-group=group1
+.br
+# /dev/md/home is created, if need be, as a partitionable md array
+.br
+# any spare device number is allocated.
+.br
+ARRAY /dev/md/home UUID=9187a482:5dde19d9:eea3cc4a:d646ab8b
+.br
+ auto=part
+.br
+# The name of this array contains a space.
+.br
+ARRAY /dev/md9 name='Data Storage'
+.sp
+POLICY domain=domain1 metadata=imsm path=pci-0000:00:1f.2-scsi-*
+.br
+ action=spare
+.br
+POLICY domain=domain1 metadata=imsm path=pci-0000:04:00.0-scsi-[01]*
+.br
+ action=include
+.br
+# One domain comprising devices attached to specified paths is defined.
+.br
+# Bare device matching first path will be made an imsm spare on hot plug.
+.br
+# If more than one array is created on devices belonging to domain1 and
+.br
+# one of them becomes degraded, then any imsm spare matching any path for
+.br
+# given domain name can be migrated.
+.br
+MAILADDR root@mydomain.tld
+.br
+PROGRAM /usr/sbin/handle\-mdadm\-events
+.br
+CREATE group=system mode=0640 auto=part\-8
+.br
+HOMEHOST <system>
+.br
+AUTO +1.x homehost \-all
+.br
+SYSFS name=/dev/md/raid5 group_thread_cnt=4 sync_speed_max=1000000
+.br
+SYSFS uuid=bead5eb6:31c17a27:da120ba2:7dfda40d group_thread_cnt=4
+sync_speed_max=1000000
+.br
+MONITORDELAY 60
+
+.SH SEE ALSO
+.BR mdadm (8),
+.BR md (4).