/* geom_raid3.c revision 153190 */
1133808Spjd/*- 2142727Spjd * Copyright (c) 2004-2005 Pawel Jakub Dawidek <pjd@FreeBSD.org> 3133808Spjd * All rights reserved. 4133808Spjd * 5133808Spjd * Redistribution and use in source and binary forms, with or without 6133808Spjd * modification, are permitted provided that the following conditions 7133808Spjd * are met: 8133808Spjd * 1. Redistributions of source code must retain the above copyright 9133808Spjd * notice, this list of conditions and the following disclaimer. 10133808Spjd * 2. Redistributions in binary form must reproduce the above copyright 11133808Spjd * notice, this list of conditions and the following disclaimer in the 12133808Spjd * documentation and/or other materials provided with the distribution. 13133808Spjd * 14133808Spjd * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND 15133808Spjd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 16133808Spjd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 17133808Spjd * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE 18133808Spjd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 19133808Spjd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 20133808Spjd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 21133808Spjd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 22133808Spjd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 23133808Spjd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 24133808Spjd * SUCH DAMAGE. 
25133808Spjd */ 26133808Spjd 27133808Spjd#include <sys/cdefs.h> 28133808Spjd__FBSDID("$FreeBSD: head/sbin/geom/class/raid3/geom_raid3.c 153190 2005-12-07 01:38:27Z pjd $"); 29133808Spjd 30133808Spjd#include <sys/param.h> 31133808Spjd#include <errno.h> 32133808Spjd#include <paths.h> 33133808Spjd#include <stdio.h> 34133808Spjd#include <stdlib.h> 35133808Spjd#include <stdint.h> 36133808Spjd#include <string.h> 37133808Spjd#include <strings.h> 38133808Spjd#include <assert.h> 39133808Spjd#include <libgeom.h> 40133808Spjd#include <geom/raid3/g_raid3.h> 41133808Spjd#include <core/geom.h> 42133808Spjd#include <misc/subr.h> 43133808Spjd 44133808Spjd 45133808Spjduint32_t lib_version = G_LIB_VERSION; 46133808Spjduint32_t version = G_RAID3_VERSION; 47133808Spjd 48133808Spjdstatic void raid3_main(struct gctl_req *req, unsigned f); 49133808Spjdstatic void raid3_clear(struct gctl_req *req); 50133808Spjdstatic void raid3_dump(struct gctl_req *req); 51133808Spjdstatic void raid3_label(struct gctl_req *req); 52133808Spjd 53133808Spjdstruct g_command class_commands[] = { 54143586Spjd { "clear", G_FLAG_VERBOSE, raid3_main, G_NULL_OPTS, 55143586Spjd "[-v] prov ..." 56143586Spjd }, 57133808Spjd { "configure", G_FLAG_VERBOSE, NULL, 58133808Spjd { 59133808Spjd { 'a', "autosync", NULL, G_TYPE_NONE }, 60133808Spjd { 'd', "dynamic", NULL, G_TYPE_NONE }, 61133808Spjd { 'h', "hardcode", NULL, G_TYPE_NONE }, 62133808Spjd { 'n', "noautosync", NULL, G_TYPE_NONE }, 63134124Spjd { 'r', "round_robin", NULL, G_TYPE_NONE }, 64134124Spjd { 'R', "noround_robin", NULL, G_TYPE_NONE }, 65134168Spjd { 'w', "verify", NULL, G_TYPE_NONE }, 66134168Spjd { 'W', "noverify", NULL, G_TYPE_NONE }, 67133808Spjd G_OPT_SENTINEL 68143586Spjd }, 69143586Spjd "[-adhnrRvwW] name" 70133808Spjd }, 71143586Spjd { "dump", 0, raid3_main, G_NULL_OPTS, 72143586Spjd "prov ..." 
73143586Spjd }, 74133808Spjd { "insert", G_FLAG_VERBOSE, NULL, 75133808Spjd { 76133808Spjd { 'h', "hardcode", NULL, G_TYPE_NONE }, 77133808Spjd { 'n', "number", NULL, G_TYPE_NUMBER }, 78133808Spjd G_OPT_SENTINEL 79143586Spjd }, 80143586Spjd "[-hv] <-n number> name prov" 81133808Spjd }, 82133808Spjd { "label", G_FLAG_VERBOSE, raid3_main, 83133808Spjd { 84133808Spjd { 'h', "hardcode", NULL, G_TYPE_NONE }, 85133808Spjd { 'n', "noautosync", NULL, G_TYPE_NONE }, 86134124Spjd { 'r', "round_robin", NULL, G_TYPE_NONE }, 87134168Spjd { 'w', "verify", NULL, G_TYPE_NONE }, 88133808Spjd G_OPT_SENTINEL 89143586Spjd }, 90143586Spjd "[-hnrvw] name prov prov prov ..." 91133808Spjd }, 92143586Spjd { "rebuild", G_FLAG_VERBOSE, NULL, G_NULL_OPTS, 93143586Spjd "[-v] name prov" 94143586Spjd }, 95133808Spjd { "remove", G_FLAG_VERBOSE, NULL, 96133808Spjd { 97133808Spjd { 'n', "number", NULL, G_TYPE_NUMBER }, 98133808Spjd G_OPT_SENTINEL 99143586Spjd }, 100143586Spjd "[-v] <-n number> name" 101133808Spjd }, 102133808Spjd { "stop", G_FLAG_VERBOSE, NULL, 103133808Spjd { 104133808Spjd { 'f', "force", NULL, G_TYPE_NONE }, 105133808Spjd G_OPT_SENTINEL 106143586Spjd }, 107143586Spjd "[-fv] name ..." 
108133808Spjd }, 109133808Spjd G_CMD_SENTINEL 110133808Spjd}; 111133808Spjd 112133808Spjdstatic int verbose = 0; 113133808Spjd 114133808Spjdstatic void 115133808Spjdraid3_main(struct gctl_req *req, unsigned flags) 116133808Spjd{ 117133808Spjd const char *name; 118133808Spjd 119133808Spjd if ((flags & G_FLAG_VERBOSE) != 0) 120133808Spjd verbose = 1; 121133808Spjd 122153190Spjd name = gctl_get_ascii(req, "verb"); 123133808Spjd if (name == NULL) { 124133808Spjd gctl_error(req, "No '%s' argument.", "verb"); 125133808Spjd return; 126133808Spjd } 127133808Spjd if (strcmp(name, "label") == 0) 128133808Spjd raid3_label(req); 129133808Spjd else if (strcmp(name, "clear") == 0) 130133808Spjd raid3_clear(req); 131133808Spjd else if (strcmp(name, "dump") == 0) 132133808Spjd raid3_dump(req); 133133808Spjd else 134133808Spjd gctl_error(req, "Unknown command: %s.", name); 135133808Spjd} 136133808Spjd 137133808Spjdstatic void 138133808Spjdraid3_label(struct gctl_req *req) 139133808Spjd{ 140133808Spjd struct g_raid3_metadata md; 141133808Spjd u_char sector[512]; 142133808Spjd const char *str; 143134420Spjd unsigned sectorsize, ssize; 144134420Spjd off_t mediasize, msize; 145153190Spjd int error, i, nargs, hardcode, noautosync, round_robin, verify; 146133808Spjd 147153190Spjd nargs = gctl_get_int(req, "nargs"); 148153190Spjd if (nargs < 4) { 149133808Spjd gctl_error(req, "Too few arguments."); 150133808Spjd return; 151133808Spjd } 152153190Spjd if (bitcount32(nargs - 2) != 1) { 153133808Spjd gctl_error(req, "Invalid number of components."); 154133808Spjd return; 155133808Spjd } 156133808Spjd 157133808Spjd strlcpy(md.md_magic, G_RAID3_MAGIC, sizeof(md.md_magic)); 158133808Spjd md.md_version = G_RAID3_VERSION; 159153190Spjd str = gctl_get_ascii(req, "arg0"); 160133808Spjd strlcpy(md.md_name, str, sizeof(md.md_name)); 161147947Spjd md.md_id = arc4random(); 162153190Spjd md.md_all = nargs - 1; 163133808Spjd md.md_mflags = 0; 164133808Spjd md.md_dflags = 0; 165139295Spjd md.md_genid = 0; 
166133808Spjd md.md_syncid = 1; 167133808Spjd md.md_sync_offset = 0; 168153190Spjd noautosync = gctl_get_int(req, "noautosync"); 169153190Spjd if (noautosync) 170133808Spjd md.md_mflags |= G_RAID3_DEVICE_FLAG_NOAUTOSYNC; 171153190Spjd round_robin = gctl_get_int(req, "round_robin"); 172153190Spjd if (round_robin) 173134124Spjd md.md_mflags |= G_RAID3_DEVICE_FLAG_ROUND_ROBIN; 174153190Spjd verify = gctl_get_int(req, "verify"); 175153190Spjd if (verify) 176134168Spjd md.md_mflags |= G_RAID3_DEVICE_FLAG_VERIFY; 177153190Spjd if (round_robin && verify) { 178134168Spjd gctl_error(req, "Both '%c' and '%c' options given.", 'r', 'w'); 179134168Spjd return; 180134168Spjd } 181153190Spjd hardcode = gctl_get_int(req, "hardcode"); 182133808Spjd 183133808Spjd /* 184133808Spjd * Calculate sectorsize by finding least common multiple from 185133808Spjd * sectorsizes of every disk and find the smallest mediasize. 186133808Spjd */ 187133808Spjd mediasize = 0; 188133808Spjd sectorsize = 0; 189153190Spjd for (i = 1; i < nargs; i++) { 190153190Spjd str = gctl_get_ascii(req, "arg%d", i); 191133808Spjd msize = g_get_mediasize(str); 192133808Spjd ssize = g_get_sectorsize(str); 193133808Spjd if (msize == 0 || ssize == 0) { 194133808Spjd gctl_error(req, "Can't get informations about %s: %s.", 195133808Spjd str, strerror(errno)); 196133808Spjd return; 197133808Spjd } 198133808Spjd msize -= ssize; 199133808Spjd if (mediasize == 0 || (mediasize > 0 && msize < mediasize)) 200133808Spjd mediasize = msize; 201133808Spjd if (sectorsize == 0) 202133808Spjd sectorsize = ssize; 203133808Spjd else 204133808Spjd sectorsize = g_lcm(sectorsize, ssize); 205133808Spjd } 206153190Spjd md.md_mediasize = mediasize * (nargs - 2); 207153190Spjd md.md_sectorsize = sectorsize * (nargs - 2); 208133808Spjd 209133808Spjd /* 210133808Spjd * Clear last sector first, to spoil all components if device exists. 
211133808Spjd */ 212153190Spjd for (i = 1; i < nargs; i++) { 213153190Spjd str = gctl_get_ascii(req, "arg%d", i); 214133808Spjd error = g_metadata_clear(str, NULL); 215133808Spjd if (error != 0) { 216133808Spjd gctl_error(req, "Can't store metadata on %s: %s.", str, 217133808Spjd strerror(error)); 218133808Spjd return; 219133808Spjd } 220133808Spjd } 221133808Spjd 222133808Spjd /* 223133808Spjd * Ok, store metadata (use disk number as priority). 224133808Spjd */ 225153190Spjd for (i = 1; i < nargs; i++) { 226153190Spjd str = gctl_get_ascii(req, "arg%d", i); 227142727Spjd msize = g_get_mediasize(str); 228142727Spjd ssize = g_get_sectorsize(str); 229142727Spjd if (mediasize < msize - ssize) { 230134420Spjd fprintf(stderr, 231134420Spjd "warning: %s: only %jd bytes from %jd bytes used.\n", 232142727Spjd str, (intmax_t)mediasize, (intmax_t)(msize - ssize)); 233134420Spjd } 234134420Spjd 235133808Spjd md.md_no = i - 1; 236142727Spjd md.md_provsize = msize; 237153190Spjd if (!hardcode) 238133808Spjd bzero(md.md_provider, sizeof(md.md_provider)); 239133808Spjd else { 240133808Spjd if (strncmp(str, _PATH_DEV, strlen(_PATH_DEV)) == 0) 241133808Spjd str += strlen(_PATH_DEV); 242133808Spjd strlcpy(md.md_provider, str, sizeof(md.md_provider)); 243133808Spjd } 244153190Spjd if (verify && md.md_no == md.md_all - 1) { 245134539Spjd /* 246134539Spjd * In "verify" mode, force synchronization of parity 247134539Spjd * component on start. 
248134539Spjd */ 249134539Spjd md.md_syncid = 0; 250134539Spjd } 251133808Spjd raid3_metadata_encode(&md, sector); 252133808Spjd error = g_metadata_store(str, sector, sizeof(sector)); 253133808Spjd if (error != 0) { 254133808Spjd fprintf(stderr, "Can't store metadata on %s: %s.\n", 255133808Spjd str, strerror(error)); 256133808Spjd gctl_error(req, "Not fully done."); 257133808Spjd continue; 258133808Spjd } 259133808Spjd if (verbose) 260133808Spjd printf("Metadata value stored on %s.\n", str); 261133808Spjd } 262133808Spjd} 263133808Spjd 264133808Spjdstatic void 265133808Spjdraid3_clear(struct gctl_req *req) 266133808Spjd{ 267133808Spjd const char *name; 268153190Spjd int error, i, nargs; 269133808Spjd 270153190Spjd nargs = gctl_get_int(req, "nargs"); 271153190Spjd if (nargs < 1) { 272133808Spjd gctl_error(req, "Too few arguments."); 273133808Spjd return; 274133808Spjd } 275133808Spjd 276153190Spjd for (i = 0; i < nargs; i++) { 277153190Spjd name = gctl_get_ascii(req, "arg%d", i); 278133808Spjd error = g_metadata_clear(name, G_RAID3_MAGIC); 279133808Spjd if (error != 0) { 280133808Spjd fprintf(stderr, "Can't clear metadata on %s: %s.\n", 281133808Spjd name, strerror(error)); 282133808Spjd gctl_error(req, "Not fully done."); 283133808Spjd continue; 284133808Spjd } 285133808Spjd if (verbose) 286133808Spjd printf("Metadata cleared on %s.\n", name); 287133808Spjd } 288133808Spjd} 289133808Spjd 290133808Spjdstatic void 291133808Spjdraid3_dump(struct gctl_req *req) 292133808Spjd{ 293133808Spjd struct g_raid3_metadata md, tmpmd; 294133808Spjd const char *name; 295153190Spjd int error, i, nargs; 296133808Spjd 297153190Spjd nargs = gctl_get_int(req, "nargs"); 298153190Spjd if (nargs < 1) { 299133808Spjd gctl_error(req, "Too few arguments."); 300133808Spjd return; 301133808Spjd } 302133808Spjd 303153190Spjd for (i = 0; i < nargs; i++) { 304153190Spjd name = gctl_get_ascii(req, "arg%d", i); 305133808Spjd error = g_metadata_read(name, (u_char *)&tmpmd, sizeof(tmpmd), 
306133808Spjd G_RAID3_MAGIC); 307133808Spjd if (error != 0) { 308133808Spjd fprintf(stderr, "Can't read metadata from %s: %s.\n", 309133808Spjd name, strerror(error)); 310133808Spjd gctl_error(req, "Not fully done."); 311133808Spjd continue; 312133808Spjd } 313133808Spjd if (raid3_metadata_decode((u_char *)&tmpmd, &md) != 0) { 314133808Spjd fprintf(stderr, "MD5 hash mismatch for %s, skipping.\n", 315133808Spjd name); 316133808Spjd gctl_error(req, "Not fully done."); 317133808Spjd continue; 318133808Spjd } 319133808Spjd printf("Metadata on %s:\n", name); 320133808Spjd raid3_metadata_dump(&md); 321133808Spjd printf("\n"); 322133808Spjd } 323133808Spjd} 324