1219974Smav/*- 2219974Smav * Copyright (c) 2011 Alexander Motin <mav@FreeBSD.org> 3234601Smav * Copyright (c) 2000 - 2008 S��ren Schmidt <sos@FreeBSD.org> 4219974Smav * All rights reserved. 5219974Smav * 6219974Smav * Redistribution and use in source and binary forms, with or without 7219974Smav * modification, are permitted provided that the following conditions 8219974Smav * are met: 9219974Smav * 1. Redistributions of source code must retain the above copyright 10219974Smav * notice, this list of conditions and the following disclaimer. 11219974Smav * 2. Redistributions in binary form must reproduce the above copyright 12219974Smav * notice, this list of conditions and the following disclaimer in the 13219974Smav * documentation and/or other materials provided with the distribution. 14219974Smav * 15219974Smav * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND 16219974Smav * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 17219974Smav * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 18219974Smav * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE 19219974Smav * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 20219974Smav * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 21219974Smav * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 22219974Smav * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 23219974Smav * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 24219974Smav * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 25219974Smav * SUCH DAMAGE. 26219974Smav */ 27219974Smav 28219974Smav#include <sys/cdefs.h> 29219974Smav__FBSDID("$FreeBSD$"); 30219974Smav 31219974Smav#include <sys/param.h> 32219974Smav#include <sys/bio.h> 33219974Smav#include <sys/endian.h> 34219974Smav#include <sys/kernel.h> 35219974Smav#include <sys/kobj.h> 36219974Smav#include <sys/limits.h> 37219974Smav#include <sys/lock.h> 38219974Smav#include <sys/malloc.h> 39219974Smav#include <sys/mutex.h> 40219974Smav#include <sys/systm.h> 41219974Smav#include <geom/geom.h> 42219974Smav#include "geom/raid/g_raid.h" 43219974Smav#include "g_raid_md_if.h" 44219974Smav 45219974Smavstatic MALLOC_DEFINE(M_MD_PROMISE, "md_promise_data", "GEOM_RAID Promise metadata"); 46219974Smav 47219974Smav#define PROMISE_MAX_DISKS 8 48219974Smav#define PROMISE_MAX_SUBDISKS 2 49219974Smav#define PROMISE_META_OFFSET 14 50219974Smav 51219974Smavstruct promise_raid_disk { 52219974Smav uint8_t flags; /* Subdisk status. */ 53219974Smav#define PROMISE_F_VALID 0x01 54219974Smav#define PROMISE_F_ONLINE 0x02 55219974Smav#define PROMISE_F_ASSIGNED 0x04 56219974Smav#define PROMISE_F_SPARE 0x08 57219974Smav#define PROMISE_F_DUPLICATE 0x10 58219974Smav#define PROMISE_F_REDIR 0x20 59219974Smav#define PROMISE_F_DOWN 0x40 60219974Smav#define PROMISE_F_READY 0x80 61219974Smav 62219974Smav uint8_t number; /* Position in a volume. */ 63219974Smav uint8_t channel; /* ATA channel number. */ 64219974Smav uint8_t device; /* ATA device number. */ 65219974Smav uint64_t id __packed; /* Subdisk ID. */ 66219974Smav} __packed; 67219974Smav 68219974Smavstruct promise_raid_conf { 69219974Smav char promise_id[24]; 70219974Smav#define PROMISE_MAGIC "Promise Technology, Inc." 71219974Smav#define FREEBSD_MAGIC "FreeBSD ATA driver RAID " 72219974Smav 73219974Smav uint32_t dummy_0; 74219974Smav uint64_t magic_0; 75219974Smav#define PROMISE_MAGIC0(x) (((uint64_t)(x.channel) << 48) | \ 76219974Smav ((uint64_t)(x.device != 0) << 56)) 77219974Smav uint16_t magic_1; 78219974Smav uint32_t magic_2; 79219974Smav uint8_t filler1[470]; 80219974Smav 81219974Smav uint32_t integrity; 82219974Smav#define PROMISE_I_VALID 0x00000080 83219974Smav 84219974Smav struct promise_raid_disk disk; /* This subdisk info. */ 85219974Smav uint32_t disk_offset; /* Subdisk offset. */ 86219974Smav uint32_t disk_sectors; /* Subdisk size */ 87245522Smav uint32_t disk_rebuild; /* Rebuild position. */ 88219974Smav uint16_t generation; /* Generation number. */ 89219974Smav uint8_t status; /* Volume status. */ 90219974Smav#define PROMISE_S_VALID 0x01 91219974Smav#define PROMISE_S_ONLINE 0x02 92219974Smav#define PROMISE_S_INITED 0x04 93219974Smav#define PROMISE_S_READY 0x08 94219974Smav#define PROMISE_S_DEGRADED 0x10 95219974Smav#define PROMISE_S_MARKED 0x20 96219974Smav#define PROMISE_S_MIGRATING 0x40 97219974Smav#define PROMISE_S_FUNCTIONAL 0x80 98219974Smav 99219974Smav uint8_t type; /* Voluem type. */ 100219974Smav#define PROMISE_T_RAID0 0x00 101219974Smav#define PROMISE_T_RAID1 0x01 102219974Smav#define PROMISE_T_RAID3 0x02 103219974Smav#define PROMISE_T_RAID5 0x04 104219974Smav#define PROMISE_T_SPAN 0x08 105219974Smav#define PROMISE_T_JBOD 0x10 106219974Smav 107219974Smav uint8_t total_disks; /* Disks in this volume. */ 108219974Smav uint8_t stripe_shift; /* Strip size. */ 109219974Smav uint8_t array_width; /* Number of RAID0 stripes. */ 110219974Smav uint8_t array_number; /* Global volume number. */ 111219974Smav uint32_t total_sectors; /* Volume size. */ 112219974Smav uint16_t cylinders; /* Volume geometry: C. */ 113219974Smav uint8_t heads; /* Volume geometry: H. */ 114219974Smav uint8_t sectors; /* Volume geometry: S. */ 115219974Smav uint64_t volume_id __packed; /* Volume ID, */ 116219974Smav struct promise_raid_disk disks[PROMISE_MAX_DISKS]; 117219974Smav /* Subdisks in this volume. */ 118219974Smav char name[32]; /* Volume label. */ 119219974Smav 120219974Smav uint32_t filler2[8]; 121219974Smav uint32_t magic_3; /* Something related to rebuild. */ 122219974Smav uint64_t rebuild_lba64; /* Per-volume rebuild position. */ 123219974Smav uint32_t magic_4; 124219974Smav uint32_t magic_5; 125226816Smav uint32_t total_sectors_high; 126245522Smav uint8_t magic_6; 127245522Smav uint8_t sector_size; 128245522Smav uint16_t magic_7; 129245533Smav uint32_t magic_8[31]; 130245533Smav uint32_t backup_time; 131245522Smav uint16_t magic_9; 132245522Smav uint32_t disk_offset_high; 133245522Smav uint32_t disk_sectors_high; 134245522Smav uint32_t disk_rebuild_high; 135245522Smav uint16_t magic_10; 136245522Smav uint32_t magic_11[3]; 137245522Smav uint32_t filler3[284]; 138219974Smav uint32_t checksum; 139219974Smav} __packed; 140219974Smav 141219974Smavstruct g_raid_md_promise_perdisk { 142219974Smav int pd_updated; 143219974Smav int pd_subdisks; 144219974Smav struct promise_raid_conf *pd_meta[PROMISE_MAX_SUBDISKS]; 145219974Smav}; 146219974Smav 147219974Smavstruct g_raid_md_promise_pervolume { 148219974Smav struct promise_raid_conf *pv_meta; 149219974Smav uint64_t pv_id; 150219974Smav uint16_t pv_generation; 151219974Smav int pv_disks_present; 152219974Smav int pv_started; 153219974Smav struct callout pv_start_co; /* STARTING state timer. */ 154219974Smav}; 155219974Smav 156219974Smavstatic g_raid_md_create_t g_raid_md_create_promise; 157219974Smavstatic g_raid_md_taste_t g_raid_md_taste_promise; 158219974Smavstatic g_raid_md_event_t g_raid_md_event_promise; 159219974Smavstatic g_raid_md_volume_event_t g_raid_md_volume_event_promise; 160219974Smavstatic g_raid_md_ctl_t g_raid_md_ctl_promise; 161219974Smavstatic g_raid_md_write_t g_raid_md_write_promise; 162219974Smavstatic g_raid_md_fail_disk_t g_raid_md_fail_disk_promise; 163219974Smavstatic g_raid_md_free_disk_t g_raid_md_free_disk_promise; 164219974Smavstatic g_raid_md_free_volume_t g_raid_md_free_volume_promise; 165219974Smavstatic g_raid_md_free_t g_raid_md_free_promise; 166219974Smav 167219974Smavstatic kobj_method_t g_raid_md_promise_methods[] = { 168219974Smav KOBJMETHOD(g_raid_md_create, g_raid_md_create_promise), 169219974Smav KOBJMETHOD(g_raid_md_taste, g_raid_md_taste_promise), 170219974Smav KOBJMETHOD(g_raid_md_event, g_raid_md_event_promise), 171219974Smav KOBJMETHOD(g_raid_md_volume_event, g_raid_md_volume_event_promise), 172219974Smav KOBJMETHOD(g_raid_md_ctl, g_raid_md_ctl_promise), 173219974Smav KOBJMETHOD(g_raid_md_write, g_raid_md_write_promise), 174219974Smav KOBJMETHOD(g_raid_md_fail_disk, g_raid_md_fail_disk_promise), 175219974Smav KOBJMETHOD(g_raid_md_free_disk, g_raid_md_free_disk_promise), 176219974Smav KOBJMETHOD(g_raid_md_free_volume, g_raid_md_free_volume_promise), 177219974Smav KOBJMETHOD(g_raid_md_free, g_raid_md_free_promise), 178219974Smav { 0, 0 } 179219974Smav}; 180219974Smav 181219974Smavstatic struct g_raid_md_class g_raid_md_promise_class = { 182219974Smav "Promise", 183219974Smav g_raid_md_promise_methods, 184219974Smav sizeof(struct g_raid_md_object), 185240465Smav .mdc_enable = 1, 186219974Smav .mdc_priority = 100 187219974Smav}; 188219974Smav 189219974Smav 190219974Smavstatic void 191219974Smavg_raid_md_promise_print(struct promise_raid_conf *meta) 192219974Smav{ 193219974Smav int i; 194219974Smav 195219974Smav if (g_raid_debug < 1) 196219974Smav return; 197219974Smav 198219974Smav printf("********* ATA Promise Metadata *********\n"); 199219974Smav printf("promise_id <%.24s>\n", meta->promise_id); 200219974Smav printf("disk %02x %02x %02x %02x %016jx\n", 201219974Smav meta->disk.flags, meta->disk.number, meta->disk.channel, 202219974Smav meta->disk.device, meta->disk.id); 203219974Smav printf("disk_offset %u\n", meta->disk_offset); 204219974Smav printf("disk_sectors %u\n", meta->disk_sectors); 205245522Smav printf("disk_rebuild %u\n", meta->disk_rebuild); 206219974Smav printf("generation %u\n", meta->generation); 207219974Smav printf("status 0x%02x\n", meta->status); 208219974Smav printf("type %u\n", meta->type); 209219974Smav printf("total_disks %u\n", meta->total_disks); 210219974Smav printf("stripe_shift %u\n", meta->stripe_shift); 211219974Smav printf("array_width %u\n", meta->array_width); 212219974Smav printf("array_number %u\n", meta->array_number); 213219974Smav printf("total_sectors %u\n", meta->total_sectors); 214219974Smav printf("cylinders %u\n", meta->cylinders); 215219974Smav printf("heads %u\n", meta->heads); 216219974Smav printf("sectors %u\n", meta->sectors); 217219974Smav printf("volume_id 0x%016jx\n", meta->volume_id); 218219974Smav printf("disks:\n"); 219219974Smav for (i = 0; i < PROMISE_MAX_DISKS; i++ ) { 220219974Smav printf(" %02x %02x %02x %02x %016jx\n", 221219974Smav meta->disks[i].flags, meta->disks[i].number, 222219974Smav meta->disks[i].channel, meta->disks[i].device, 223219974Smav meta->disks[i].id); 224219974Smav } 225219974Smav printf("name <%.32s>\n", meta->name); 226219974Smav printf("magic_3 0x%08x\n", meta->magic_3); 227219974Smav printf("rebuild_lba64 %ju\n", meta->rebuild_lba64); 228219974Smav printf("magic_4 0x%08x\n", meta->magic_4); 229219974Smav printf("magic_5 0x%08x\n", meta->magic_5); 230226816Smav printf("total_sectors_high 0x%08x\n", meta->total_sectors_high); 231245522Smav printf("sector_size %u\n", meta->sector_size); 232245533Smav printf("backup_time %d\n", meta->backup_time); 233245522Smav printf("disk_offset_high 0x%08x\n", meta->disk_offset_high); 234245522Smav printf("disk_sectors_high 0x%08x\n", meta->disk_sectors_high); 235245522Smav printf("disk_rebuild_high 0x%08x\n", meta->disk_rebuild_high); 236219974Smav printf("=================================================\n"); 237219974Smav} 238219974Smav 239219974Smavstatic struct promise_raid_conf * 240219974Smavpromise_meta_copy(struct promise_raid_conf *meta) 241219974Smav{ 242219974Smav struct promise_raid_conf *nmeta; 243219974Smav 244219974Smav nmeta = malloc(sizeof(*nmeta), M_MD_PROMISE, M_WAITOK); 245219974Smav memcpy(nmeta, meta, sizeof(*nmeta)); 246219974Smav return (nmeta); 247219974Smav} 248219974Smav 249219974Smavstatic int 250219974Smavpromise_meta_find_disk(struct promise_raid_conf *meta, uint64_t id) 251219974Smav{ 252219974Smav int pos; 253219974Smav 254219974Smav for (pos = 0; pos < meta->total_disks; pos++) { 255219974Smav if (meta->disks[pos].id == id) 256219974Smav return (pos); 257219974Smav } 258219974Smav return (-1); 259219974Smav} 260219974Smav 261219974Smavstatic int 262219974Smavpromise_meta_unused_range(struct promise_raid_conf **metaarr, int nsd, 263245522Smav off_t sectors, off_t *off, off_t *size) 264219974Smav{ 265245522Smav off_t coff, csize, tmp; 266219974Smav int i, j; 267219974Smav 268219974Smav sectors -= 131072; 269219974Smav *off = 0; 270219974Smav *size = 0; 271219974Smav coff = 0; 272219974Smav csize = sectors; 273219974Smav i = 0; 274219974Smav while (1) { 275219974Smav for (j = 0; j < nsd; j++) { 276245522Smav tmp = ((off_t)metaarr[j]->disk_offset_high << 32) + 277245522Smav metaarr[j]->disk_offset; 278245522Smav if (tmp >= coff) 279245522Smav csize = MIN(csize, tmp - coff); 280219974Smav } 281219974Smav if (csize > *size) { 282219974Smav *off = coff; 283219974Smav *size = csize; 284219974Smav } 285219974Smav if (i >= nsd) 286219974Smav break; 287245522Smav coff = ((off_t)metaarr[i]->disk_offset_high << 32) + 288245522Smav metaarr[i]->disk_offset + 289245522Smav ((off_t)metaarr[i]->disk_sectors_high << 32) + 290245522Smav metaarr[i]->disk_sectors; 291219974Smav csize = sectors - coff; 292219974Smav i++; 293297793Spfg } 294219974Smav return ((*size > 0) ? 1 : 0); 295219974Smav} 296219974Smav 297219974Smavstatic int 298219974Smavpromise_meta_translate_disk(struct g_raid_volume *vol, int md_disk_pos) 299219974Smav{ 300219974Smav int disk_pos, width; 301219974Smav 302219974Smav if (md_disk_pos >= 0 && vol->v_raid_level == G_RAID_VOLUME_RL_RAID1E) { 303219974Smav width = vol->v_disks_count / 2; 304219974Smav disk_pos = (md_disk_pos / width) + 305219974Smav (md_disk_pos % width) * width; 306219974Smav } else 307219974Smav disk_pos = md_disk_pos; 308219974Smav return (disk_pos); 309219974Smav} 310219974Smav 311219974Smavstatic void 312219974Smavpromise_meta_get_name(struct promise_raid_conf *meta, char *buf) 313219974Smav{ 314219974Smav int i; 315219974Smav 316219974Smav strncpy(buf, meta->name, 32); 317219974Smav buf[32] = 0; 318219974Smav for (i = 31; i >= 0; i--) { 319219974Smav if (buf[i] > 0x20) 320219974Smav break; 321219974Smav buf[i] = 0; 322219974Smav } 323219974Smav} 324219974Smav 325219974Smavstatic void 326219974Smavpromise_meta_put_name(struct promise_raid_conf *meta, char *buf) 327219974Smav{ 328219974Smav 329219974Smav memset(meta->name, 0x20, 32); 330219974Smav memcpy(meta->name, buf, MIN(strlen(buf), 32)); 331219974Smav} 332219974Smav 333219974Smavstatic int 334219974Smavpromise_meta_read(struct g_consumer *cp, struct promise_raid_conf **metaarr) 335219974Smav{ 336219974Smav struct g_provider *pp; 337219974Smav struct promise_raid_conf *meta; 338219974Smav char *buf; 339219974Smav int error, i, subdisks; 340219974Smav uint32_t checksum, *ptr; 341219974Smav 342219974Smav pp = cp->provider; 343219974Smav subdisks = 0; 344219974Smavnext: 345219974Smav /* Read metadata block. */ 346219974Smav buf = g_read_data(cp, pp->mediasize - pp->sectorsize * 347219974Smav (63 - subdisks * PROMISE_META_OFFSET), 348219974Smav pp->sectorsize * 4, &error); 349219974Smav if (buf == NULL) { 350219974Smav G_RAID_DEBUG(1, "Cannot read metadata from %s (error=%d).", 351219974Smav pp->name, error); 352219974Smav return (subdisks); 353219974Smav } 354219974Smav meta = (struct promise_raid_conf *)buf; 355219974Smav 356219974Smav /* Check if this is an Promise RAID struct */ 357219974Smav if (strncmp(meta->promise_id, PROMISE_MAGIC, strlen(PROMISE_MAGIC)) && 358219974Smav strncmp(meta->promise_id, FREEBSD_MAGIC, strlen(FREEBSD_MAGIC))) { 359219974Smav if (subdisks == 0) 360219974Smav G_RAID_DEBUG(1, 361219974Smav "Promise signature check failed on %s", pp->name); 362219974Smav g_free(buf); 363219974Smav return (subdisks); 364219974Smav } 365219974Smav meta = malloc(sizeof(*meta), M_MD_PROMISE, M_WAITOK); 366219974Smav memcpy(meta, buf, MIN(sizeof(*meta), pp->sectorsize * 4)); 367219974Smav g_free(buf); 368219974Smav 369219974Smav /* Check metadata checksum. */ 370219974Smav for (checksum = 0, ptr = (uint32_t *)meta, i = 0; i < 511; i++) 371219974Smav checksum += *ptr++; 372219974Smav if (checksum != meta->checksum) { 373219974Smav G_RAID_DEBUG(1, "Promise checksum check failed on %s", pp->name); 374219974Smav free(meta, M_MD_PROMISE); 375219974Smav return (subdisks); 376219974Smav } 377219974Smav 378219974Smav if ((meta->integrity & PROMISE_I_VALID) == 0) { 379219974Smav G_RAID_DEBUG(1, "Promise metadata is invalid on %s", pp->name); 380219974Smav free(meta, M_MD_PROMISE); 381219974Smav return (subdisks); 382219974Smav } 383219974Smav 384219974Smav if (meta->total_disks > PROMISE_MAX_DISKS) { 385219974Smav G_RAID_DEBUG(1, "Wrong number of disks on %s (%d)", 386219974Smav pp->name, meta->total_disks); 387219974Smav free(meta, M_MD_PROMISE); 388219974Smav return (subdisks); 389219974Smav } 390219974Smav 391245522Smav /* Remove filler garbage from fields used in newer metadata. */ 392245522Smav if (meta->disk_offset_high == 0x8b8c8d8e && 393245522Smav meta->disk_sectors_high == 0x8788898a && 394245522Smav meta->disk_rebuild_high == 0x83848586) { 395245522Smav meta->disk_offset_high = 0; 396245522Smav meta->disk_sectors_high = 0; 397245522Smav if (meta->disk_rebuild == UINT32_MAX) 398245522Smav meta->disk_rebuild_high = UINT32_MAX; 399245522Smav else 400245522Smav meta->disk_rebuild_high = 0; 401245522Smav if (meta->total_sectors_high == 0x15161718) { 402245522Smav meta->total_sectors_high = 0; 403245533Smav meta->backup_time = 0; 404245522Smav if (meta->rebuild_lba64 == 0x2122232425262728) 405245522Smav meta->rebuild_lba64 = UINT64_MAX; 406245522Smav } 407245522Smav } 408245522Smav if (meta->sector_size < 1 || meta->sector_size > 8) 409245522Smav meta->sector_size = 1; 410245522Smav 411219974Smav /* Save this part and look for next. */ 412219974Smav *metaarr = meta; 413219974Smav metaarr++; 414219974Smav subdisks++; 415219974Smav if (subdisks < PROMISE_MAX_SUBDISKS) 416219974Smav goto next; 417219974Smav 418219974Smav return (subdisks); 419219974Smav} 420219974Smav 421219974Smavstatic int 422219974Smavpromise_meta_write(struct g_consumer *cp, 423219974Smav struct promise_raid_conf **metaarr, int nsd) 424219974Smav{ 425219974Smav struct g_provider *pp; 426219974Smav struct promise_raid_conf *meta; 427219974Smav char *buf; 428245522Smav off_t off, size; 429219974Smav int error, i, subdisk, fake; 430245522Smav uint32_t checksum, *ptr; 431219974Smav 432219974Smav pp = cp->provider; 433219974Smav subdisk = 0; 434219974Smav fake = 0; 435219974Smavnext: 436219974Smav buf = malloc(pp->sectorsize * 4, M_MD_PROMISE, M_WAITOK | M_ZERO); 437219974Smav meta = NULL; 438219974Smav if (subdisk < nsd) { 439219974Smav meta = metaarr[subdisk]; 440219974Smav } else if (!fake && promise_meta_unused_range(metaarr, nsd, 441219974Smav cp->provider->mediasize / cp->provider->sectorsize, 442219974Smav &off, &size)) { 443219974Smav /* Optionally add record for unused space. */ 444219974Smav meta = (struct promise_raid_conf *)buf; 445220209Smav memcpy(&meta->promise_id[0], PROMISE_MAGIC, 446220209Smav sizeof(PROMISE_MAGIC) - 1); 447219974Smav meta->dummy_0 = 0x00020000; 448219974Smav meta->integrity = PROMISE_I_VALID; 449219974Smav meta->disk.flags = PROMISE_F_ONLINE | PROMISE_F_VALID; 450219974Smav meta->disk.number = 0xff; 451219974Smav arc4rand(&meta->disk.id, sizeof(meta->disk.id), 0); 452245522Smav meta->disk_offset_high = off >> 32; 453245522Smav meta->disk_offset = (uint32_t)off; 454245522Smav meta->disk_sectors_high = size >> 32; 455245522Smav meta->disk_sectors = (uint32_t)size; 456245522Smav meta->disk_rebuild_high = UINT32_MAX; 457245522Smav meta->disk_rebuild = UINT32_MAX; 458219974Smav fake = 1; 459219974Smav } 460219974Smav if (meta != NULL) { 461219974Smav /* Recalculate checksum for case if metadata were changed. */ 462219974Smav meta->checksum = 0; 463219974Smav for (checksum = 0, ptr = (uint32_t *)meta, i = 0; i < 511; i++) 464219974Smav checksum += *ptr++; 465219974Smav meta->checksum = checksum; 466219974Smav memcpy(buf, meta, MIN(pp->sectorsize * 4, sizeof(*meta))); 467219974Smav } 468219974Smav error = g_write_data(cp, pp->mediasize - pp->sectorsize * 469219974Smav (63 - subdisk * PROMISE_META_OFFSET), 470219974Smav buf, pp->sectorsize * 4); 471219974Smav if (error != 0) { 472219974Smav G_RAID_DEBUG(1, "Cannot write metadata to %s (error=%d).", 473219974Smav pp->name, error); 474219974Smav } 475219974Smav free(buf, M_MD_PROMISE); 476219974Smav 477219974Smav subdisk++; 478219974Smav if (subdisk < PROMISE_MAX_SUBDISKS) 479219974Smav goto next; 480219974Smav 481219974Smav return (error); 482219974Smav} 483219974Smav 484219974Smavstatic int 485219974Smavpromise_meta_erase(struct g_consumer *cp) 486219974Smav{ 487219974Smav struct g_provider *pp; 488219974Smav char *buf; 489219974Smav int error, subdisk; 490219974Smav 491219974Smav pp = cp->provider; 492219974Smav buf = malloc(4 * pp->sectorsize, M_MD_PROMISE, M_WAITOK | M_ZERO); 493219974Smav for (subdisk = 0; subdisk < PROMISE_MAX_SUBDISKS; subdisk++) { 494219974Smav error = g_write_data(cp, pp->mediasize - pp->sectorsize * 495219974Smav (63 - subdisk * PROMISE_META_OFFSET), 496219974Smav buf, 4 * pp->sectorsize); 497219974Smav if (error != 0) { 498219974Smav G_RAID_DEBUG(1, "Cannot erase metadata on %s (error=%d).", 499219974Smav pp->name, error); 500219974Smav } 501219974Smav } 502219974Smav free(buf, M_MD_PROMISE); 503219974Smav return (error); 504219974Smav} 505219974Smav 506219974Smavstatic int 507219974Smavpromise_meta_write_spare(struct g_consumer *cp) 508219974Smav{ 509219974Smav struct promise_raid_conf *meta; 510245522Smav off_t tmp; 511219974Smav int error; 512219974Smav 513219974Smav meta = malloc(sizeof(*meta), M_MD_PROMISE, M_WAITOK | M_ZERO); 514220209Smav memcpy(&meta->promise_id[0], PROMISE_MAGIC, sizeof(PROMISE_MAGIC) - 1); 515219974Smav meta->dummy_0 = 0x00020000; 516219974Smav meta->integrity = PROMISE_I_VALID; 517219974Smav meta->disk.flags = PROMISE_F_SPARE | PROMISE_F_ONLINE | PROMISE_F_VALID; 518219974Smav meta->disk.number = 0xff; 519219974Smav arc4rand(&meta->disk.id, sizeof(meta->disk.id), 0); 520245522Smav tmp = cp->provider->mediasize / cp->provider->sectorsize - 131072; 521245522Smav meta->disk_sectors_high = tmp >> 32; 522245522Smav meta->disk_sectors = (uint32_t)tmp; 523245522Smav meta->disk_rebuild_high = UINT32_MAX; 524245522Smav meta->disk_rebuild = UINT32_MAX; 525219974Smav error = promise_meta_write(cp, &meta, 1); 526219974Smav free(meta, M_MD_PROMISE); 527219974Smav return (error); 528219974Smav} 529219974Smav 530219974Smavstatic struct g_raid_volume * 531219974Smavg_raid_md_promise_get_volume(struct g_raid_softc *sc, uint64_t id) 532219974Smav{ 533219974Smav struct g_raid_volume *vol; 534219974Smav struct g_raid_md_promise_pervolume *pv; 535219974Smav 536219974Smav TAILQ_FOREACH(vol, &sc->sc_volumes, v_next) { 537219974Smav pv = vol->v_md_data; 538219974Smav if (pv->pv_id == id) 539219974Smav break; 540219974Smav } 541219974Smav return (vol); 542219974Smav} 543219974Smav 544219974Smavstatic int 545219974Smavg_raid_md_promise_purge_volumes(struct g_raid_softc *sc) 546219974Smav{ 547219974Smav struct g_raid_volume *vol, *tvol; 548219974Smav struct g_raid_md_promise_pervolume *pv; 549219974Smav int i, res; 550219974Smav 551219974Smav res = 0; 552219974Smav TAILQ_FOREACH_SAFE(vol, &sc->sc_volumes, v_next, tvol) { 553219974Smav pv = vol->v_md_data; 554219974Smav if (!pv->pv_started || vol->v_stopping) 555219974Smav continue; 556219974Smav for (i = 0; i < vol->v_disks_count; i++) { 557219974Smav if (vol->v_subdisks[i].sd_state != G_RAID_SUBDISK_S_NONE) 558219974Smav break; 559219974Smav } 560219974Smav if (i >= vol->v_disks_count) { 561219974Smav g_raid_destroy_volume(vol); 562219974Smav res = 1; 563219974Smav } 564219974Smav } 565219974Smav return (res); 566219974Smav} 567219974Smav 568219974Smavstatic int 569219974Smavg_raid_md_promise_purge_disks(struct g_raid_softc *sc) 570219974Smav{ 571219974Smav struct g_raid_disk *disk, *tdisk; 572219974Smav struct g_raid_volume *vol; 573219974Smav struct g_raid_md_promise_perdisk *pd; 574219974Smav int i, j, res; 575219974Smav 576219974Smav res = 0; 577219974Smav TAILQ_FOREACH_SAFE(disk, &sc->sc_disks, d_next, tdisk) { 578219974Smav if (disk->d_state == G_RAID_DISK_S_SPARE) 579219974Smav continue; 580219974Smav pd = (struct g_raid_md_promise_perdisk *)disk->d_md_data; 581219974Smav 582219974Smav /* Scan for deleted volumes. */ 583219974Smav for (i = 0; i < pd->pd_subdisks; ) { 584219974Smav vol = g_raid_md_promise_get_volume(sc, 585219974Smav pd->pd_meta[i]->volume_id); 586219974Smav if (vol != NULL && !vol->v_stopping) { 587219974Smav i++; 588219974Smav continue; 589219974Smav } 590219974Smav free(pd->pd_meta[i], M_MD_PROMISE); 591219974Smav for (j = i; j < pd->pd_subdisks - 1; j++) 592219974Smav pd->pd_meta[j] = pd->pd_meta[j + 1]; 593241418Smav pd->pd_meta[pd->pd_subdisks - 1] = NULL; 594219974Smav pd->pd_subdisks--; 595219974Smav pd->pd_updated = 1; 596219974Smav } 597219974Smav 598219974Smav /* If there is no metadata left - erase and delete disk. */ 599219974Smav if (pd->pd_subdisks == 0) { 600219974Smav promise_meta_erase(disk->d_consumer); 601219974Smav g_raid_destroy_disk(disk); 602219974Smav res = 1; 603219974Smav } 604219974Smav } 605219974Smav return (res); 606219974Smav} 607219974Smav 608219974Smavstatic int 609219974Smavg_raid_md_promise_supported(int level, int qual, int disks, int force) 610219974Smav{ 611219974Smav 612219974Smav if (disks > PROMISE_MAX_DISKS) 613219974Smav return (0); 614219974Smav switch (level) { 615219974Smav case G_RAID_VOLUME_RL_RAID0: 616219974Smav if (disks < 1) 617219974Smav return (0); 618219974Smav if (!force && disks < 2) 619219974Smav return (0); 620219974Smav break; 621219974Smav case G_RAID_VOLUME_RL_RAID1: 622219974Smav if (disks < 1) 623219974Smav return (0); 624219974Smav if (!force && (disks != 2)) 625219974Smav return (0); 626219974Smav break; 627219974Smav case G_RAID_VOLUME_RL_RAID1E: 628219974Smav if (disks < 2) 629219974Smav return (0); 630219974Smav if (disks % 2 != 0) 631219974Smav return (0); 632219974Smav if (!force && (disks != 4)) 633219974Smav return (0); 634219974Smav break; 635219974Smav case G_RAID_VOLUME_RL_SINGLE: 636219974Smav if (disks != 1) 637219974Smav return (0); 638219974Smav break; 639219974Smav case G_RAID_VOLUME_RL_CONCAT: 640219974Smav if (disks < 2) 641219974Smav return (0); 642219974Smav break; 643219974Smav case G_RAID_VOLUME_RL_RAID5: 644219974Smav if (disks < 3) 645219974Smav return (0); 646234458Smav if (qual != G_RAID_VOLUME_RLQ_R5LA) 647234458Smav return (0); 648219974Smav break; 649219974Smav default: 650219974Smav return (0); 651219974Smav } 652234458Smav if (level != G_RAID_VOLUME_RL_RAID5 && qual != G_RAID_VOLUME_RLQ_NONE) 653219974Smav return (0); 654219974Smav return (1); 655219974Smav} 656219974Smav 657219974Smavstatic int 658219974Smavg_raid_md_promise_start_disk(struct g_raid_disk *disk, int sdn, 659219974Smav struct g_raid_volume *vol) 660219974Smav{ 661219974Smav struct g_raid_softc *sc; 662219974Smav struct g_raid_subdisk *sd; 663219974Smav struct g_raid_md_promise_perdisk *pd; 664219974Smav struct g_raid_md_promise_pervolume *pv; 665219974Smav struct promise_raid_conf *meta; 666245522Smav off_t eoff, esize, size; 667219974Smav int disk_pos, md_disk_pos, i, resurrection = 0; 668219974Smav 669219974Smav sc = disk->d_softc; 670219974Smav pd = (struct g_raid_md_promise_perdisk *)disk->d_md_data; 671219974Smav 672219974Smav pv = vol->v_md_data; 673219974Smav meta = pv->pv_meta; 674219974Smav 675219974Smav if (sdn >= 0) { 676219974Smav /* Find disk position in metadata by it's serial. */ 677219974Smav md_disk_pos = promise_meta_find_disk(meta, pd->pd_meta[sdn]->disk.id); 678219974Smav /* For RAID0+1 we need to translate order. */ 679219974Smav disk_pos = promise_meta_translate_disk(vol, md_disk_pos); 680219974Smav } else { 681219974Smav md_disk_pos = -1; 682219974Smav disk_pos = -1; 683219974Smav } 684219974Smav if (disk_pos < 0) { 685219974Smav G_RAID_DEBUG1(1, sc, "Disk %s is not part of the volume %s", 686219974Smav g_raid_get_diskname(disk), vol->v_name); 687219974Smav /* Failed stale disk is useless for us. */ 688219974Smav if (sdn >= 0 && 689219974Smav pd->pd_meta[sdn]->disk.flags & PROMISE_F_DOWN) { 690219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_STALE_FAILED); 691219974Smav return (0); 692219974Smav } 693219974Smav /* If we were given specific metadata subdisk - erase it. */ 694219974Smav if (sdn >= 0) { 695219974Smav free(pd->pd_meta[sdn], M_MD_PROMISE); 696219974Smav for (i = sdn; i < pd->pd_subdisks - 1; i++) 697219974Smav pd->pd_meta[i] = pd->pd_meta[i + 1]; 698241418Smav pd->pd_meta[pd->pd_subdisks - 1] = NULL; 699219974Smav pd->pd_subdisks--; 700219974Smav } 701219974Smav /* If we are in the start process, that's all for now. */ 702219974Smav if (!pv->pv_started) 703219974Smav goto nofit; 704219974Smav /* 705219974Smav * If we have already started - try to get use of the disk. 706219974Smav * Try to replace OFFLINE disks first, then FAILED. 707219974Smav */ 708219974Smav promise_meta_unused_range(pd->pd_meta, pd->pd_subdisks, 709219974Smav disk->d_consumer->provider->mediasize / 710219974Smav disk->d_consumer->provider->sectorsize, 711219974Smav &eoff, &esize); 712219974Smav if (esize == 0) { 713219974Smav G_RAID_DEBUG1(1, sc, "No free space on disk %s", 714219974Smav g_raid_get_diskname(disk)); 715219974Smav goto nofit; 716219974Smav } 717219974Smav size = INT64_MAX; 718219974Smav for (i = 0; i < vol->v_disks_count; i++) { 719219974Smav sd = &vol->v_subdisks[i]; 720219974Smav if (sd->sd_state != G_RAID_SUBDISK_S_NONE) 721219974Smav size = sd->sd_size; 722219974Smav if (sd->sd_state <= G_RAID_SUBDISK_S_FAILED && 723219974Smav (disk_pos < 0 || 724219974Smav vol->v_subdisks[i].sd_state < sd->sd_state)) 725219974Smav disk_pos = i; 726219974Smav } 727219974Smav if (disk_pos >= 0 && 728219974Smav vol->v_raid_level != G_RAID_VOLUME_RL_CONCAT && 729219974Smav (off_t)esize * 512 < size) { 730219974Smav G_RAID_DEBUG1(1, sc, "Disk %s free space " 731219974Smav "is too small (%ju < %ju)", 732219974Smav g_raid_get_diskname(disk), 733219974Smav (off_t)esize * 512, size); 734219974Smav disk_pos = -1; 735219974Smav } 736219974Smav if (disk_pos >= 0) { 737219974Smav if (vol->v_raid_level != G_RAID_VOLUME_RL_CONCAT) 738219974Smav esize = size / 512; 739219974Smav /* For RAID0+1 we need to translate order. */ 740219974Smav md_disk_pos = promise_meta_translate_disk(vol, disk_pos); 741219974Smav } else { 742219974Smavnofit: 743219974Smav if (pd->pd_subdisks == 0) { 744219974Smav g_raid_change_disk_state(disk, 745219974Smav G_RAID_DISK_S_SPARE); 746219974Smav } 747219974Smav return (0); 748219974Smav } 749219974Smav G_RAID_DEBUG1(1, sc, "Disk %s takes pos %d in the volume %s", 750219974Smav g_raid_get_diskname(disk), disk_pos, vol->v_name); 751219974Smav resurrection = 1; 752219974Smav } 753219974Smav 754219974Smav sd = &vol->v_subdisks[disk_pos]; 755219974Smav 756219974Smav if (resurrection && sd->sd_disk != NULL) { 757219974Smav g_raid_change_disk_state(sd->sd_disk, 758219974Smav G_RAID_DISK_S_STALE_FAILED); 759219974Smav TAILQ_REMOVE(&sd->sd_disk->d_subdisks, 760219974Smav sd, sd_next); 761219974Smav } 762219974Smav vol->v_subdisks[disk_pos].sd_disk = disk; 763219974Smav TAILQ_INSERT_TAIL(&disk->d_subdisks, sd, sd_next); 764219974Smav 765219974Smav /* Welcome the new disk. */ 766219974Smav if (resurrection) 767219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_ACTIVE); 768219974Smav else if (meta->disks[md_disk_pos].flags & PROMISE_F_DOWN) 769219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_FAILED); 770219974Smav else 771219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_ACTIVE); 772219974Smav 773219974Smav if (resurrection) { 774219974Smav sd->sd_offset = (off_t)eoff * 512; 775219974Smav sd->sd_size = (off_t)esize * 512; 776219974Smav } else { 777245522Smav sd->sd_offset = (((off_t)pd->pd_meta[sdn]->disk_offset_high 778245522Smav << 32) + pd->pd_meta[sdn]->disk_offset) * 512; 779245522Smav sd->sd_size = (((off_t)pd->pd_meta[sdn]->disk_sectors_high 780245522Smav << 32) + pd->pd_meta[sdn]->disk_sectors) * 512; 781219974Smav } 782219974Smav 783219974Smav if (resurrection) { 784219974Smav /* Stale disk, almost same as new. */ 785219974Smav g_raid_change_subdisk_state(sd, 786219974Smav G_RAID_SUBDISK_S_NEW); 787219974Smav } else if (meta->disks[md_disk_pos].flags & PROMISE_F_DOWN) { 788219974Smav /* Failed disk. */ 789219974Smav g_raid_change_subdisk_state(sd, 790219974Smav G_RAID_SUBDISK_S_FAILED); 791219974Smav } else if (meta->disks[md_disk_pos].flags & PROMISE_F_REDIR) { 792219974Smav /* Rebuilding disk. */ 793219974Smav g_raid_change_subdisk_state(sd, 794219974Smav G_RAID_SUBDISK_S_REBUILD); 795219974Smav if (pd->pd_meta[sdn]->generation != meta->generation) 796219974Smav sd->sd_rebuild_pos = 0; 797219974Smav else { 798219974Smav sd->sd_rebuild_pos = 799245533Smav (((off_t)pd->pd_meta[sdn]->disk_rebuild_high << 32) + 800245522Smav pd->pd_meta[sdn]->disk_rebuild) * 512; 801219974Smav } 802219974Smav } else if (!(meta->disks[md_disk_pos].flags & PROMISE_F_ONLINE)) { 803219974Smav /* Rebuilding disk. */ 804219974Smav g_raid_change_subdisk_state(sd, 805219974Smav G_RAID_SUBDISK_S_NEW); 806219974Smav } else if (pd->pd_meta[sdn]->generation != meta->generation || 807219974Smav (meta->status & PROMISE_S_MARKED)) { 808219974Smav /* Stale disk or dirty volume (unclean shutdown). */ 809219974Smav g_raid_change_subdisk_state(sd, 810219974Smav G_RAID_SUBDISK_S_STALE); 811219974Smav } else { 812219974Smav /* Up to date disk. */ 813219974Smav g_raid_change_subdisk_state(sd, 814219974Smav G_RAID_SUBDISK_S_ACTIVE); 815219974Smav } 816219974Smav g_raid_event_send(sd, G_RAID_SUBDISK_E_NEW, 817219974Smav G_RAID_EVENT_SUBDISK); 818219974Smav 819219974Smav return (resurrection); 820219974Smav} 821219974Smav 822219974Smavstatic void 823219974Smavg_raid_md_promise_refill(struct g_raid_softc *sc) 824219974Smav{ 825219974Smav struct g_raid_volume *vol; 826219974Smav struct g_raid_subdisk *sd; 827219974Smav struct g_raid_disk *disk; 828219974Smav struct g_raid_md_object *md; 829219974Smav struct g_raid_md_promise_perdisk *pd; 830219974Smav struct g_raid_md_promise_pervolume *pv; 831219974Smav int update, updated, i, bad; 832219974Smav 833219974Smav md = sc->sc_md; 834219974Smavrestart: 835219974Smav updated = 0; 836219974Smav TAILQ_FOREACH(vol, &sc->sc_volumes, v_next) { 837219974Smav pv = vol->v_md_data; 838219974Smav if (!pv->pv_started || vol->v_stopping) 839219974Smav continue; 840219974Smav 841219974Smav /* Search for subdisk that needs replacement. */ 842219974Smav bad = 0; 843219974Smav for (i = 0; i < vol->v_disks_count; i++) { 844219974Smav sd = &vol->v_subdisks[i]; 845219974Smav if (sd->sd_state == G_RAID_SUBDISK_S_NONE || 846219974Smav sd->sd_state == G_RAID_SUBDISK_S_FAILED) 847219974Smav bad = 1; 848219974Smav } 849219974Smav if (!bad) 850219974Smav continue; 851219974Smav 852219974Smav G_RAID_DEBUG1(1, sc, "Volume %s is not complete, " 853219974Smav "trying to refill.", vol->v_name); 854219974Smav 855219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 856219974Smav /* Skip failed. */ 857219974Smav if (disk->d_state < G_RAID_DISK_S_SPARE) 858219974Smav continue; 859219974Smav /* Skip already used by this volume. */ 860219974Smav for (i = 0; i < vol->v_disks_count; i++) { 861219974Smav sd = &vol->v_subdisks[i]; 862219974Smav if (sd->sd_disk == disk) 863219974Smav break; 864219974Smav } 865219974Smav if (i < vol->v_disks_count) 866219974Smav continue; 867219974Smav 868219974Smav /* Try to use disk if it has empty extents. */ 869219974Smav pd = disk->d_md_data; 870219974Smav if (pd->pd_subdisks < PROMISE_MAX_SUBDISKS) { 871219974Smav update = 872219974Smav g_raid_md_promise_start_disk(disk, -1, vol); 873219974Smav } else 874219974Smav update = 0; 875219974Smav if (update) { 876220209Smav updated = 1; 877219974Smav g_raid_md_write_promise(md, vol, NULL, disk); 878219974Smav break; 879219974Smav } 880219974Smav } 881219974Smav } 882219974Smav if (updated) 883219974Smav goto restart; 884219974Smav} 885219974Smav 886219974Smavstatic void 887219974Smavg_raid_md_promise_start(struct g_raid_volume *vol) 888219974Smav{ 889219974Smav struct g_raid_softc *sc; 890219974Smav struct g_raid_subdisk *sd; 891219974Smav struct g_raid_disk *disk; 892219974Smav struct g_raid_md_object *md; 893219974Smav struct g_raid_md_promise_perdisk *pd; 894219974Smav struct g_raid_md_promise_pervolume *pv; 895219974Smav struct promise_raid_conf *meta; 896298698Spfg u_int i; 897219974Smav 898219974Smav sc = vol->v_softc; 899219974Smav md = sc->sc_md; 900219974Smav pv = vol->v_md_data; 901219974Smav meta = pv->pv_meta; 902219974Smav 903234458Smav vol->v_raid_level_qualifier = G_RAID_VOLUME_RLQ_NONE; 904219974Smav if (meta->type == PROMISE_T_RAID0) 905219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID0; 906219974Smav else if (meta->type == PROMISE_T_RAID1) { 907219974Smav if (meta->array_width == 1) 908219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID1; 909219974Smav else 910219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID1E; 911219974Smav } else if (meta->type == PROMISE_T_RAID3) 912219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID3; 913234458Smav else if (meta->type == PROMISE_T_RAID5) { 914219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID5; 915234458Smav vol->v_raid_level_qualifier = G_RAID_VOLUME_RLQ_R5LA; 916234458Smav } else if (meta->type == PROMISE_T_SPAN) 917219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_CONCAT; 918219974Smav else if (meta->type == PROMISE_T_JBOD) 919219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_SINGLE; 920219974Smav else 921219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_UNKNOWN; 922219974Smav vol->v_strip_size = 512 << meta->stripe_shift; //ZZZ 923219974Smav vol->v_disks_count = meta->total_disks; 924219974Smav vol->v_mediasize = (off_t)meta->total_sectors * 512; //ZZZ 925226816Smav if (meta->total_sectors_high < 256) /* If value looks sane. */ 926245522Smav vol->v_mediasize += 927226816Smav ((off_t)meta->total_sectors_high << 32) * 512; //ZZZ 928245522Smav vol->v_sectorsize = 512 * meta->sector_size; 929219974Smav for (i = 0; i < vol->v_disks_count; i++) { 930219974Smav sd = &vol->v_subdisks[i]; 931245522Smav sd->sd_offset = (((off_t)meta->disk_offset_high << 32) + 932245522Smav meta->disk_offset) * 512; 933245522Smav sd->sd_size = (((off_t)meta->disk_sectors_high << 32) + 934245522Smav meta->disk_sectors) * 512; 935219974Smav } 936219974Smav g_raid_start_volume(vol); 937219974Smav 938219974Smav /* Make all disks found till the moment take their places. */ 939219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 940219974Smav pd = disk->d_md_data; 941219974Smav for (i = 0; i < pd->pd_subdisks; i++) { 942219974Smav if (pd->pd_meta[i]->volume_id == meta->volume_id) 943219974Smav g_raid_md_promise_start_disk(disk, i, vol); 944219974Smav } 945219974Smav } 946219974Smav 947219974Smav pv->pv_started = 1; 948219974Smav callout_stop(&pv->pv_start_co); 949219974Smav G_RAID_DEBUG1(0, sc, "Volume started."); 950219974Smav g_raid_md_write_promise(md, vol, NULL, NULL); 951219974Smav 952219974Smav /* Pickup any STALE/SPARE disks to refill array if needed. */ 953219974Smav g_raid_md_promise_refill(sc); 954219974Smav 955219974Smav g_raid_event_send(vol, G_RAID_VOLUME_E_START, G_RAID_EVENT_VOLUME); 956219974Smav} 957219974Smav 958219974Smavstatic void 959219974Smavg_raid_promise_go(void *arg) 960219974Smav{ 961219974Smav struct g_raid_volume *vol; 962219974Smav struct g_raid_softc *sc; 963219974Smav struct g_raid_md_promise_pervolume *pv; 964219974Smav 965219974Smav vol = arg; 966219974Smav pv = vol->v_md_data; 967219974Smav sc = vol->v_softc; 968219974Smav if (!pv->pv_started) { 969219974Smav G_RAID_DEBUG1(0, sc, "Force volume start due to timeout."); 970219974Smav g_raid_event_send(vol, G_RAID_VOLUME_E_STARTMD, 971219974Smav G_RAID_EVENT_VOLUME); 972219974Smav } 973219974Smav} 974219974Smav 975219974Smavstatic void 976219974Smavg_raid_md_promise_new_disk(struct g_raid_disk *disk) 977219974Smav{ 978219974Smav struct g_raid_softc *sc; 979219974Smav struct g_raid_md_object *md; 980219974Smav struct promise_raid_conf *pdmeta; 981219974Smav struct g_raid_md_promise_perdisk *pd; 982219974Smav struct g_raid_md_promise_pervolume *pv; 983219974Smav struct g_raid_volume *vol; 984219974Smav int i; 985219974Smav char buf[33]; 986219974Smav 987219974Smav sc = disk->d_softc; 988219974Smav md = sc->sc_md; 989219974Smav pd = (struct g_raid_md_promise_perdisk *)disk->d_md_data; 990219974Smav 991219974Smav if (pd->pd_subdisks == 0) { 992219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_SPARE); 993219974Smav g_raid_md_promise_refill(sc); 994219974Smav return; 995219974Smav } 996219974Smav 997219974Smav for (i = 0; i < pd->pd_subdisks; i++) { 998219974Smav pdmeta = pd->pd_meta[i]; 999219974Smav 1000219974Smav /* Look for volume with matching ID. */ 1001219974Smav vol = g_raid_md_promise_get_volume(sc, pdmeta->volume_id); 1002219974Smav if (vol == NULL) { 1003219974Smav promise_meta_get_name(pdmeta, buf); 1004219974Smav vol = g_raid_create_volume(sc, buf, pdmeta->array_number); 1005219974Smav pv = malloc(sizeof(*pv), M_MD_PROMISE, M_WAITOK | M_ZERO); 1006219974Smav pv->pv_id = pdmeta->volume_id; 1007219974Smav vol->v_md_data = pv; 1008219974Smav callout_init(&pv->pv_start_co, 1); 1009219974Smav callout_reset(&pv->pv_start_co, 1010219974Smav g_raid_start_timeout * hz, 1011219974Smav g_raid_promise_go, vol); 1012219974Smav } else 1013219974Smav pv = vol->v_md_data; 1014219974Smav 1015219974Smav /* If we haven't started yet - check metadata freshness. */ 1016219974Smav if (pv->pv_meta == NULL || !pv->pv_started) { 1017219974Smav if (pv->pv_meta == NULL || 1018219974Smav ((int16_t)(pdmeta->generation - pv->pv_generation)) > 0) { 1019219974Smav G_RAID_DEBUG1(1, sc, "Newer disk"); 1020219974Smav if (pv->pv_meta != NULL) 1021219974Smav free(pv->pv_meta, M_MD_PROMISE); 1022219974Smav pv->pv_meta = promise_meta_copy(pdmeta); 1023219974Smav pv->pv_generation = pv->pv_meta->generation; 1024219974Smav pv->pv_disks_present = 1; 1025219974Smav } else if (pdmeta->generation == pv->pv_generation) { 1026219974Smav pv->pv_disks_present++; 1027219974Smav G_RAID_DEBUG1(1, sc, "Matching disk (%d of %d up)", 1028219974Smav pv->pv_disks_present, 1029219974Smav pv->pv_meta->total_disks); 1030219974Smav } else { 1031219974Smav G_RAID_DEBUG1(1, sc, "Older disk"); 1032219974Smav } 1033219974Smav } 1034219974Smav } 1035219974Smav 1036219974Smav for (i = 0; i < pd->pd_subdisks; i++) { 1037219974Smav pdmeta = pd->pd_meta[i]; 1038219974Smav 1039219974Smav /* Look for volume with matching ID. */ 1040219974Smav vol = g_raid_md_promise_get_volume(sc, pdmeta->volume_id); 1041219974Smav if (vol == NULL) 1042219974Smav continue; 1043219974Smav pv = vol->v_md_data; 1044219974Smav 1045219974Smav if (pv->pv_started) { 1046219974Smav if (g_raid_md_promise_start_disk(disk, i, vol)) 1047219974Smav g_raid_md_write_promise(md, vol, NULL, NULL); 1048219974Smav } else { 1049219974Smav /* If we collected all needed disks - start array. */ 1050219974Smav if (pv->pv_disks_present == pv->pv_meta->total_disks) 1051219974Smav g_raid_md_promise_start(vol); 1052219974Smav } 1053219974Smav } 1054219974Smav} 1055219974Smav 1056219974Smavstatic int 1057219974Smavg_raid_md_create_promise(struct g_raid_md_object *md, struct g_class *mp, 1058219974Smav struct g_geom **gp) 1059219974Smav{ 1060219974Smav struct g_geom *geom; 1061219974Smav struct g_raid_softc *sc; 1062219974Smav 1063219974Smav /* Search for existing node. */ 1064219974Smav LIST_FOREACH(geom, &mp->geom, geom) { 1065219974Smav sc = geom->softc; 1066219974Smav if (sc == NULL) 1067219974Smav continue; 1068219974Smav if (sc->sc_stopping != 0) 1069219974Smav continue; 1070219974Smav if (sc->sc_md->mdo_class != md->mdo_class) 1071219974Smav continue; 1072219974Smav break; 1073219974Smav } 1074219974Smav if (geom != NULL) { 1075219974Smav *gp = geom; 1076219974Smav return (G_RAID_MD_TASTE_EXISTING); 1077219974Smav } 1078219974Smav 1079219974Smav /* Create new one if not found. */ 1080219974Smav sc = g_raid_create_node(mp, "Promise", md); 1081219974Smav if (sc == NULL) 1082219974Smav return (G_RAID_MD_TASTE_FAIL); 1083219974Smav md->mdo_softc = sc; 1084219974Smav *gp = sc->sc_geom; 1085219974Smav return (G_RAID_MD_TASTE_NEW); 1086219974Smav} 1087219974Smav 1088219974Smavstatic int 1089219974Smavg_raid_md_taste_promise(struct g_raid_md_object *md, struct g_class *mp, 1090219974Smav struct g_consumer *cp, struct g_geom **gp) 1091219974Smav{ 1092219974Smav struct g_consumer *rcp; 1093219974Smav struct g_provider *pp; 1094219974Smav struct g_raid_softc *sc; 1095219974Smav struct g_raid_disk *disk; 1096219974Smav struct promise_raid_conf *meta, *metaarr[4]; 1097219974Smav struct g_raid_md_promise_perdisk *pd; 1098219974Smav struct g_geom *geom; 1099242323Smav int i, j, result, len, subdisks; 1100219974Smav char name[16]; 1101219974Smav uint16_t vendor; 1102219974Smav 1103219974Smav G_RAID_DEBUG(1, "Tasting Promise on %s", cp->provider->name); 1104219974Smav pp = cp->provider; 1105219974Smav 1106219974Smav /* Read metadata from device. */ 1107219974Smav meta = NULL; 1108279278Smav g_topology_unlock(); 1109219974Smav vendor = 0xffff; 1110279278Smav len = sizeof(vendor); 1111219974Smav if (pp->geom->rank == 1) 1112219974Smav g_io_getattr("GEOM::hba_vendor", cp, &len, &vendor); 1113219974Smav subdisks = promise_meta_read(cp, metaarr); 1114219974Smav g_topology_lock(); 1115219974Smav if (subdisks == 0) { 1116219974Smav if (g_raid_aggressive_spare) { 1117219974Smav if (vendor == 0x105a || vendor == 0x1002) { 1118219974Smav G_RAID_DEBUG(1, 1119219974Smav "No Promise metadata, forcing spare."); 1120219974Smav goto search; 1121219974Smav } else { 1122219974Smav G_RAID_DEBUG(1, 1123219974Smav "Promise/ATI vendor mismatch " 1124219974Smav "0x%04x != 0x105a/0x1002", 1125219974Smav vendor); 1126219974Smav } 1127219974Smav } 1128219974Smav return (G_RAID_MD_TASTE_FAIL); 1129219974Smav } 1130219974Smav 1131219974Smav /* Metadata valid. Print it. */ 1132219974Smav for (i = 0; i < subdisks; i++) 1133219974Smav g_raid_md_promise_print(metaarr[i]); 1134219974Smav 1135219974Smav /* Purge meaningless (empty/spare) records. */ 1136219974Smav for (i = 0; i < subdisks; ) { 1137219974Smav if (metaarr[i]->disk.flags & PROMISE_F_ASSIGNED) { 1138219974Smav i++; 1139219974Smav continue; 1140219974Smav } 1141219974Smav free(metaarr[i], M_MD_PROMISE); 1142219974Smav for (j = i; j < subdisks - 1; j++) 1143219974Smav metaarr[i] = metaarr[j + 1]; 1144241418Smav metaarr[subdisks - 1] = NULL; 1145219974Smav subdisks--; 1146219974Smav } 1147219974Smav 1148219974Smavsearch: 1149219974Smav /* Search for matching node. */ 1150219974Smav sc = NULL; 1151219974Smav LIST_FOREACH(geom, &mp->geom, geom) { 1152219974Smav sc = geom->softc; 1153219974Smav if (sc == NULL) 1154219974Smav continue; 1155219974Smav if (sc->sc_stopping != 0) 1156219974Smav continue; 1157219974Smav if (sc->sc_md->mdo_class != md->mdo_class) 1158219974Smav continue; 1159219974Smav break; 1160219974Smav } 1161219974Smav 1162219974Smav /* Found matching node. */ 1163219974Smav if (geom != NULL) { 1164219974Smav G_RAID_DEBUG(1, "Found matching array %s", sc->sc_name); 1165219974Smav result = G_RAID_MD_TASTE_EXISTING; 1166219974Smav 1167219974Smav } else { /* Not found matching node -- create one. */ 1168219974Smav result = G_RAID_MD_TASTE_NEW; 1169219974Smav snprintf(name, sizeof(name), "Promise"); 1170219974Smav sc = g_raid_create_node(mp, name, md); 1171219974Smav md->mdo_softc = sc; 1172219974Smav geom = sc->sc_geom; 1173219974Smav } 1174219974Smav 1175265054Smav /* There is no return after this point, so we close passed consumer. */ 1176265054Smav g_access(cp, -1, 0, 0); 1177265054Smav 1178219974Smav rcp = g_new_consumer(geom); 1179256880Smav rcp->flags |= G_CF_DIRECT_RECEIVE; 1180219974Smav g_attach(rcp, pp); 1181219974Smav if (g_access(rcp, 1, 1, 1) != 0) 1182219974Smav ; //goto fail1; 1183219974Smav 1184219974Smav g_topology_unlock(); 1185219974Smav sx_xlock(&sc->sc_lock); 1186219974Smav 1187219974Smav pd = malloc(sizeof(*pd), M_MD_PROMISE, M_WAITOK | M_ZERO); 1188219974Smav pd->pd_subdisks = subdisks; 1189219974Smav for (i = 0; i < subdisks; i++) 1190219974Smav pd->pd_meta[i] = metaarr[i]; 1191219974Smav disk = g_raid_create_disk(sc); 1192219974Smav disk->d_md_data = (void *)pd; 1193219974Smav disk->d_consumer = rcp; 1194219974Smav rcp->private = disk; 1195219974Smav 1196242323Smav g_raid_get_disk_info(disk); 1197219974Smav 1198219974Smav g_raid_md_promise_new_disk(disk); 1199219974Smav 1200219974Smav sx_xunlock(&sc->sc_lock); 1201219974Smav g_topology_lock(); 1202219974Smav *gp = geom; 1203219974Smav return (result); 1204219974Smav} 1205219974Smav 1206219974Smavstatic int 1207219974Smavg_raid_md_event_promise(struct g_raid_md_object *md, 1208219974Smav struct g_raid_disk *disk, u_int event) 1209219974Smav{ 1210219974Smav struct g_raid_softc *sc; 1211219974Smav 1212219974Smav sc = md->mdo_softc; 1213219974Smav if (disk == NULL) 1214219974Smav return (-1); 1215219974Smav switch (event) { 1216219974Smav case G_RAID_DISK_E_DISCONNECTED: 1217219974Smav /* Delete disk. */ 1218219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_NONE); 1219219974Smav g_raid_destroy_disk(disk); 1220219974Smav g_raid_md_promise_purge_volumes(sc); 1221219974Smav 1222219974Smav /* Write updated metadata to all disks. */ 1223219974Smav g_raid_md_write_promise(md, NULL, NULL, NULL); 1224219974Smav 1225219974Smav /* Check if anything left. */ 1226219974Smav if (g_raid_ndisks(sc, -1) == 0) 1227219974Smav g_raid_destroy_node(sc, 0); 1228219974Smav else 1229219974Smav g_raid_md_promise_refill(sc); 1230219974Smav return (0); 1231219974Smav } 1232219974Smav return (-2); 1233219974Smav} 1234219974Smav 1235219974Smavstatic int 1236219974Smavg_raid_md_volume_event_promise(struct g_raid_md_object *md, 1237219974Smav struct g_raid_volume *vol, u_int event) 1238219974Smav{ 1239219974Smav struct g_raid_md_promise_pervolume *pv; 1240219974Smav 1241219974Smav pv = (struct g_raid_md_promise_pervolume *)vol->v_md_data; 1242219974Smav switch (event) { 1243219974Smav case G_RAID_VOLUME_E_STARTMD: 1244219974Smav if (!pv->pv_started) 1245219974Smav g_raid_md_promise_start(vol); 1246219974Smav return (0); 1247219974Smav } 1248219974Smav return (-2); 1249219974Smav} 1250219974Smav 1251219974Smavstatic int 1252219974Smavg_raid_md_ctl_promise(struct g_raid_md_object *md, 1253219974Smav struct gctl_req *req) 1254219974Smav{ 1255219974Smav struct g_raid_softc *sc; 1256219974Smav struct g_raid_volume *vol, *vol1; 1257219974Smav struct g_raid_subdisk *sd; 1258219974Smav struct g_raid_disk *disk, *disks[PROMISE_MAX_DISKS]; 1259219974Smav struct g_raid_md_promise_perdisk *pd; 1260219974Smav struct g_raid_md_promise_pervolume *pv; 1261219974Smav struct g_consumer *cp; 1262219974Smav struct g_provider *pp; 1263219974Smav char arg[16]; 1264241329Smav const char *nodename, *verb, *volname, *levelname, *diskname; 1265219974Smav char *tmp; 1266219974Smav int *nargs, *force; 1267245522Smav off_t esize, offs[PROMISE_MAX_DISKS], size, sectorsize, strip; 1268219974Smav intmax_t *sizearg, *striparg; 1269219974Smav int numdisks, i, len, level, qual; 1270219974Smav int error; 1271219974Smav 1272219974Smav sc = md->mdo_softc; 1273219974Smav verb = gctl_get_param(req, "verb", NULL); 1274219974Smav nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); 1275219974Smav error = 0; 1276219974Smav if (strcmp(verb, "label") == 0) { 1277219974Smav 1278219974Smav if (*nargs < 4) { 1279219974Smav gctl_error(req, "Invalid number of arguments."); 1280219974Smav return (-1); 1281219974Smav } 1282219974Smav volname = gctl_get_asciiparam(req, "arg1"); 1283219974Smav if (volname == NULL) { 1284219974Smav gctl_error(req, "No volume name."); 1285219974Smav return (-2); 1286219974Smav } 1287219974Smav levelname = gctl_get_asciiparam(req, "arg2"); 1288219974Smav if (levelname == NULL) { 1289219974Smav gctl_error(req, "No RAID level."); 1290219974Smav return (-3); 1291219974Smav } 1292234458Smav if (strcasecmp(levelname, "RAID5") == 0) 1293234727Smav levelname = "RAID5-LA"; 1294219974Smav if (g_raid_volume_str2level(levelname, &level, &qual)) { 1295219974Smav gctl_error(req, "Unknown RAID level '%s'.", levelname); 1296219974Smav return (-4); 1297219974Smav } 1298219974Smav numdisks = *nargs - 3; 1299219974Smav force = gctl_get_paraml(req, "force", sizeof(*force)); 1300219974Smav if (!g_raid_md_promise_supported(level, qual, numdisks, 1301219974Smav force ? *force : 0)) { 1302219974Smav gctl_error(req, "Unsupported RAID level " 1303219974Smav "(0x%02x/0x%02x), or number of disks (%d).", 1304219974Smav level, qual, numdisks); 1305219974Smav return (-5); 1306219974Smav } 1307219974Smav 1308219974Smav /* Search for disks, connect them and probe. */ 1309219974Smav size = INT64_MAX; 1310219974Smav sectorsize = 0; 1311219974Smav bzero(disks, sizeof(disks)); 1312219974Smav bzero(offs, sizeof(offs)); 1313219974Smav for (i = 0; i < numdisks; i++) { 1314219974Smav snprintf(arg, sizeof(arg), "arg%d", i + 3); 1315219974Smav diskname = gctl_get_asciiparam(req, arg); 1316219974Smav if (diskname == NULL) { 1317219974Smav gctl_error(req, "No disk name (%s).", arg); 1318219974Smav error = -6; 1319219974Smav break; 1320219974Smav } 1321219974Smav if (strcmp(diskname, "NONE") == 0) 1322219974Smav continue; 1323219974Smav 1324219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1325219974Smav if (disk->d_consumer != NULL && 1326219974Smav disk->d_consumer->provider != NULL && 1327219974Smav strcmp(disk->d_consumer->provider->name, 1328219974Smav diskname) == 0) 1329219974Smav break; 1330219974Smav } 1331219974Smav if (disk != NULL) { 1332219974Smav if (disk->d_state != G_RAID_DISK_S_ACTIVE) { 1333219974Smav gctl_error(req, "Disk '%s' is in a " 1334219974Smav "wrong state (%s).", diskname, 1335219974Smav g_raid_disk_state2str(disk->d_state)); 1336219974Smav error = -7; 1337219974Smav break; 1338219974Smav } 1339219974Smav pd = disk->d_md_data; 1340219974Smav if (pd->pd_subdisks >= PROMISE_MAX_SUBDISKS) { 1341219974Smav gctl_error(req, "Disk '%s' already " 1342219974Smav "used by %d volumes.", 1343219974Smav diskname, pd->pd_subdisks); 1344219974Smav error = -7; 1345219974Smav break; 1346219974Smav } 1347219974Smav pp = disk->d_consumer->provider; 1348219974Smav disks[i] = disk; 1349219974Smav promise_meta_unused_range(pd->pd_meta, 1350219974Smav pd->pd_subdisks, 1351219974Smav pp->mediasize / pp->sectorsize, 1352219974Smav &offs[i], &esize); 1353219974Smav size = MIN(size, (off_t)esize * pp->sectorsize); 1354219974Smav sectorsize = MAX(sectorsize, pp->sectorsize); 1355219974Smav continue; 1356219974Smav } 1357219974Smav 1358219974Smav g_topology_lock(); 1359219974Smav cp = g_raid_open_consumer(sc, diskname); 1360219974Smav if (cp == NULL) { 1361219974Smav gctl_error(req, "Can't open disk '%s'.", 1362219974Smav diskname); 1363219974Smav g_topology_unlock(); 1364219974Smav error = -8; 1365219974Smav break; 1366219974Smav } 1367219974Smav pp = cp->provider; 1368219974Smav pd = malloc(sizeof(*pd), M_MD_PROMISE, M_WAITOK | M_ZERO); 1369219974Smav disk = g_raid_create_disk(sc); 1370219974Smav disk->d_md_data = (void *)pd; 1371219974Smav disk->d_consumer = cp; 1372219974Smav disks[i] = disk; 1373219974Smav cp->private = disk; 1374219974Smav g_topology_unlock(); 1375219974Smav 1376242323Smav g_raid_get_disk_info(disk); 1377219974Smav 1378219974Smav /* Reserve some space for metadata. */ 1379219974Smav size = MIN(size, pp->mediasize - 131072llu * pp->sectorsize); 1380219974Smav sectorsize = MAX(sectorsize, pp->sectorsize); 1381219974Smav } 1382219974Smav if (error != 0) { 1383219974Smav for (i = 0; i < numdisks; i++) { 1384219974Smav if (disks[i] != NULL && 1385219974Smav disks[i]->d_state == G_RAID_DISK_S_NONE) 1386219974Smav g_raid_destroy_disk(disks[i]); 1387219974Smav } 1388219974Smav return (error); 1389219974Smav } 1390219974Smav 1391220210Smav if (sectorsize <= 0) { 1392220210Smav gctl_error(req, "Can't get sector size."); 1393220210Smav return (-8); 1394220210Smav } 1395220210Smav 1396219974Smav /* Handle size argument. */ 1397219974Smav len = sizeof(*sizearg); 1398219974Smav sizearg = gctl_get_param(req, "size", &len); 1399219974Smav if (sizearg != NULL && len == sizeof(*sizearg) && 1400219974Smav *sizearg > 0) { 1401219974Smav if (*sizearg > size) { 1402219974Smav gctl_error(req, "Size too big %lld > %lld.", 1403219974Smav (long long)*sizearg, (long long)size); 1404219974Smav return (-9); 1405219974Smav } 1406219974Smav size = *sizearg; 1407219974Smav } 1408219974Smav 1409219974Smav /* Handle strip argument. */ 1410219974Smav strip = 131072; 1411219974Smav len = sizeof(*striparg); 1412219974Smav striparg = gctl_get_param(req, "strip", &len); 1413219974Smav if (striparg != NULL && len == sizeof(*striparg) && 1414219974Smav *striparg > 0) { 1415219974Smav if (*striparg < sectorsize) { 1416219974Smav gctl_error(req, "Strip size too small."); 1417219974Smav return (-10); 1418219974Smav } 1419219974Smav if (*striparg % sectorsize != 0) { 1420219974Smav gctl_error(req, "Incorrect strip size."); 1421219974Smav return (-11); 1422219974Smav } 1423219974Smav strip = *striparg; 1424219974Smav } 1425219974Smav 1426219974Smav /* Round size down to strip or sector. */ 1427219974Smav if (level == G_RAID_VOLUME_RL_RAID1 || 1428219974Smav level == G_RAID_VOLUME_RL_SINGLE || 1429219974Smav level == G_RAID_VOLUME_RL_CONCAT) 1430219974Smav size -= (size % sectorsize); 1431219974Smav else if (level == G_RAID_VOLUME_RL_RAID1E && 1432219974Smav (numdisks & 1) != 0) 1433219974Smav size -= (size % (2 * strip)); 1434219974Smav else 1435219974Smav size -= (size % strip); 1436219974Smav if (size <= 0) { 1437219974Smav gctl_error(req, "Size too small."); 1438219974Smav return (-13); 1439219974Smav } 1440219974Smav 1441219974Smav /* We have all we need, create things: volume, ... */ 1442219974Smav pv = malloc(sizeof(*pv), M_MD_PROMISE, M_WAITOK | M_ZERO); 1443219974Smav arc4rand(&pv->pv_id, sizeof(pv->pv_id), 0); 1444219974Smav pv->pv_generation = 0; 1445219974Smav pv->pv_started = 1; 1446219974Smav vol = g_raid_create_volume(sc, volname, -1); 1447219974Smav vol->v_md_data = pv; 1448219974Smav vol->v_raid_level = level; 1449234458Smav vol->v_raid_level_qualifier = qual; 1450219974Smav vol->v_strip_size = strip; 1451219974Smav vol->v_disks_count = numdisks; 1452219974Smav if (level == G_RAID_VOLUME_RL_RAID0 || 1453219974Smav level == G_RAID_VOLUME_RL_CONCAT || 1454219974Smav level == G_RAID_VOLUME_RL_SINGLE) 1455219974Smav vol->v_mediasize = size * numdisks; 1456219974Smav else if (level == G_RAID_VOLUME_RL_RAID1) 1457219974Smav vol->v_mediasize = size; 1458219974Smav else if (level == G_RAID_VOLUME_RL_RAID3 || 1459219974Smav level == G_RAID_VOLUME_RL_RAID5) 1460219974Smav vol->v_mediasize = size * (numdisks - 1); 1461219974Smav else { /* RAID1E */ 1462219974Smav vol->v_mediasize = ((size * numdisks) / strip / 2) * 1463219974Smav strip; 1464219974Smav } 1465219974Smav vol->v_sectorsize = sectorsize; 1466219974Smav g_raid_start_volume(vol); 1467219974Smav 1468219974Smav /* , and subdisks. */ 1469219974Smav for (i = 0; i < numdisks; i++) { 1470219974Smav disk = disks[i]; 1471219974Smav sd = &vol->v_subdisks[i]; 1472219974Smav sd->sd_disk = disk; 1473219974Smav sd->sd_offset = (off_t)offs[i] * 512; 1474219974Smav sd->sd_size = size; 1475219974Smav if (disk == NULL) 1476219974Smav continue; 1477219974Smav TAILQ_INSERT_TAIL(&disk->d_subdisks, sd, sd_next); 1478219974Smav g_raid_change_disk_state(disk, 1479219974Smav G_RAID_DISK_S_ACTIVE); 1480219974Smav g_raid_change_subdisk_state(sd, 1481219974Smav G_RAID_SUBDISK_S_ACTIVE); 1482219974Smav g_raid_event_send(sd, G_RAID_SUBDISK_E_NEW, 1483219974Smav G_RAID_EVENT_SUBDISK); 1484219974Smav } 1485219974Smav 1486219974Smav /* Write metadata based on created entities. */ 1487219974Smav G_RAID_DEBUG1(0, sc, "Array started."); 1488219974Smav g_raid_md_write_promise(md, vol, NULL, NULL); 1489219974Smav 1490219974Smav /* Pickup any STALE/SPARE disks to refill array if needed. */ 1491219974Smav g_raid_md_promise_refill(sc); 1492219974Smav 1493219974Smav g_raid_event_send(vol, G_RAID_VOLUME_E_START, 1494219974Smav G_RAID_EVENT_VOLUME); 1495219974Smav return (0); 1496219974Smav } 1497219974Smav if (strcmp(verb, "add") == 0) { 1498219974Smav 1499219974Smav gctl_error(req, "`add` command is not applicable, " 1500219974Smav "use `label` instead."); 1501219974Smav return (-99); 1502219974Smav } 1503219974Smav if (strcmp(verb, "delete") == 0) { 1504219974Smav 1505241329Smav nodename = gctl_get_asciiparam(req, "arg0"); 1506241329Smav if (nodename != NULL && strcasecmp(sc->sc_name, nodename) != 0) 1507241329Smav nodename = NULL; 1508241329Smav 1509219974Smav /* Full node destruction. */ 1510241329Smav if (*nargs == 1 && nodename != NULL) { 1511219974Smav /* Check if some volume is still open. */ 1512219974Smav force = gctl_get_paraml(req, "force", sizeof(*force)); 1513219974Smav if (force != NULL && *force == 0 && 1514219974Smav g_raid_nopens(sc) != 0) { 1515219974Smav gctl_error(req, "Some volume is still open."); 1516219974Smav return (-4); 1517219974Smav } 1518219974Smav 1519219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1520219974Smav if (disk->d_consumer) 1521219974Smav promise_meta_erase(disk->d_consumer); 1522219974Smav } 1523219974Smav g_raid_destroy_node(sc, 0); 1524219974Smav return (0); 1525219974Smav } 1526219974Smav 1527219974Smav /* Destroy specified volume. If it was last - all node. */ 1528241329Smav if (*nargs > 2) { 1529219974Smav gctl_error(req, "Invalid number of arguments."); 1530219974Smav return (-1); 1531219974Smav } 1532241329Smav volname = gctl_get_asciiparam(req, 1533241329Smav nodename != NULL ? "arg1" : "arg0"); 1534219974Smav if (volname == NULL) { 1535219974Smav gctl_error(req, "No volume name."); 1536219974Smav return (-2); 1537219974Smav } 1538219974Smav 1539219974Smav /* Search for volume. */ 1540219974Smav TAILQ_FOREACH(vol, &sc->sc_volumes, v_next) { 1541219974Smav if (strcmp(vol->v_name, volname) == 0) 1542219974Smav break; 1543241329Smav pp = vol->v_provider; 1544241329Smav if (pp == NULL) 1545241329Smav continue; 1546241329Smav if (strcmp(pp->name, volname) == 0) 1547241329Smav break; 1548241329Smav if (strncmp(pp->name, "raid/", 5) == 0 && 1549241329Smav strcmp(pp->name + 5, volname) == 0) 1550241329Smav break; 1551219974Smav } 1552219974Smav if (vol == NULL) { 1553219974Smav i = strtol(volname, &tmp, 10); 1554219974Smav if (verb != volname && tmp[0] == 0) { 1555219974Smav TAILQ_FOREACH(vol, &sc->sc_volumes, v_next) { 1556219974Smav if (vol->v_global_id == i) 1557219974Smav break; 1558219974Smav } 1559219974Smav } 1560219974Smav } 1561219974Smav if (vol == NULL) { 1562219974Smav gctl_error(req, "Volume '%s' not found.", volname); 1563219974Smav return (-3); 1564219974Smav } 1565219974Smav 1566219974Smav /* Check if volume is still open. */ 1567219974Smav force = gctl_get_paraml(req, "force", sizeof(*force)); 1568219974Smav if (force != NULL && *force == 0 && 1569219974Smav vol->v_provider_open != 0) { 1570219974Smav gctl_error(req, "Volume is still open."); 1571219974Smav return (-4); 1572219974Smav } 1573219974Smav 1574219974Smav /* Destroy volume and potentially node. */ 1575219974Smav i = 0; 1576219974Smav TAILQ_FOREACH(vol1, &sc->sc_volumes, v_next) 1577219974Smav i++; 1578219974Smav if (i >= 2) { 1579219974Smav g_raid_destroy_volume(vol); 1580219974Smav g_raid_md_promise_purge_disks(sc); 1581219974Smav g_raid_md_write_promise(md, NULL, NULL, NULL); 1582219974Smav } else { 1583219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1584219974Smav if (disk->d_consumer) 1585219974Smav promise_meta_erase(disk->d_consumer); 1586219974Smav } 1587219974Smav g_raid_destroy_node(sc, 0); 1588219974Smav } 1589219974Smav return (0); 1590219974Smav } 1591219974Smav if (strcmp(verb, "remove") == 0 || 1592219974Smav strcmp(verb, "fail") == 0) { 1593219974Smav if (*nargs < 2) { 1594219974Smav gctl_error(req, "Invalid number of arguments."); 1595219974Smav return (-1); 1596219974Smav } 1597219974Smav for (i = 1; i < *nargs; i++) { 1598219974Smav snprintf(arg, sizeof(arg), "arg%d", i); 1599219974Smav diskname = gctl_get_asciiparam(req, arg); 1600219974Smav if (diskname == NULL) { 1601219974Smav gctl_error(req, "No disk name (%s).", arg); 1602219974Smav error = -2; 1603219974Smav break; 1604219974Smav } 1605219974Smav if (strncmp(diskname, "/dev/", 5) == 0) 1606219974Smav diskname += 5; 1607219974Smav 1608219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1609219974Smav if (disk->d_consumer != NULL && 1610219974Smav disk->d_consumer->provider != NULL && 1611219974Smav strcmp(disk->d_consumer->provider->name, 1612219974Smav diskname) == 0) 1613219974Smav break; 1614219974Smav } 1615219974Smav if (disk == NULL) { 1616219974Smav gctl_error(req, "Disk '%s' not found.", 1617219974Smav diskname); 1618219974Smav error = -3; 1619219974Smav break; 1620219974Smav } 1621219974Smav 1622219974Smav if (strcmp(verb, "fail") == 0) { 1623219974Smav g_raid_md_fail_disk_promise(md, NULL, disk); 1624219974Smav continue; 1625219974Smav } 1626219974Smav 1627219974Smav /* Erase metadata on deleting disk and destroy it. */ 1628219974Smav promise_meta_erase(disk->d_consumer); 1629219974Smav g_raid_destroy_disk(disk); 1630219974Smav } 1631219974Smav g_raid_md_promise_purge_volumes(sc); 1632219974Smav 1633219974Smav /* Write updated metadata to remaining disks. */ 1634219974Smav g_raid_md_write_promise(md, NULL, NULL, NULL); 1635219974Smav 1636219974Smav /* Check if anything left. */ 1637219974Smav if (g_raid_ndisks(sc, -1) == 0) 1638219974Smav g_raid_destroy_node(sc, 0); 1639219974Smav else 1640219974Smav g_raid_md_promise_refill(sc); 1641219974Smav return (error); 1642219974Smav } 1643219974Smav if (strcmp(verb, "insert") == 0) { 1644219974Smav if (*nargs < 2) { 1645219974Smav gctl_error(req, "Invalid number of arguments."); 1646219974Smav return (-1); 1647219974Smav } 1648219974Smav for (i = 1; i < *nargs; i++) { 1649219974Smav /* Get disk name. */ 1650219974Smav snprintf(arg, sizeof(arg), "arg%d", i); 1651219974Smav diskname = gctl_get_asciiparam(req, arg); 1652219974Smav if (diskname == NULL) { 1653219974Smav gctl_error(req, "No disk name (%s).", arg); 1654219974Smav error = -3; 1655219974Smav break; 1656219974Smav } 1657219974Smav 1658219974Smav /* Try to find provider with specified name. */ 1659219974Smav g_topology_lock(); 1660219974Smav cp = g_raid_open_consumer(sc, diskname); 1661219974Smav if (cp == NULL) { 1662219974Smav gctl_error(req, "Can't open disk '%s'.", 1663219974Smav diskname); 1664219974Smav g_topology_unlock(); 1665219974Smav error = -4; 1666219974Smav break; 1667219974Smav } 1668226816Smav pp = cp->provider; 1669219974Smav g_topology_unlock(); 1670219974Smav 1671219974Smav pd = malloc(sizeof(*pd), M_MD_PROMISE, M_WAITOK | M_ZERO); 1672219974Smav 1673219974Smav disk = g_raid_create_disk(sc); 1674219974Smav disk->d_consumer = cp; 1675219974Smav disk->d_md_data = (void *)pd; 1676219974Smav cp->private = disk; 1677219974Smav 1678242323Smav g_raid_get_disk_info(disk); 1679219974Smav 1680219974Smav /* Welcome the "new" disk. */ 1681219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_SPARE); 1682219974Smav promise_meta_write_spare(cp); 1683219974Smav g_raid_md_promise_refill(sc); 1684219974Smav } 1685219974Smav return (error); 1686219974Smav } 1687219974Smav return (-100); 1688219974Smav} 1689219974Smav 1690219974Smavstatic int 1691219974Smavg_raid_md_write_promise(struct g_raid_md_object *md, struct g_raid_volume *tvol, 1692219974Smav struct g_raid_subdisk *tsd, struct g_raid_disk *tdisk) 1693219974Smav{ 1694219974Smav struct g_raid_softc *sc; 1695219974Smav struct g_raid_volume *vol; 1696219974Smav struct g_raid_subdisk *sd; 1697219974Smav struct g_raid_disk *disk; 1698219974Smav struct g_raid_md_promise_perdisk *pd; 1699219974Smav struct g_raid_md_promise_pervolume *pv; 1700219974Smav struct promise_raid_conf *meta; 1701219974Smav off_t rebuild_lba64; 1702219974Smav int i, j, pos, rebuild; 1703219974Smav 1704219974Smav sc = md->mdo_softc; 1705219974Smav 1706219974Smav if (sc->sc_stopping == G_RAID_DESTROY_HARD) 1707219974Smav return (0); 1708219974Smav 1709219974Smav /* Generate new per-volume metadata for affected volumes. */ 1710219974Smav TAILQ_FOREACH(vol, &sc->sc_volumes, v_next) { 1711219974Smav if (vol->v_stopping) 1712219974Smav continue; 1713219974Smav 1714219974Smav /* Skip volumes not related to specified targets. */ 1715219974Smav if (tvol != NULL && vol != tvol) 1716219974Smav continue; 1717219974Smav if (tsd != NULL && vol != tsd->sd_volume) 1718219974Smav continue; 1719219974Smav if (tdisk != NULL) { 1720219974Smav for (i = 0; i < vol->v_disks_count; i++) { 1721219974Smav if (vol->v_subdisks[i].sd_disk == tdisk) 1722219974Smav break; 1723219974Smav } 1724219974Smav if (i >= vol->v_disks_count) 1725219974Smav continue; 1726219974Smav } 1727219974Smav 1728219974Smav pv = (struct g_raid_md_promise_pervolume *)vol->v_md_data; 1729219974Smav pv->pv_generation++; 1730219974Smav 1731219974Smav meta = malloc(sizeof(*meta), M_MD_PROMISE, M_WAITOK | M_ZERO); 1732219974Smav if (pv->pv_meta != NULL) 1733219974Smav memcpy(meta, pv->pv_meta, sizeof(*meta)); 1734220209Smav memcpy(meta->promise_id, PROMISE_MAGIC, 1735220209Smav sizeof(PROMISE_MAGIC) - 1); 1736219974Smav meta->dummy_0 = 0x00020000; 1737219974Smav meta->integrity = PROMISE_I_VALID; 1738219974Smav 1739219974Smav meta->generation = pv->pv_generation; 1740219974Smav meta->status = PROMISE_S_VALID | PROMISE_S_ONLINE | 1741219974Smav PROMISE_S_INITED | PROMISE_S_READY; 1742219974Smav if (vol->v_state <= G_RAID_VOLUME_S_DEGRADED) 1743219974Smav meta->status |= PROMISE_S_DEGRADED; 1744219974Smav if (vol->v_dirty) 1745219974Smav meta->status |= PROMISE_S_MARKED; /* XXX: INVENTED! */ 1746219974Smav if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID0 || 1747219974Smav vol->v_raid_level == G_RAID_VOLUME_RL_SINGLE) 1748219974Smav meta->type = PROMISE_T_RAID0; 1749219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID1 || 1750219974Smav vol->v_raid_level == G_RAID_VOLUME_RL_RAID1E) 1751219974Smav meta->type = PROMISE_T_RAID1; 1752219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID3) 1753219974Smav meta->type = PROMISE_T_RAID3; 1754219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID5) 1755219974Smav meta->type = PROMISE_T_RAID5; 1756219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_CONCAT) 1757219974Smav meta->type = PROMISE_T_SPAN; 1758219974Smav else 1759219974Smav meta->type = PROMISE_T_JBOD; 1760219974Smav meta->total_disks = vol->v_disks_count; 1761219974Smav meta->stripe_shift = ffs(vol->v_strip_size / 1024); 1762219974Smav meta->array_width = vol->v_disks_count; 1763219974Smav if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID1 || 1764219974Smav vol->v_raid_level == G_RAID_VOLUME_RL_RAID1E) 1765219974Smav meta->array_width /= 2; 1766219974Smav meta->array_number = vol->v_global_id; 1767245522Smav meta->total_sectors = vol->v_mediasize / 512; 1768245522Smav meta->total_sectors_high = (vol->v_mediasize / 512) >> 32; 1769245522Smav meta->sector_size = vol->v_sectorsize / 512; 1770219974Smav meta->cylinders = meta->total_sectors / (255 * 63) - 1; 1771219974Smav meta->heads = 254; 1772219974Smav meta->sectors = 63; 1773219974Smav meta->volume_id = pv->pv_id; 1774219974Smav rebuild_lba64 = UINT64_MAX; 1775219974Smav rebuild = 0; 1776219974Smav for (i = 0; i < vol->v_disks_count; i++) { 1777219974Smav sd = &vol->v_subdisks[i]; 1778219974Smav /* For RAID0+1 we need to translate order. */ 1779219974Smav pos = promise_meta_translate_disk(vol, i); 1780219974Smav meta->disks[pos].flags = PROMISE_F_VALID | 1781219974Smav PROMISE_F_ASSIGNED; 1782219974Smav if (sd->sd_state == G_RAID_SUBDISK_S_NONE) { 1783219974Smav meta->disks[pos].flags |= 0; 1784219974Smav } else if (sd->sd_state == G_RAID_SUBDISK_S_FAILED) { 1785219974Smav meta->disks[pos].flags |= 1786219974Smav PROMISE_F_DOWN | PROMISE_F_REDIR; 1787219974Smav } else if (sd->sd_state <= G_RAID_SUBDISK_S_REBUILD) { 1788219974Smav meta->disks[pos].flags |= 1789219974Smav PROMISE_F_ONLINE | PROMISE_F_REDIR; 1790219974Smav if (sd->sd_state == G_RAID_SUBDISK_S_REBUILD) { 1791219974Smav rebuild_lba64 = MIN(rebuild_lba64, 1792219974Smav sd->sd_rebuild_pos / 512); 1793219974Smav } else 1794219974Smav rebuild_lba64 = 0; 1795219974Smav rebuild = 1; 1796219974Smav } else { 1797219974Smav meta->disks[pos].flags |= PROMISE_F_ONLINE; 1798219974Smav if (sd->sd_state < G_RAID_SUBDISK_S_ACTIVE) { 1799219974Smav meta->status |= PROMISE_S_MARKED; 1800219974Smav if (sd->sd_state == G_RAID_SUBDISK_S_RESYNC) { 1801219974Smav rebuild_lba64 = MIN(rebuild_lba64, 1802219974Smav sd->sd_rebuild_pos / 512); 1803219974Smav } else 1804219974Smav rebuild_lba64 = 0; 1805219974Smav } 1806219974Smav } 1807219974Smav if (pv->pv_meta != NULL) { 1808219974Smav meta->disks[pos].id = pv->pv_meta->disks[pos].id; 1809219974Smav } else { 1810219974Smav meta->disks[pos].number = i * 2; 1811219974Smav arc4rand(&meta->disks[pos].id, 1812219974Smav sizeof(meta->disks[pos].id), 0); 1813219974Smav } 1814219974Smav } 1815219974Smav promise_meta_put_name(meta, vol->v_name); 1816219974Smav 1817219974Smav /* Try to mimic AMD BIOS rebuild/resync behavior. */ 1818219974Smav if (rebuild_lba64 != UINT64_MAX) { 1819219974Smav if (rebuild) 1820219974Smav meta->magic_3 = 0x03040010UL; /* Rebuild? */ 1821219974Smav else 1822219974Smav meta->magic_3 = 0x03040008UL; /* Resync? */ 1823219974Smav /* Translate from per-disk to per-volume LBA. */ 1824219974Smav if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID1 || 1825219974Smav vol->v_raid_level == G_RAID_VOLUME_RL_RAID1E) { 1826219974Smav rebuild_lba64 *= meta->array_width; 1827219974Smav } else if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID3 || 1828219974Smav vol->v_raid_level == G_RAID_VOLUME_RL_RAID5) { 1829219974Smav rebuild_lba64 *= meta->array_width - 1; 1830219974Smav } else 1831219974Smav rebuild_lba64 = 0; 1832219974Smav } else 1833219974Smav meta->magic_3 = 0x03000000UL; 1834219974Smav meta->rebuild_lba64 = rebuild_lba64; 1835219974Smav meta->magic_4 = 0x04010101UL; 1836219974Smav 1837219974Smav /* Replace per-volume metadata with new. */ 1838219974Smav if (pv->pv_meta != NULL) 1839219974Smav free(pv->pv_meta, M_MD_PROMISE); 1840219974Smav pv->pv_meta = meta; 1841219974Smav 1842219974Smav /* Copy new metadata to the disks, adding or replacing old. */ 1843219974Smav for (i = 0; i < vol->v_disks_count; i++) { 1844219974Smav sd = &vol->v_subdisks[i]; 1845219974Smav disk = sd->sd_disk; 1846219974Smav if (disk == NULL) 1847219974Smav continue; 1848219974Smav /* For RAID0+1 we need to translate order. */ 1849219974Smav pos = promise_meta_translate_disk(vol, i); 1850219974Smav pd = (struct g_raid_md_promise_perdisk *)disk->d_md_data; 1851219974Smav for (j = 0; j < pd->pd_subdisks; j++) { 1852219974Smav if (pd->pd_meta[j]->volume_id == meta->volume_id) 1853219974Smav break; 1854219974Smav } 1855219974Smav if (j == pd->pd_subdisks) 1856219974Smav pd->pd_subdisks++; 1857219974Smav if (pd->pd_meta[j] != NULL) 1858219974Smav free(pd->pd_meta[j], M_MD_PROMISE); 1859219974Smav pd->pd_meta[j] = promise_meta_copy(meta); 1860219974Smav pd->pd_meta[j]->disk = meta->disks[pos]; 1861219974Smav pd->pd_meta[j]->disk.number = pos; 1862245522Smav pd->pd_meta[j]->disk_offset_high = 1863245522Smav (sd->sd_offset / 512) >> 32; 1864219974Smav pd->pd_meta[j]->disk_offset = sd->sd_offset / 512; 1865245522Smav pd->pd_meta[j]->disk_sectors_high = 1866245522Smav (sd->sd_size / 512) >> 32; 1867219974Smav pd->pd_meta[j]->disk_sectors = sd->sd_size / 512; 1868219974Smav if (sd->sd_state == G_RAID_SUBDISK_S_REBUILD) { 1869245522Smav pd->pd_meta[j]->disk_rebuild_high = 1870245522Smav (sd->sd_rebuild_pos / 512) >> 32; 1871245522Smav pd->pd_meta[j]->disk_rebuild = 1872219974Smav sd->sd_rebuild_pos / 512; 1873245522Smav } else if (sd->sd_state < G_RAID_SUBDISK_S_REBUILD) { 1874245522Smav pd->pd_meta[j]->disk_rebuild_high = 0; 1875245522Smav pd->pd_meta[j]->disk_rebuild = 0; 1876245522Smav } else { 1877245522Smav pd->pd_meta[j]->disk_rebuild_high = UINT32_MAX; 1878245522Smav pd->pd_meta[j]->disk_rebuild = UINT32_MAX; 1879245522Smav } 1880219974Smav pd->pd_updated = 1; 1881219974Smav } 1882219974Smav } 1883219974Smav 1884219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1885219974Smav pd = (struct g_raid_md_promise_perdisk *)disk->d_md_data; 1886219974Smav if (disk->d_state != G_RAID_DISK_S_ACTIVE) 1887219974Smav continue; 1888219974Smav if (!pd->pd_updated) 1889219974Smav continue; 1890219974Smav G_RAID_DEBUG(1, "Writing Promise metadata to %s", 1891219974Smav g_raid_get_diskname(disk)); 1892219974Smav for (i = 0; i < pd->pd_subdisks; i++) 1893219974Smav g_raid_md_promise_print(pd->pd_meta[i]); 1894219974Smav promise_meta_write(disk->d_consumer, 1895219974Smav pd->pd_meta, pd->pd_subdisks); 1896219974Smav pd->pd_updated = 0; 1897219974Smav } 1898219974Smav 1899219974Smav return (0); 1900219974Smav} 1901219974Smav 1902219974Smavstatic int 1903219974Smavg_raid_md_fail_disk_promise(struct g_raid_md_object *md, 1904219974Smav struct g_raid_subdisk *tsd, struct g_raid_disk *tdisk) 1905219974Smav{ 1906219974Smav struct g_raid_softc *sc; 1907219974Smav struct g_raid_md_promise_perdisk *pd; 1908219974Smav struct g_raid_subdisk *sd; 1909219974Smav int i, pos; 1910219974Smav 1911219974Smav sc = md->mdo_softc; 1912219974Smav pd = (struct g_raid_md_promise_perdisk *)tdisk->d_md_data; 1913219974Smav 1914219974Smav /* We can't fail disk that is not a part of array now. */ 1915219974Smav if (tdisk->d_state != G_RAID_DISK_S_ACTIVE) 1916219974Smav return (-1); 1917219974Smav 1918219974Smav /* 1919219974Smav * Mark disk as failed in metadata and try to write that metadata 1920219974Smav * to the disk itself to prevent it's later resurrection as STALE. 1921219974Smav */ 1922219974Smav if (pd->pd_subdisks > 0 && tdisk->d_consumer != NULL) 1923219974Smav G_RAID_DEBUG(1, "Writing Promise metadata to %s", 1924219974Smav g_raid_get_diskname(tdisk)); 1925219974Smav for (i = 0; i < pd->pd_subdisks; i++) { 1926219974Smav pd->pd_meta[i]->disk.flags |= 1927219974Smav PROMISE_F_DOWN | PROMISE_F_REDIR; 1928219974Smav pos = pd->pd_meta[i]->disk.number; 1929219974Smav if (pos >= 0 && pos < PROMISE_MAX_DISKS) { 1930219974Smav pd->pd_meta[i]->disks[pos].flags |= 1931219974Smav PROMISE_F_DOWN | PROMISE_F_REDIR; 1932219974Smav } 1933219974Smav g_raid_md_promise_print(pd->pd_meta[i]); 1934219974Smav } 1935219974Smav if (tdisk->d_consumer != NULL) 1936219974Smav promise_meta_write(tdisk->d_consumer, 1937219974Smav pd->pd_meta, pd->pd_subdisks); 1938219974Smav 1939219974Smav /* Change states. */ 1940219974Smav g_raid_change_disk_state(tdisk, G_RAID_DISK_S_FAILED); 1941219974Smav TAILQ_FOREACH(sd, &tdisk->d_subdisks, sd_next) { 1942219974Smav g_raid_change_subdisk_state(sd, 1943219974Smav G_RAID_SUBDISK_S_FAILED); 1944219974Smav g_raid_event_send(sd, G_RAID_SUBDISK_E_FAILED, 1945219974Smav G_RAID_EVENT_SUBDISK); 1946219974Smav } 1947219974Smav 1948219974Smav /* Write updated metadata to remaining disks. */ 1949219974Smav g_raid_md_write_promise(md, NULL, NULL, tdisk); 1950219974Smav 1951219974Smav g_raid_md_promise_refill(sc); 1952219974Smav return (0); 1953219974Smav} 1954219974Smav 1955219974Smavstatic int 1956219974Smavg_raid_md_free_disk_promise(struct g_raid_md_object *md, 1957219974Smav struct g_raid_disk *disk) 1958219974Smav{ 1959219974Smav struct g_raid_md_promise_perdisk *pd; 1960219974Smav int i; 1961219974Smav 1962219974Smav pd = (struct g_raid_md_promise_perdisk *)disk->d_md_data; 1963219974Smav for (i = 0; i < pd->pd_subdisks; i++) { 1964219974Smav if (pd->pd_meta[i] != NULL) { 1965219974Smav free(pd->pd_meta[i], M_MD_PROMISE); 1966219974Smav pd->pd_meta[i] = NULL; 1967219974Smav } 1968219974Smav } 1969219974Smav free(pd, M_MD_PROMISE); 1970219974Smav disk->d_md_data = NULL; 1971219974Smav return (0); 1972219974Smav} 1973219974Smav 1974219974Smavstatic int 1975219974Smavg_raid_md_free_volume_promise(struct g_raid_md_object *md, 1976219974Smav struct g_raid_volume *vol) 1977219974Smav{ 1978219974Smav struct g_raid_md_promise_pervolume *pv; 1979219974Smav 1980219974Smav pv = (struct g_raid_md_promise_pervolume *)vol->v_md_data; 1981219974Smav if (pv && pv->pv_meta != NULL) { 1982219974Smav free(pv->pv_meta, M_MD_PROMISE); 1983219974Smav pv->pv_meta = NULL; 1984219974Smav } 1985219974Smav if (pv && !pv->pv_started) { 1986219974Smav pv->pv_started = 1; 1987219974Smav callout_stop(&pv->pv_start_co); 1988219974Smav } 1989235080Smav free(pv, M_MD_PROMISE); 1990235080Smav vol->v_md_data = NULL; 1991219974Smav return (0); 1992219974Smav} 1993219974Smav 1994219974Smavstatic int 1995219974Smavg_raid_md_free_promise(struct g_raid_md_object *md) 1996219974Smav{ 1997219974Smav 1998219974Smav return (0); 1999219974Smav} 2000219974Smav 2001240465SmavG_RAID_MD_DECLARE(promise, "Promise"); 2002