1219974Smav/*- 2219974Smav * Copyright (c) 2011 Alexander Motin <mav@FreeBSD.org> 3235092Smav * Copyright (c) 2000 - 2008 S��ren Schmidt <sos@FreeBSD.org> 4219974Smav * All rights reserved. 5219974Smav * 6219974Smav * Redistribution and use in source and binary forms, with or without 7219974Smav * modification, are permitted provided that the following conditions 8219974Smav * are met: 9219974Smav * 1. Redistributions of source code must retain the above copyright 10219974Smav * notice, this list of conditions and the following disclaimer. 11219974Smav * 2. Redistributions in binary form must reproduce the above copyright 12219974Smav * notice, this list of conditions and the following disclaimer in the 13219974Smav * documentation and/or other materials provided with the distribution. 14219974Smav * 15219974Smav * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND 16219974Smav * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 17219974Smav * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 18219974Smav * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE 19219974Smav * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 20219974Smav * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 21219974Smav * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 22219974Smav * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 23219974Smav * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 24219974Smav * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 25219974Smav * SUCH DAMAGE. 26219974Smav */ 27219974Smav 28219974Smav#include <sys/cdefs.h> 29219974Smav__FBSDID("$FreeBSD$"); 30219974Smav 31219974Smav#include <sys/param.h> 32219974Smav#include <sys/bio.h> 33219974Smav#include <sys/endian.h> 34219974Smav#include <sys/kernel.h> 35219974Smav#include <sys/kobj.h> 36219974Smav#include <sys/limits.h> 37219974Smav#include <sys/lock.h> 38219974Smav#include <sys/malloc.h> 39219974Smav#include <sys/mutex.h> 40219974Smav#include <sys/systm.h> 41219974Smav#include <sys/taskqueue.h> 42219974Smav#include <geom/geom.h> 43219974Smav#include "geom/raid/g_raid.h" 44219974Smav#include "g_raid_md_if.h" 45219974Smav 46219974Smavstatic MALLOC_DEFINE(M_MD_NVIDIA, "md_nvidia_data", "GEOM_RAID NVIDIA metadata"); 47219974Smav 48219974Smavstruct nvidia_raid_conf { 49219974Smav uint8_t nvidia_id[8]; 50219974Smav#define NVIDIA_MAGIC "NVIDIA " 51219974Smav 52219974Smav uint32_t config_size; 53219974Smav uint32_t checksum; 54219974Smav uint16_t version; 55219974Smav uint8_t disk_number; 56219974Smav uint8_t dummy_0; 57219974Smav uint32_t total_sectors; 58219974Smav uint32_t sector_size; 59219974Smav uint8_t name[16]; 60219974Smav uint8_t revision[4]; 61219974Smav uint32_t disk_status; 62219974Smav 63219974Smav uint32_t magic_0; 64219974Smav#define NVIDIA_MAGIC0 0x00640044 65219974Smav 66219974Smav uint64_t volume_id[2]; 67219974Smav uint8_t state; 68219974Smav#define NVIDIA_S_IDLE 0 69219974Smav#define NVIDIA_S_INIT 2 70219974Smav#define NVIDIA_S_REBUILD 3 71219974Smav#define NVIDIA_S_UPGRADE 4 72219974Smav#define NVIDIA_S_SYNC 5 73219974Smav uint8_t array_width; 74219974Smav uint8_t total_disks; 75219974Smav uint8_t orig_array_width; 76219974Smav uint16_t type; 77219974Smav#define NVIDIA_T_RAID0 0x0080 78219974Smav#define NVIDIA_T_RAID1 0x0081 79219974Smav#define NVIDIA_T_RAID3 0x0083 80219974Smav#define NVIDIA_T_RAID5 0x0085 /* RLQ = 00/02? */ 81219974Smav#define NVIDIA_T_RAID5_SYM 0x0095 /* RLQ = 03 */ 82219974Smav#define NVIDIA_T_RAID10 0x008a 83219974Smav#define NVIDIA_T_RAID01 0x8180 84219974Smav#define NVIDIA_T_CONCAT 0x00ff 85219974Smav 86219974Smav uint16_t dummy_3; 87219974Smav uint32_t strip_sectors; 88219974Smav uint32_t strip_bytes; 89219974Smav uint32_t strip_shift; 90219974Smav uint32_t strip_mask; 91219974Smav uint32_t stripe_sectors; 92219974Smav uint32_t stripe_bytes; 93219974Smav uint32_t rebuild_lba; 94219974Smav uint32_t orig_type; 95219974Smav uint32_t orig_total_sectors; 96219974Smav uint32_t status; 97219974Smav#define NVIDIA_S_BOOTABLE 0x00000001 98219974Smav#define NVIDIA_S_DEGRADED 0x00000002 99219974Smav 100219974Smav uint32_t filler[98]; 101219974Smav} __packed; 102219974Smav 103219974Smavstruct g_raid_md_nvidia_perdisk { 104219974Smav struct nvidia_raid_conf *pd_meta; 105219974Smav int pd_disk_pos; 106219974Smav off_t pd_disk_size; 107219974Smav}; 108219974Smav 109219974Smavstruct g_raid_md_nvidia_object { 110219974Smav struct g_raid_md_object mdio_base; 111219974Smav uint64_t mdio_volume_id[2]; 112219974Smav struct nvidia_raid_conf *mdio_meta; 113219974Smav struct callout mdio_start_co; /* STARTING state timer. */ 114219974Smav int mdio_total_disks; 115219974Smav int mdio_disks_present; 116219974Smav int mdio_started; 117219974Smav int mdio_incomplete; 118219974Smav struct root_hold_token *mdio_rootmount; /* Root mount delay token. */ 119219974Smav}; 120219974Smav 121219974Smavstatic g_raid_md_create_t g_raid_md_create_nvidia; 122219974Smavstatic g_raid_md_taste_t g_raid_md_taste_nvidia; 123219974Smavstatic g_raid_md_event_t g_raid_md_event_nvidia; 124219974Smavstatic g_raid_md_ctl_t g_raid_md_ctl_nvidia; 125219974Smavstatic g_raid_md_write_t g_raid_md_write_nvidia; 126219974Smavstatic g_raid_md_fail_disk_t g_raid_md_fail_disk_nvidia; 127219974Smavstatic g_raid_md_free_disk_t g_raid_md_free_disk_nvidia; 128219974Smavstatic g_raid_md_free_t g_raid_md_free_nvidia; 129219974Smav 130219974Smavstatic kobj_method_t g_raid_md_nvidia_methods[] = { 131219974Smav KOBJMETHOD(g_raid_md_create, g_raid_md_create_nvidia), 132219974Smav KOBJMETHOD(g_raid_md_taste, g_raid_md_taste_nvidia), 133219974Smav KOBJMETHOD(g_raid_md_event, g_raid_md_event_nvidia), 134219974Smav KOBJMETHOD(g_raid_md_ctl, g_raid_md_ctl_nvidia), 135219974Smav KOBJMETHOD(g_raid_md_write, g_raid_md_write_nvidia), 136219974Smav KOBJMETHOD(g_raid_md_fail_disk, g_raid_md_fail_disk_nvidia), 137219974Smav KOBJMETHOD(g_raid_md_free_disk, g_raid_md_free_disk_nvidia), 138219974Smav KOBJMETHOD(g_raid_md_free, g_raid_md_free_nvidia), 139219974Smav { 0, 0 } 140219974Smav}; 141219974Smav 142219974Smavstatic struct g_raid_md_class g_raid_md_nvidia_class = { 143219974Smav "NVIDIA", 144219974Smav g_raid_md_nvidia_methods, 145219974Smav sizeof(struct g_raid_md_nvidia_object), 146240552Smav .mdc_enable = 1, 147219974Smav .mdc_priority = 100 148219974Smav}; 149219974Smav 150219974Smavstatic int NVIDIANodeID = 1; 151219974Smav 152219974Smavstatic void 153219974Smavg_raid_md_nvidia_print(struct nvidia_raid_conf *meta) 154219974Smav{ 155219974Smav 156219974Smav if (g_raid_debug < 1) 157219974Smav return; 158219974Smav 159219974Smav printf("********* ATA NVIDIA RAID Metadata *********\n"); 160219974Smav printf("nvidia_id <%.8s>\n", meta->nvidia_id); 161219974Smav printf("config_size %u\n", meta->config_size); 162219974Smav printf("checksum 0x%08x\n", meta->checksum); 163219974Smav printf("version 0x%04x\n", meta->version); 164219974Smav printf("disk_number %d\n", meta->disk_number); 165219974Smav printf("dummy_0 0x%02x\n", meta->dummy_0); 166219974Smav printf("total_sectors %u\n", meta->total_sectors); 167219974Smav printf("sector_size %u\n", meta->sector_size); 168219974Smav printf("name <%.16s>\n", meta->name); 169219974Smav printf("revision 0x%02x%02x%02x%02x\n", 170219974Smav meta->revision[0], meta->revision[1], 171219974Smav meta->revision[2], meta->revision[3]); 172219974Smav printf("disk_status 0x%08x\n", meta->disk_status); 173219974Smav printf("magic_0 0x%08x\n", meta->magic_0); 174219974Smav printf("volume_id 0x%016jx%016jx\n", 175219974Smav meta->volume_id[1], meta->volume_id[0]); 176219974Smav printf("state 0x%02x\n", meta->state); 177219974Smav printf("array_width %u\n", meta->array_width); 178219974Smav printf("total_disks %u\n", meta->total_disks); 179219974Smav printf("orig_array_width %u\n", meta->orig_array_width); 180219974Smav printf("type 0x%04x\n", meta->type); 181219974Smav printf("dummy_3 0x%04x\n", meta->dummy_3); 182219974Smav printf("strip_sectors %u\n", meta->strip_sectors); 183219974Smav printf("strip_bytes %u\n", meta->strip_bytes); 184219974Smav printf("strip_shift %u\n", meta->strip_shift); 185219974Smav printf("strip_mask 0x%08x\n", meta->strip_mask); 186219974Smav printf("stripe_sectors %u\n", meta->stripe_sectors); 187219974Smav printf("stripe_bytes %u\n", meta->stripe_bytes); 188219974Smav printf("rebuild_lba %u\n", meta->rebuild_lba); 189219974Smav printf("orig_type 0x%04x\n", meta->orig_type); 190219974Smav printf("orig_total_sectors %u\n", meta->orig_total_sectors); 191219974Smav printf("status 0x%08x\n", meta->status); 192219974Smav printf("=================================================\n"); 193219974Smav} 194219974Smav 195219974Smavstatic struct nvidia_raid_conf * 196219974Smavnvidia_meta_copy(struct nvidia_raid_conf *meta) 197219974Smav{ 198219974Smav struct nvidia_raid_conf *nmeta; 199219974Smav 200219974Smav nmeta = malloc(sizeof(*meta), M_MD_NVIDIA, M_WAITOK); 201219974Smav memcpy(nmeta, meta, sizeof(*meta)); 202219974Smav return (nmeta); 203219974Smav} 204219974Smav 205219974Smavstatic int 206219974Smavnvidia_meta_translate_disk(struct nvidia_raid_conf *meta, int md_disk_pos) 207219974Smav{ 208219974Smav int disk_pos; 209219974Smav 210219974Smav if (md_disk_pos >= 0 && meta->type == NVIDIA_T_RAID01) { 211219974Smav disk_pos = (md_disk_pos / meta->array_width) + 212219974Smav (md_disk_pos % meta->array_width) * meta->array_width; 213219974Smav } else 214219974Smav disk_pos = md_disk_pos; 215219974Smav return (disk_pos); 216219974Smav} 217219974Smav 218219974Smavstatic void 219219974Smavnvidia_meta_get_name(struct nvidia_raid_conf *meta, char *buf) 220219974Smav{ 221219974Smav int i; 222219974Smav 223219974Smav strncpy(buf, meta->name, 16); 224219974Smav buf[16] = 0; 225219974Smav for (i = 15; i >= 0; i--) { 226219974Smav if (buf[i] > 0x20) 227219974Smav break; 228219974Smav buf[i] = 0; 229219974Smav } 230219974Smav} 231219974Smav 232219974Smavstatic void 233219974Smavnvidia_meta_put_name(struct nvidia_raid_conf *meta, char *buf) 234219974Smav{ 235219974Smav 236219974Smav memset(meta->name, 0x20, 16); 237219974Smav memcpy(meta->name, buf, MIN(strlen(buf), 16)); 238219974Smav} 239219974Smav 240219974Smavstatic struct nvidia_raid_conf * 241219974Smavnvidia_meta_read(struct g_consumer *cp) 242219974Smav{ 243219974Smav struct g_provider *pp; 244219974Smav struct nvidia_raid_conf *meta; 245219974Smav char *buf; 246219974Smav int error, i; 247219974Smav uint32_t checksum, *ptr; 248219974Smav 249219974Smav pp = cp->provider; 250219974Smav 251219974Smav /* Read the anchor sector. */ 252219974Smav buf = g_read_data(cp, 253219974Smav pp->mediasize - 2 * pp->sectorsize, pp->sectorsize, &error); 254219974Smav if (buf == NULL) { 255219974Smav G_RAID_DEBUG(1, "Cannot read metadata from %s (error=%d).", 256219974Smav pp->name, error); 257219974Smav return (NULL); 258219974Smav } 259219974Smav meta = malloc(sizeof(*meta), M_MD_NVIDIA, M_WAITOK); 260219974Smav memcpy(meta, buf, min(sizeof(*meta), pp->sectorsize)); 261219974Smav g_free(buf); 262219974Smav 263219974Smav /* Check if this is an NVIDIA RAID struct */ 264219974Smav if (strncmp(meta->nvidia_id, NVIDIA_MAGIC, strlen(NVIDIA_MAGIC))) { 265219974Smav G_RAID_DEBUG(1, "NVIDIA signature check failed on %s", pp->name); 266219974Smav free(meta, M_MD_NVIDIA); 267219974Smav return (NULL); 268219974Smav } 269219974Smav if (meta->config_size > 128 || 270219974Smav meta->config_size < 30) { 271219974Smav G_RAID_DEBUG(1, "NVIDIA metadata size looks wrong: %d", 272219974Smav meta->config_size); 273219974Smav free(meta, M_MD_NVIDIA); 274219974Smav return (NULL); 275219974Smav } 276219974Smav 277219974Smav /* Check metadata checksum. */ 278219974Smav for (checksum = 0, ptr = (uint32_t *)meta, 279219974Smav i = 0; i < meta->config_size; i++) 280219974Smav checksum += *ptr++; 281219974Smav if (checksum != 0) { 282219974Smav G_RAID_DEBUG(1, "NVIDIA checksum check failed on %s", pp->name); 283219974Smav free(meta, M_MD_NVIDIA); 284219974Smav return (NULL); 285219974Smav } 286219974Smav 287219974Smav /* Check volume state. */ 288219974Smav if (meta->state != NVIDIA_S_IDLE && meta->state != NVIDIA_S_INIT && 289219974Smav meta->state != NVIDIA_S_REBUILD && meta->state != NVIDIA_S_SYNC) { 290219974Smav G_RAID_DEBUG(1, "NVIDIA unknown state on %s (0x%02x)", 291219974Smav pp->name, meta->state); 292219974Smav free(meta, M_MD_NVIDIA); 293219974Smav return (NULL); 294219974Smav } 295219974Smav 296219974Smav /* Check raid type. */ 297219974Smav if (meta->type != NVIDIA_T_RAID0 && meta->type != NVIDIA_T_RAID1 && 298219974Smav meta->type != NVIDIA_T_RAID3 && meta->type != NVIDIA_T_RAID5 && 299219974Smav meta->type != NVIDIA_T_RAID5_SYM && 300219974Smav meta->type != NVIDIA_T_RAID01 && meta->type != NVIDIA_T_CONCAT) { 301219974Smav G_RAID_DEBUG(1, "NVIDIA unknown RAID level on %s (0x%02x)", 302219974Smav pp->name, meta->type); 303219974Smav free(meta, M_MD_NVIDIA); 304219974Smav return (NULL); 305219974Smav } 306219974Smav 307219974Smav return (meta); 308219974Smav} 309219974Smav 310219974Smavstatic int 311219974Smavnvidia_meta_write(struct g_consumer *cp, struct nvidia_raid_conf *meta) 312219974Smav{ 313219974Smav struct g_provider *pp; 314219974Smav char *buf; 315219974Smav int error, i; 316219974Smav uint32_t checksum, *ptr; 317219974Smav 318219974Smav pp = cp->provider; 319219974Smav 320219974Smav /* Recalculate checksum for case if metadata were changed. */ 321219974Smav meta->checksum = 0; 322219974Smav for (checksum = 0, ptr = (uint32_t *)meta, 323219974Smav i = 0; i < meta->config_size; i++) 324219974Smav checksum += *ptr++; 325219974Smav meta->checksum -= checksum; 326219974Smav 327219974Smav /* Create and fill buffer. */ 328219974Smav buf = malloc(pp->sectorsize, M_MD_NVIDIA, M_WAITOK | M_ZERO); 329219974Smav memcpy(buf, meta, sizeof(*meta)); 330219974Smav 331219974Smav /* Write metadata. */ 332219974Smav error = g_write_data(cp, 333219974Smav pp->mediasize - 2 * pp->sectorsize, buf, pp->sectorsize); 334219974Smav if (error != 0) { 335219974Smav G_RAID_DEBUG(1, "Cannot write metadata to %s (error=%d).", 336219974Smav pp->name, error); 337219974Smav } 338219974Smav 339219974Smav free(buf, M_MD_NVIDIA); 340219974Smav return (error); 341219974Smav} 342219974Smav 343219974Smavstatic int 344219974Smavnvidia_meta_erase(struct g_consumer *cp) 345219974Smav{ 346219974Smav struct g_provider *pp; 347219974Smav char *buf; 348219974Smav int error; 349219974Smav 350219974Smav pp = cp->provider; 351219974Smav buf = malloc(pp->sectorsize, M_MD_NVIDIA, M_WAITOK | M_ZERO); 352219974Smav error = g_write_data(cp, 353219974Smav pp->mediasize - 2 * pp->sectorsize, buf, pp->sectorsize); 354219974Smav if (error != 0) { 355219974Smav G_RAID_DEBUG(1, "Cannot erase metadata on %s (error=%d).", 356219974Smav pp->name, error); 357219974Smav } 358219974Smav free(buf, M_MD_NVIDIA); 359219974Smav return (error); 360219974Smav} 361219974Smav 362219974Smavstatic struct g_raid_disk * 363219974Smavg_raid_md_nvidia_get_disk(struct g_raid_softc *sc, int id) 364219974Smav{ 365219974Smav struct g_raid_disk *disk; 366219974Smav struct g_raid_md_nvidia_perdisk *pd; 367219974Smav 368219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 369219974Smav pd = (struct g_raid_md_nvidia_perdisk *)disk->d_md_data; 370219974Smav if (pd->pd_disk_pos == id) 371219974Smav break; 372219974Smav } 373219974Smav return (disk); 374219974Smav} 375219974Smav 376219974Smavstatic int 377219974Smavg_raid_md_nvidia_supported(int level, int qual, int disks, int force) 378219974Smav{ 379219974Smav 380219974Smav switch (level) { 381219974Smav case G_RAID_VOLUME_RL_RAID0: 382219974Smav if (disks < 1) 383219974Smav return (0); 384219974Smav if (!force && (disks < 2 || disks > 6)) 385219974Smav return (0); 386219974Smav break; 387219974Smav case G_RAID_VOLUME_RL_RAID1: 388219974Smav if (disks < 1) 389219974Smav return (0); 390219974Smav if (!force && (disks != 2)) 391219974Smav return (0); 392219974Smav break; 393219974Smav case G_RAID_VOLUME_RL_RAID1E: 394219974Smav if (disks < 2) 395219974Smav return (0); 396219974Smav if (disks % 2 != 0) 397219974Smav return (0); 398219974Smav if (!force && (disks < 4)) 399219974Smav return (0); 400219974Smav break; 401219974Smav case G_RAID_VOLUME_RL_SINGLE: 402219974Smav if (disks != 1) 403219974Smav return (0); 404219974Smav break; 405219974Smav case G_RAID_VOLUME_RL_CONCAT: 406219974Smav if (disks < 2) 407219974Smav return (0); 408219974Smav break; 409219974Smav case G_RAID_VOLUME_RL_RAID5: 410219974Smav if (disks < 3) 411219974Smav return (0); 412235874Smav if (qual != G_RAID_VOLUME_RLQ_R5LA && 413235874Smav qual != G_RAID_VOLUME_RLQ_R5LS) 414235874Smav return (0); 415219974Smav break; 416219974Smav default: 417219974Smav return (0); 418219974Smav } 419235874Smav if (level != G_RAID_VOLUME_RL_RAID5 && qual != G_RAID_VOLUME_RLQ_NONE) 420219974Smav return (0); 421219974Smav return (1); 422219974Smav} 423219974Smav 424219974Smavstatic int 425219974Smavg_raid_md_nvidia_start_disk(struct g_raid_disk *disk) 426219974Smav{ 427219974Smav struct g_raid_softc *sc; 428219974Smav struct g_raid_subdisk *sd, *tmpsd; 429219974Smav struct g_raid_disk *olddisk, *tmpdisk; 430219974Smav struct g_raid_md_object *md; 431219974Smav struct g_raid_md_nvidia_object *mdi; 432219974Smav struct g_raid_md_nvidia_perdisk *pd, *oldpd; 433219974Smav struct nvidia_raid_conf *meta; 434219974Smav int disk_pos, resurrection = 0; 435219974Smav 436219974Smav sc = disk->d_softc; 437219974Smav md = sc->sc_md; 438219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 439219974Smav meta = mdi->mdio_meta; 440219974Smav pd = (struct g_raid_md_nvidia_perdisk *)disk->d_md_data; 441219974Smav olddisk = NULL; 442219974Smav 443219974Smav /* Find disk position in metadata by it's serial. */ 444219974Smav if (pd->pd_meta != NULL) { 445219974Smav disk_pos = pd->pd_meta->disk_number; 446219974Smav if (disk_pos >= meta->total_disks || mdi->mdio_started) 447219974Smav disk_pos = -3; 448219974Smav } else 449219974Smav disk_pos = -3; 450219974Smav /* For RAID0+1 we need to translate order. */ 451219974Smav disk_pos = nvidia_meta_translate_disk(meta, disk_pos); 452219974Smav if (disk_pos < 0) { 453219974Smav G_RAID_DEBUG1(1, sc, "Unknown, probably new or stale disk"); 454219974Smav /* If we are in the start process, that's all for now. */ 455219974Smav if (!mdi->mdio_started) 456219974Smav goto nofit; 457219974Smav /* 458219974Smav * If we have already started - try to get use of the disk. 459219974Smav * Try to replace OFFLINE disks first, then FAILED. 460219974Smav */ 461219974Smav TAILQ_FOREACH(tmpdisk, &sc->sc_disks, d_next) { 462219974Smav if (tmpdisk->d_state != G_RAID_DISK_S_OFFLINE && 463219974Smav tmpdisk->d_state != G_RAID_DISK_S_FAILED) 464219974Smav continue; 465219974Smav /* Make sure this disk is big enough. */ 466219974Smav TAILQ_FOREACH(sd, &tmpdisk->d_subdisks, sd_next) { 467219974Smav if (sd->sd_offset + sd->sd_size + 2 * 512 > 468219974Smav pd->pd_disk_size) { 469219974Smav G_RAID_DEBUG1(1, sc, 470219974Smav "Disk too small (%ju < %ju)", 471219974Smav pd->pd_disk_size, 472219974Smav sd->sd_offset + sd->sd_size + 512); 473219974Smav break; 474219974Smav } 475219974Smav } 476219974Smav if (sd != NULL) 477219974Smav continue; 478219974Smav if (tmpdisk->d_state == G_RAID_DISK_S_OFFLINE) { 479219974Smav olddisk = tmpdisk; 480219974Smav break; 481219974Smav } else if (olddisk == NULL) 482219974Smav olddisk = tmpdisk; 483219974Smav } 484219974Smav if (olddisk == NULL) { 485219974Smavnofit: 486219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_SPARE); 487219974Smav return (1); 488219974Smav } 489219974Smav oldpd = (struct g_raid_md_nvidia_perdisk *)olddisk->d_md_data; 490219974Smav disk_pos = oldpd->pd_disk_pos; 491219974Smav resurrection = 1; 492219974Smav } 493219974Smav 494219974Smav if (olddisk == NULL) { 495219974Smav /* Find placeholder by position. */ 496219974Smav olddisk = g_raid_md_nvidia_get_disk(sc, disk_pos); 497219974Smav if (olddisk == NULL) 498219974Smav panic("No disk at position %d!", disk_pos); 499219974Smav if (olddisk->d_state != G_RAID_DISK_S_OFFLINE) { 500219974Smav G_RAID_DEBUG1(1, sc, "More then one disk for pos %d", 501219974Smav disk_pos); 502219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_STALE); 503219974Smav return (0); 504219974Smav } 505219974Smav oldpd = (struct g_raid_md_nvidia_perdisk *)olddisk->d_md_data; 506219974Smav } 507219974Smav 508219974Smav /* Replace failed disk or placeholder with new disk. */ 509219974Smav TAILQ_FOREACH_SAFE(sd, &olddisk->d_subdisks, sd_next, tmpsd) { 510219974Smav TAILQ_REMOVE(&olddisk->d_subdisks, sd, sd_next); 511219974Smav TAILQ_INSERT_TAIL(&disk->d_subdisks, sd, sd_next); 512219974Smav sd->sd_disk = disk; 513219974Smav } 514219974Smav oldpd->pd_disk_pos = -2; 515219974Smav pd->pd_disk_pos = disk_pos; 516219974Smav 517219974Smav /* If it was placeholder -- destroy it. */ 518219974Smav if (olddisk->d_state == G_RAID_DISK_S_OFFLINE) { 519219974Smav g_raid_destroy_disk(olddisk); 520219974Smav } else { 521219974Smav /* Otherwise, make it STALE_FAILED. */ 522219974Smav g_raid_change_disk_state(olddisk, G_RAID_DISK_S_STALE_FAILED); 523219974Smav } 524219974Smav 525219974Smav /* Welcome the new disk. */ 526219974Smav if (resurrection) 527219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_ACTIVE); 528219974Smav else// if (pd->pd_meta->disk_status == NVIDIA_S_CURRENT || 529219974Smav //pd->pd_meta->disk_status == NVIDIA_S_REBUILD) 530219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_ACTIVE); 531219974Smav// else 532219974Smav// g_raid_change_disk_state(disk, G_RAID_DISK_S_FAILED); 533219974Smav TAILQ_FOREACH(sd, &disk->d_subdisks, sd_next) { 534219974Smav 535219974Smav /* 536219974Smav * Different disks may have different sizes, 537219974Smav * in concat mode. Update from real disk size. 538219974Smav */ 539219974Smav if (meta->type == NVIDIA_T_CONCAT) 540219974Smav sd->sd_size = pd->pd_disk_size - 0x800 * 512; 541219974Smav 542219974Smav if (resurrection) { 543219974Smav /* New or ex-spare disk. */ 544219974Smav g_raid_change_subdisk_state(sd, 545219974Smav G_RAID_SUBDISK_S_NEW); 546219974Smav } else if (meta->state == NVIDIA_S_REBUILD && 547219974Smav (pd->pd_meta->disk_status & 0x100)) { 548219974Smav /* Rebuilding disk. */ 549219974Smav g_raid_change_subdisk_state(sd, 550219974Smav G_RAID_SUBDISK_S_REBUILD); 551219974Smav sd->sd_rebuild_pos = (off_t)pd->pd_meta->rebuild_lba / 552219974Smav meta->array_width * pd->pd_meta->sector_size; 553219974Smav } else if (meta->state == NVIDIA_S_SYNC) { 554219974Smav /* Resyncing/dirty disk. */ 555219974Smav g_raid_change_subdisk_state(sd, 556219974Smav G_RAID_SUBDISK_S_RESYNC); 557219974Smav sd->sd_rebuild_pos = (off_t)pd->pd_meta->rebuild_lba / 558219974Smav meta->array_width * pd->pd_meta->sector_size; 559219974Smav } else { 560219974Smav /* Up to date disk. */ 561219974Smav g_raid_change_subdisk_state(sd, 562219974Smav G_RAID_SUBDISK_S_ACTIVE); 563219974Smav } 564219974Smav g_raid_event_send(sd, G_RAID_SUBDISK_E_NEW, 565219974Smav G_RAID_EVENT_SUBDISK); 566219974Smav } 567219974Smav 568219974Smav /* Update status of our need for spare. */ 569219974Smav if (mdi->mdio_started) { 570219974Smav mdi->mdio_incomplete = 571219974Smav (g_raid_ndisks(sc, G_RAID_DISK_S_ACTIVE) < 572219974Smav mdi->mdio_total_disks); 573219974Smav } 574219974Smav 575219974Smav return (resurrection); 576219974Smav} 577219974Smav 578219974Smavstatic void 579219974Smavg_disk_md_nvidia_retaste(void *arg, int pending) 580219974Smav{ 581219974Smav 582219974Smav G_RAID_DEBUG(1, "Array is not complete, trying to retaste."); 583219974Smav g_retaste(&g_raid_class); 584219974Smav free(arg, M_MD_NVIDIA); 585219974Smav} 586219974Smav 587219974Smavstatic void 588219974Smavg_raid_md_nvidia_refill(struct g_raid_softc *sc) 589219974Smav{ 590219974Smav struct g_raid_md_object *md; 591219974Smav struct g_raid_md_nvidia_object *mdi; 592219974Smav struct g_raid_disk *disk; 593219974Smav struct task *task; 594219974Smav int update, na; 595219974Smav 596219974Smav md = sc->sc_md; 597219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 598219974Smav update = 0; 599219974Smav do { 600219974Smav /* Make sure we miss anything. */ 601219974Smav na = g_raid_ndisks(sc, G_RAID_DISK_S_ACTIVE); 602219974Smav if (na == mdi->mdio_total_disks) 603219974Smav break; 604219974Smav 605219974Smav G_RAID_DEBUG1(1, md->mdo_softc, 606219974Smav "Array is not complete (%d of %d), " 607219974Smav "trying to refill.", na, mdi->mdio_total_disks); 608219974Smav 609219974Smav /* Try to get use some of STALE disks. */ 610219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 611219974Smav if (disk->d_state == G_RAID_DISK_S_STALE) { 612219974Smav update += g_raid_md_nvidia_start_disk(disk); 613219974Smav if (disk->d_state == G_RAID_DISK_S_ACTIVE) 614219974Smav break; 615219974Smav } 616219974Smav } 617219974Smav if (disk != NULL) 618219974Smav continue; 619219974Smav 620219974Smav /* Try to get use some of SPARE disks. */ 621219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 622219974Smav if (disk->d_state == G_RAID_DISK_S_SPARE) { 623219974Smav update += g_raid_md_nvidia_start_disk(disk); 624219974Smav if (disk->d_state == G_RAID_DISK_S_ACTIVE) 625219974Smav break; 626219974Smav } 627219974Smav } 628219974Smav } while (disk != NULL); 629219974Smav 630219974Smav /* Write new metadata if we changed something. */ 631220210Smav if (update) 632219974Smav g_raid_md_write_nvidia(md, NULL, NULL, NULL); 633219974Smav 634219974Smav /* Update status of our need for spare. */ 635219974Smav mdi->mdio_incomplete = (g_raid_ndisks(sc, G_RAID_DISK_S_ACTIVE) < 636219974Smav mdi->mdio_total_disks); 637219974Smav 638219974Smav /* Request retaste hoping to find spare. */ 639219974Smav if (mdi->mdio_incomplete) { 640219974Smav task = malloc(sizeof(struct task), 641219974Smav M_MD_NVIDIA, M_WAITOK | M_ZERO); 642219974Smav TASK_INIT(task, 0, g_disk_md_nvidia_retaste, task); 643219974Smav taskqueue_enqueue(taskqueue_swi, task); 644219974Smav } 645219974Smav} 646219974Smav 647219974Smavstatic void 648219974Smavg_raid_md_nvidia_start(struct g_raid_softc *sc) 649219974Smav{ 650219974Smav struct g_raid_md_object *md; 651219974Smav struct g_raid_md_nvidia_object *mdi; 652219974Smav struct g_raid_md_nvidia_perdisk *pd; 653219974Smav struct nvidia_raid_conf *meta; 654219974Smav struct g_raid_volume *vol; 655219974Smav struct g_raid_subdisk *sd; 656219974Smav struct g_raid_disk *disk; 657219974Smav off_t size; 658219974Smav int j, disk_pos; 659219974Smav char buf[17]; 660219974Smav 661219974Smav md = sc->sc_md; 662219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 663219974Smav meta = mdi->mdio_meta; 664219974Smav 665219974Smav /* Create volumes and subdisks. */ 666219974Smav nvidia_meta_get_name(meta, buf); 667219974Smav vol = g_raid_create_volume(sc, buf, -1); 668219974Smav vol->v_mediasize = (off_t)meta->total_sectors * 512; 669219974Smav vol->v_raid_level_qualifier = G_RAID_VOLUME_RLQ_NONE; 670219974Smav if (meta->type == NVIDIA_T_RAID0) { 671219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID0; 672219974Smav size = vol->v_mediasize / mdi->mdio_total_disks; 673219974Smav } else if (meta->type == NVIDIA_T_RAID1) { 674219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID1; 675219974Smav size = vol->v_mediasize; 676219974Smav } else if (meta->type == NVIDIA_T_RAID01) { 677219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID1E; 678219974Smav size = vol->v_mediasize / (mdi->mdio_total_disks / 2); 679219974Smav } else if (meta->type == NVIDIA_T_CONCAT) { 680219974Smav if (mdi->mdio_total_disks == 1) 681219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_SINGLE; 682219974Smav else 683219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_CONCAT; 684219974Smav size = 0; 685219974Smav } else if (meta->type == NVIDIA_T_RAID5) { 686219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID5; 687235874Smav vol->v_raid_level_qualifier = G_RAID_VOLUME_RLQ_R5LA; 688219974Smav size = vol->v_mediasize / (mdi->mdio_total_disks - 1); 689219974Smav } else if (meta->type == NVIDIA_T_RAID5_SYM) { 690219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_RAID5; 691235874Smav vol->v_raid_level_qualifier = G_RAID_VOLUME_RLQ_R5LS; 692219974Smav size = vol->v_mediasize / (mdi->mdio_total_disks - 1); 693219974Smav } else { 694219974Smav vol->v_raid_level = G_RAID_VOLUME_RL_UNKNOWN; 695219974Smav size = 0; 696219974Smav } 697219974Smav vol->v_strip_size = meta->strip_sectors * 512; //ZZZ 698219974Smav vol->v_disks_count = mdi->mdio_total_disks; 699219974Smav vol->v_sectorsize = 512; //ZZZ 700219974Smav for (j = 0; j < vol->v_disks_count; j++) { 701219974Smav sd = &vol->v_subdisks[j]; 702219974Smav sd->sd_offset = 0; 703219974Smav sd->sd_size = size; 704219974Smav } 705219974Smav g_raid_start_volume(vol); 706219974Smav 707219974Smav /* Create disk placeholders to store data for later writing. */ 708219974Smav for (disk_pos = 0; disk_pos < mdi->mdio_total_disks; disk_pos++) { 709219974Smav pd = malloc(sizeof(*pd), M_MD_NVIDIA, M_WAITOK | M_ZERO); 710219974Smav pd->pd_disk_pos = disk_pos; 711219974Smav disk = g_raid_create_disk(sc); 712219974Smav disk->d_md_data = (void *)pd; 713219974Smav disk->d_state = G_RAID_DISK_S_OFFLINE; 714219974Smav sd = &vol->v_subdisks[disk_pos]; 715219974Smav sd->sd_disk = disk; 716219974Smav TAILQ_INSERT_TAIL(&disk->d_subdisks, sd, sd_next); 717219974Smav } 718219974Smav 719219974Smav /* Make all disks found till the moment take their places. */ 720219974Smav do { 721219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 722219974Smav if (disk->d_state == G_RAID_DISK_S_NONE) { 723219974Smav g_raid_md_nvidia_start_disk(disk); 724219974Smav break; 725219974Smav } 726219974Smav } 727219974Smav } while (disk != NULL); 728219974Smav 729219974Smav mdi->mdio_started = 1; 730219974Smav G_RAID_DEBUG1(0, sc, "Array started."); 731219974Smav g_raid_md_write_nvidia(md, NULL, NULL, NULL); 732219974Smav 733219974Smav /* Pickup any STALE/SPARE disks to refill array if needed. */ 734219974Smav g_raid_md_nvidia_refill(sc); 735219974Smav 736219974Smav g_raid_event_send(vol, G_RAID_VOLUME_E_START, G_RAID_EVENT_VOLUME); 737219974Smav 738219974Smav callout_stop(&mdi->mdio_start_co); 739219974Smav G_RAID_DEBUG1(1, sc, "root_mount_rel %p", mdi->mdio_rootmount); 740219974Smav root_mount_rel(mdi->mdio_rootmount); 741219974Smav mdi->mdio_rootmount = NULL; 742219974Smav} 743219974Smav 744219974Smavstatic void 745219974Smavg_raid_md_nvidia_new_disk(struct g_raid_disk *disk) 746219974Smav{ 747219974Smav struct g_raid_softc *sc; 748219974Smav struct g_raid_md_object *md; 749219974Smav struct g_raid_md_nvidia_object *mdi; 750219974Smav struct nvidia_raid_conf *pdmeta; 751219974Smav struct g_raid_md_nvidia_perdisk *pd; 752219974Smav 753219974Smav sc = disk->d_softc; 754219974Smav md = sc->sc_md; 755219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 756219974Smav pd = (struct g_raid_md_nvidia_perdisk *)disk->d_md_data; 757219974Smav pdmeta = pd->pd_meta; 758219974Smav 759219974Smav if (mdi->mdio_started) { 760219974Smav if (g_raid_md_nvidia_start_disk(disk)) 761219974Smav g_raid_md_write_nvidia(md, NULL, NULL, NULL); 762219974Smav } else { 763219974Smav if (mdi->mdio_meta == NULL || 764219974Smav mdi->mdio_meta->disk_number >= mdi->mdio_meta->total_disks) { 765219974Smav G_RAID_DEBUG1(1, sc, "Newer disk"); 766219974Smav if (mdi->mdio_meta != NULL) 767219974Smav free(mdi->mdio_meta, M_MD_NVIDIA); 768219974Smav mdi->mdio_meta = nvidia_meta_copy(pdmeta); 769219974Smav mdi->mdio_total_disks = pdmeta->total_disks; 770219974Smav mdi->mdio_disks_present = 1; 771219974Smav } else if (pdmeta->disk_number < mdi->mdio_meta->total_disks) { 772219974Smav mdi->mdio_disks_present++; 773219974Smav G_RAID_DEBUG1(1, sc, "Matching disk (%d of %d up)", 774219974Smav mdi->mdio_disks_present, 775219974Smav mdi->mdio_total_disks); 776219974Smav } else 777219974Smav G_RAID_DEBUG1(1, sc, "Spare disk"); 778219974Smav 779219974Smav /* If we collected all needed disks - start array. */ 780219974Smav if (mdi->mdio_disks_present == mdi->mdio_total_disks) 781219974Smav g_raid_md_nvidia_start(sc); 782219974Smav } 783219974Smav} 784219974Smav 785219974Smavstatic void 786219974Smavg_raid_nvidia_go(void *arg) 787219974Smav{ 788219974Smav struct g_raid_softc *sc; 789219974Smav struct g_raid_md_object *md; 790219974Smav struct g_raid_md_nvidia_object *mdi; 791219974Smav 792219974Smav sc = arg; 793219974Smav md = sc->sc_md; 794219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 795219974Smav if (!mdi->mdio_started) { 796219974Smav G_RAID_DEBUG1(0, sc, "Force array start due to timeout."); 797219974Smav g_raid_event_send(sc, G_RAID_NODE_E_START, 0); 798219974Smav } 799219974Smav} 800219974Smav 801219974Smavstatic int 802219974Smavg_raid_md_create_nvidia(struct g_raid_md_object *md, struct g_class *mp, 803219974Smav struct g_geom **gp) 804219974Smav{ 805219974Smav struct g_raid_softc *sc; 806219974Smav struct g_raid_md_nvidia_object *mdi; 807219974Smav char name[32]; 808219974Smav 809219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 810219974Smav arc4rand(&mdi->mdio_volume_id, 16, 0); 811219974Smav snprintf(name, sizeof(name), "NVIDIA-%d", 812219974Smav atomic_fetchadd_int(&NVIDIANodeID, 1)); 813219974Smav sc = g_raid_create_node(mp, name, md); 814219974Smav if (sc == NULL) 815219974Smav return (G_RAID_MD_TASTE_FAIL); 816219974Smav md->mdo_softc = sc; 817219974Smav *gp = sc->sc_geom; 818219974Smav return (G_RAID_MD_TASTE_NEW); 819219974Smav} 820219974Smav 821219974Smavstatic int 822219974Smavg_raid_md_taste_nvidia(struct g_raid_md_object *md, struct g_class *mp, 823219974Smav struct g_consumer *cp, struct g_geom **gp) 824219974Smav{ 825219974Smav struct g_consumer *rcp; 826219974Smav struct g_provider *pp; 827219974Smav struct g_raid_md_nvidia_object *mdi, *mdi1; 828219974Smav struct g_raid_softc *sc; 829219974Smav struct g_raid_disk *disk; 830219974Smav struct nvidia_raid_conf *meta; 831219974Smav struct g_raid_md_nvidia_perdisk *pd; 832219974Smav struct g_geom *geom; 833243678Smav int result, spare, len; 834219974Smav char name[32]; 835219974Smav uint16_t vendor; 836219974Smav 837219974Smav G_RAID_DEBUG(1, "Tasting NVIDIA on %s", cp->provider->name); 838219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 839219974Smav pp = cp->provider; 840219974Smav 841219974Smav /* Read metadata from device. */ 842219974Smav meta = NULL; 843219974Smav vendor = 0xffff; 844219974Smav g_topology_unlock(); 845219974Smav len = 2; 846219974Smav if (pp->geom->rank == 1) 847219974Smav g_io_getattr("GEOM::hba_vendor", cp, &len, &vendor); 848219974Smav meta = nvidia_meta_read(cp); 849219974Smav g_topology_lock(); 850219974Smav if (meta == NULL) { 851219974Smav if (g_raid_aggressive_spare) { 852219974Smav if (vendor == 0x10de) { 853219974Smav G_RAID_DEBUG(1, 854219974Smav "No NVIDIA metadata, forcing spare."); 855219974Smav spare = 2; 856219974Smav goto search; 857219974Smav } else { 858219974Smav G_RAID_DEBUG(1, 859219974Smav "NVIDIA vendor mismatch 0x%04x != 0x10de", 860219974Smav vendor); 861219974Smav } 862219974Smav } 863219974Smav return (G_RAID_MD_TASTE_FAIL); 864219974Smav } 865219974Smav 866219974Smav /* Metadata valid. Print it. */ 867219974Smav g_raid_md_nvidia_print(meta); 868220210Smav G_RAID_DEBUG(1, "NVIDIA disk position %d", meta->disk_number); 869219974Smav spare = 0;//(meta->type == NVIDIA_T_SPARE) ? 1 : 0; 870219974Smav 871219974Smavsearch: 872219974Smav /* Search for matching node. */ 873219974Smav sc = NULL; 874219974Smav mdi1 = NULL; 875219974Smav LIST_FOREACH(geom, &mp->geom, geom) { 876219974Smav sc = geom->softc; 877219974Smav if (sc == NULL) 878219974Smav continue; 879219974Smav if (sc->sc_stopping != 0) 880219974Smav continue; 881219974Smav if (sc->sc_md->mdo_class != md->mdo_class) 882219974Smav continue; 883219974Smav mdi1 = (struct g_raid_md_nvidia_object *)sc->sc_md; 884219974Smav if (spare) { 885219974Smav if (mdi1->mdio_incomplete) 886219974Smav break; 887219974Smav } else { 888219974Smav if (memcmp(&mdi1->mdio_volume_id, 889219974Smav &meta->volume_id, 16) == 0) 890219974Smav break; 891219974Smav } 892219974Smav } 893219974Smav 894219974Smav /* Found matching node. */ 895219974Smav if (geom != NULL) { 896219974Smav G_RAID_DEBUG(1, "Found matching array %s", sc->sc_name); 897219974Smav result = G_RAID_MD_TASTE_EXISTING; 898219974Smav 899219974Smav } else if (spare) { /* Not found needy node -- left for later. */ 900219974Smav G_RAID_DEBUG(1, "Spare is not needed at this time"); 901219974Smav goto fail1; 902219974Smav 903219974Smav } else { /* Not found matching node -- create one. */ 904219974Smav result = G_RAID_MD_TASTE_NEW; 905219974Smav memcpy(&mdi->mdio_volume_id, &meta->volume_id, 16); 906219974Smav snprintf(name, sizeof(name), "NVIDIA-%d", 907219974Smav atomic_fetchadd_int(&NVIDIANodeID, 1)); 908219974Smav sc = g_raid_create_node(mp, name, md); 909219974Smav md->mdo_softc = sc; 910219974Smav geom = sc->sc_geom; 911219974Smav callout_init(&mdi->mdio_start_co, 1); 912219974Smav callout_reset(&mdi->mdio_start_co, g_raid_start_timeout * hz, 913219974Smav g_raid_nvidia_go, sc); 914219974Smav mdi->mdio_rootmount = root_mount_hold("GRAID-NVIDIA"); 915219974Smav G_RAID_DEBUG1(1, sc, "root_mount_hold %p", mdi->mdio_rootmount); 916219974Smav } 917219974Smav 918265675Smav /* There is no return after this point, so we close passed consumer. */ 919265675Smav g_access(cp, -1, 0, 0); 920265675Smav 921219974Smav rcp = g_new_consumer(geom); 922219974Smav g_attach(rcp, pp); 923219974Smav if (g_access(rcp, 1, 1, 1) != 0) 924219974Smav ; //goto fail1; 925219974Smav 926219974Smav g_topology_unlock(); 927219974Smav sx_xlock(&sc->sc_lock); 928219974Smav 929219974Smav pd = malloc(sizeof(*pd), M_MD_NVIDIA, M_WAITOK | M_ZERO); 930219974Smav pd->pd_meta = meta; 931219974Smav if (spare == 2) { 932219974Smav pd->pd_disk_pos = -3; 933219974Smav } else { 934219974Smav pd->pd_disk_pos = -1; 935219974Smav } 936219974Smav pd->pd_disk_size = pp->mediasize; 937219974Smav disk = g_raid_create_disk(sc); 938219974Smav disk->d_md_data = (void *)pd; 939219974Smav disk->d_consumer = rcp; 940219974Smav rcp->private = disk; 941219974Smav 942243678Smav g_raid_get_disk_info(disk); 943219974Smav 944219974Smav g_raid_md_nvidia_new_disk(disk); 945219974Smav 946219974Smav sx_xunlock(&sc->sc_lock); 947219974Smav g_topology_lock(); 948219974Smav *gp = geom; 949219974Smav return (result); 950219974Smavfail1: 951219974Smav free(meta, M_MD_NVIDIA); 952219974Smav return (G_RAID_MD_TASTE_FAIL); 953219974Smav} 954219974Smav 955219974Smavstatic int 956219974Smavg_raid_md_event_nvidia(struct g_raid_md_object *md, 957219974Smav struct g_raid_disk *disk, u_int event) 958219974Smav{ 959219974Smav struct g_raid_softc *sc; 960219974Smav struct g_raid_subdisk *sd; 961219974Smav struct g_raid_md_nvidia_object *mdi; 962219974Smav struct g_raid_md_nvidia_perdisk *pd; 963219974Smav 964219974Smav sc = md->mdo_softc; 965219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 966219974Smav if (disk == NULL) { 967219974Smav switch (event) { 968219974Smav case G_RAID_NODE_E_START: 969219974Smav if (!mdi->mdio_started) { 970219974Smav /* Bump volume ID to drop missing disks. */ 971219974Smav arc4rand(&mdi->mdio_volume_id, 16, 0); 972219974Smav g_raid_md_nvidia_start(sc); 973219974Smav } 974219974Smav return (0); 975219974Smav } 976219974Smav return (-1); 977219974Smav } 978219974Smav pd = (struct g_raid_md_nvidia_perdisk *)disk->d_md_data; 979219974Smav switch (event) { 980219974Smav case G_RAID_DISK_E_DISCONNECTED: 981219974Smav /* If disk was assigned, just update statuses. */ 982219974Smav if (pd->pd_disk_pos >= 0) { 983219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_OFFLINE); 984219974Smav if (disk->d_consumer) { 985219974Smav g_raid_kill_consumer(sc, disk->d_consumer); 986219974Smav disk->d_consumer = NULL; 987219974Smav } 988219974Smav TAILQ_FOREACH(sd, &disk->d_subdisks, sd_next) { 989219974Smav g_raid_change_subdisk_state(sd, 990219974Smav G_RAID_SUBDISK_S_NONE); 991219974Smav g_raid_event_send(sd, G_RAID_SUBDISK_E_DISCONNECTED, 992219974Smav G_RAID_EVENT_SUBDISK); 993219974Smav } 994219974Smav } else { 995219974Smav /* Otherwise -- delete. */ 996219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_NONE); 997219974Smav g_raid_destroy_disk(disk); 998219974Smav } 999219974Smav 1000219974Smav if (mdi->mdio_started) { 1001219974Smav /* Bump volume ID to prevent disk resurrection. */ 1002219974Smav if (pd->pd_disk_pos >= 0) 1003219974Smav arc4rand(&mdi->mdio_volume_id, 16, 0); 1004219974Smav 1005219974Smav /* Write updated metadata to all disks. */ 1006219974Smav g_raid_md_write_nvidia(md, NULL, NULL, NULL); 1007219974Smav } 1008219974Smav 1009219974Smav /* Check if anything left except placeholders. */ 1010219974Smav if (g_raid_ndisks(sc, -1) == 1011219974Smav g_raid_ndisks(sc, G_RAID_DISK_S_OFFLINE)) 1012219974Smav g_raid_destroy_node(sc, 0); 1013219974Smav else 1014219974Smav g_raid_md_nvidia_refill(sc); 1015219974Smav return (0); 1016219974Smav } 1017219974Smav return (-2); 1018219974Smav} 1019219974Smav 1020219974Smavstatic int 1021219974Smavg_raid_md_ctl_nvidia(struct g_raid_md_object *md, 1022219974Smav struct gctl_req *req) 1023219974Smav{ 1024219974Smav struct g_raid_softc *sc; 1025219974Smav struct g_raid_volume *vol; 1026219974Smav struct g_raid_subdisk *sd; 1027219974Smav struct g_raid_disk *disk; 1028219974Smav struct g_raid_md_nvidia_object *mdi; 1029219974Smav struct g_raid_md_nvidia_perdisk *pd; 1030219974Smav struct g_consumer *cp; 1031219974Smav struct g_provider *pp; 1032219974Smav char arg[16]; 1033219974Smav const char *verb, *volname, *levelname, *diskname; 1034219974Smav int *nargs, *force; 1035229301Smav off_t size, sectorsize, strip, volsize; 1036219974Smav intmax_t *sizearg, *striparg; 1037219974Smav int numdisks, i, len, level, qual, update; 1038219974Smav int error; 1039219974Smav 1040219974Smav sc = md->mdo_softc; 1041219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 1042219974Smav verb = gctl_get_param(req, "verb", NULL); 1043219974Smav nargs = gctl_get_paraml(req, "nargs", sizeof(*nargs)); 1044219974Smav error = 0; 1045219974Smav if (strcmp(verb, "label") == 0) { 1046219974Smav 1047219974Smav if (*nargs < 4) { 1048219974Smav gctl_error(req, "Invalid number of arguments."); 1049219974Smav return (-1); 1050219974Smav } 1051219974Smav volname = gctl_get_asciiparam(req, "arg1"); 1052219974Smav if (volname == NULL) { 1053219974Smav gctl_error(req, "No volume name."); 1054219974Smav return (-2); 1055219974Smav } 1056219974Smav levelname = gctl_get_asciiparam(req, "arg2"); 1057219974Smav if (levelname == NULL) { 1058219974Smav gctl_error(req, "No RAID level."); 1059219974Smav return (-3); 1060219974Smav } 1061235874Smav if (strcasecmp(levelname, "RAID5") == 0) 1062235874Smav levelname = "RAID5-LS"; 1063219974Smav if (g_raid_volume_str2level(levelname, &level, &qual)) { 1064219974Smav gctl_error(req, "Unknown RAID level '%s'.", levelname); 1065219974Smav return (-4); 1066219974Smav } 1067219974Smav numdisks = *nargs - 3; 1068219974Smav force = gctl_get_paraml(req, "force", sizeof(*force)); 1069219974Smav if (!g_raid_md_nvidia_supported(level, qual, numdisks, 1070219974Smav force ? *force : 0)) { 1071219974Smav gctl_error(req, "Unsupported RAID level " 1072219974Smav "(0x%02x/0x%02x), or number of disks (%d).", 1073219974Smav level, qual, numdisks); 1074219974Smav return (-5); 1075219974Smav } 1076219974Smav 1077219974Smav /* Search for disks, connect them and probe. */ 1078219974Smav size = 0x7fffffffffffffffllu; 1079219974Smav sectorsize = 0; 1080219974Smav for (i = 0; i < numdisks; i++) { 1081219974Smav snprintf(arg, sizeof(arg), "arg%d", i + 3); 1082219974Smav diskname = gctl_get_asciiparam(req, arg); 1083219974Smav if (diskname == NULL) { 1084219974Smav gctl_error(req, "No disk name (%s).", arg); 1085219974Smav error = -6; 1086219974Smav break; 1087219974Smav } 1088219974Smav if (strcmp(diskname, "NONE") == 0) { 1089219974Smav cp = NULL; 1090219974Smav pp = NULL; 1091219974Smav } else { 1092219974Smav g_topology_lock(); 1093219974Smav cp = g_raid_open_consumer(sc, diskname); 1094219974Smav if (cp == NULL) { 1095219974Smav gctl_error(req, "Can't open '%s'.", 1096219974Smav diskname); 1097219974Smav g_topology_unlock(); 1098219974Smav error = -7; 1099219974Smav break; 1100219974Smav } 1101219974Smav pp = cp->provider; 1102219974Smav } 1103219974Smav pd = malloc(sizeof(*pd), M_MD_NVIDIA, M_WAITOK | M_ZERO); 1104219974Smav pd->pd_disk_pos = i; 1105219974Smav disk = g_raid_create_disk(sc); 1106219974Smav disk->d_md_data = (void *)pd; 1107219974Smav disk->d_consumer = cp; 1108219974Smav if (cp == NULL) 1109219974Smav continue; 1110219974Smav cp->private = disk; 1111219974Smav g_topology_unlock(); 1112219974Smav 1113243678Smav g_raid_get_disk_info(disk); 1114219974Smav 1115219974Smav pd->pd_disk_size = pp->mediasize; 1116219974Smav if (size > pp->mediasize) 1117219974Smav size = pp->mediasize; 1118219974Smav if (sectorsize < pp->sectorsize) 1119219974Smav sectorsize = pp->sectorsize; 1120219974Smav } 1121219974Smav if (error != 0) 1122219974Smav return (error); 1123219974Smav 1124220210Smav if (sectorsize <= 0) { 1125220210Smav gctl_error(req, "Can't get sector size."); 1126220210Smav return (-8); 1127220210Smav } 1128220210Smav 1129219974Smav /* Reserve space for metadata. */ 1130219974Smav size -= 2 * sectorsize; 1131219974Smav 1132219974Smav /* Handle size argument. */ 1133219974Smav len = sizeof(*sizearg); 1134219974Smav sizearg = gctl_get_param(req, "size", &len); 1135219974Smav if (sizearg != NULL && len == sizeof(*sizearg) && 1136219974Smav *sizearg > 0) { 1137219974Smav if (*sizearg > size) { 1138219974Smav gctl_error(req, "Size too big %lld > %lld.", 1139219974Smav (long long)*sizearg, (long long)size); 1140219974Smav return (-9); 1141219974Smav } 1142219974Smav size = *sizearg; 1143219974Smav } 1144219974Smav 1145219974Smav /* Handle strip argument. */ 1146219974Smav strip = 131072; 1147219974Smav len = sizeof(*striparg); 1148219974Smav striparg = gctl_get_param(req, "strip", &len); 1149219974Smav if (striparg != NULL && len == sizeof(*striparg) && 1150219974Smav *striparg > 0) { 1151219974Smav if (*striparg < sectorsize) { 1152219974Smav gctl_error(req, "Strip size too small."); 1153219974Smav return (-10); 1154219974Smav } 1155219974Smav if (*striparg % sectorsize != 0) { 1156219974Smav gctl_error(req, "Incorrect strip size."); 1157219974Smav return (-11); 1158219974Smav } 1159219974Smav if (strip > 65535 * sectorsize) { 1160219974Smav gctl_error(req, "Strip size too big."); 1161219974Smav return (-12); 1162219974Smav } 1163219974Smav strip = *striparg; 1164219974Smav } 1165219974Smav 1166219974Smav /* Round size down to strip or sector. */ 1167219974Smav if (level == G_RAID_VOLUME_RL_RAID1) 1168219974Smav size -= (size % sectorsize); 1169219974Smav else if (level == G_RAID_VOLUME_RL_RAID1E && 1170219974Smav (numdisks & 1) != 0) 1171219974Smav size -= (size % (2 * strip)); 1172219974Smav else 1173219974Smav size -= (size % strip); 1174219974Smav if (size <= 0) { 1175219974Smav gctl_error(req, "Size too small."); 1176219974Smav return (-13); 1177219974Smav } 1178229301Smav 1179229301Smav if (level == G_RAID_VOLUME_RL_RAID0 || 1180229301Smav level == G_RAID_VOLUME_RL_CONCAT || 1181229301Smav level == G_RAID_VOLUME_RL_SINGLE) 1182229301Smav volsize = size * numdisks; 1183229301Smav else if (level == G_RAID_VOLUME_RL_RAID1) 1184229301Smav volsize = size; 1185229301Smav else if (level == G_RAID_VOLUME_RL_RAID5) 1186229301Smav volsize = size * (numdisks - 1); 1187229301Smav else { /* RAID1E */ 1188229301Smav volsize = ((size * numdisks) / strip / 2) * 1189229301Smav strip; 1190229301Smav } 1191229301Smav if (volsize > 0xffffffffllu * sectorsize) { 1192219974Smav gctl_error(req, "Size too big."); 1193219974Smav return (-14); 1194219974Smav } 1195219974Smav 1196219974Smav /* We have all we need, create things: volume, ... */ 1197219974Smav mdi->mdio_total_disks = numdisks; 1198219974Smav mdi->mdio_started = 1; 1199219974Smav vol = g_raid_create_volume(sc, volname, -1); 1200219974Smav vol->v_md_data = (void *)(intptr_t)0; 1201219974Smav vol->v_raid_level = level; 1202235874Smav vol->v_raid_level_qualifier = qual; 1203219974Smav vol->v_strip_size = strip; 1204219974Smav vol->v_disks_count = numdisks; 1205229301Smav vol->v_mediasize = volsize; 1206219974Smav vol->v_sectorsize = sectorsize; 1207219974Smav g_raid_start_volume(vol); 1208219974Smav 1209219974Smav /* , and subdisks. */ 1210219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1211219974Smav pd = (struct g_raid_md_nvidia_perdisk *)disk->d_md_data; 1212219974Smav sd = &vol->v_subdisks[pd->pd_disk_pos]; 1213219974Smav sd->sd_disk = disk; 1214219974Smav sd->sd_offset = 0; 1215219974Smav sd->sd_size = size; 1216219974Smav TAILQ_INSERT_TAIL(&disk->d_subdisks, sd, sd_next); 1217219974Smav if (sd->sd_disk->d_consumer != NULL) { 1218219974Smav g_raid_change_disk_state(disk, 1219219974Smav G_RAID_DISK_S_ACTIVE); 1220219974Smav g_raid_change_subdisk_state(sd, 1221219974Smav G_RAID_SUBDISK_S_ACTIVE); 1222219974Smav g_raid_event_send(sd, G_RAID_SUBDISK_E_NEW, 1223219974Smav G_RAID_EVENT_SUBDISK); 1224219974Smav } else { 1225219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_OFFLINE); 1226219974Smav } 1227219974Smav } 1228219974Smav 1229219974Smav /* Write metadata based on created entities. */ 1230219974Smav G_RAID_DEBUG1(0, sc, "Array started."); 1231219974Smav g_raid_md_write_nvidia(md, NULL, NULL, NULL); 1232219974Smav 1233219974Smav /* Pickup any STALE/SPARE disks to refill array if needed. */ 1234219974Smav g_raid_md_nvidia_refill(sc); 1235219974Smav 1236219974Smav g_raid_event_send(vol, G_RAID_VOLUME_E_START, 1237219974Smav G_RAID_EVENT_VOLUME); 1238219974Smav return (0); 1239219974Smav } 1240219974Smav if (strcmp(verb, "delete") == 0) { 1241219974Smav 1242219974Smav /* Check if some volume is still open. */ 1243219974Smav force = gctl_get_paraml(req, "force", sizeof(*force)); 1244219974Smav if (force != NULL && *force == 0 && 1245219974Smav g_raid_nopens(sc) != 0) { 1246219974Smav gctl_error(req, "Some volume is still open."); 1247219974Smav return (-4); 1248219974Smav } 1249219974Smav 1250219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1251219974Smav if (disk->d_consumer) 1252219974Smav nvidia_meta_erase(disk->d_consumer); 1253219974Smav } 1254219974Smav g_raid_destroy_node(sc, 0); 1255219974Smav return (0); 1256219974Smav } 1257219974Smav if (strcmp(verb, "remove") == 0 || 1258219974Smav strcmp(verb, "fail") == 0) { 1259219974Smav if (*nargs < 2) { 1260219974Smav gctl_error(req, "Invalid number of arguments."); 1261219974Smav return (-1); 1262219974Smav } 1263219974Smav for (i = 1; i < *nargs; i++) { 1264219974Smav snprintf(arg, sizeof(arg), "arg%d", i); 1265219974Smav diskname = gctl_get_asciiparam(req, arg); 1266219974Smav if (diskname == NULL) { 1267219974Smav gctl_error(req, "No disk name (%s).", arg); 1268219974Smav error = -2; 1269219974Smav break; 1270219974Smav } 1271219974Smav if (strncmp(diskname, "/dev/", 5) == 0) 1272219974Smav diskname += 5; 1273219974Smav 1274219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1275219974Smav if (disk->d_consumer != NULL && 1276219974Smav disk->d_consumer->provider != NULL && 1277219974Smav strcmp(disk->d_consumer->provider->name, 1278219974Smav diskname) == 0) 1279219974Smav break; 1280219974Smav } 1281219974Smav if (disk == NULL) { 1282219974Smav gctl_error(req, "Disk '%s' not found.", 1283219974Smav diskname); 1284219974Smav error = -3; 1285219974Smav break; 1286219974Smav } 1287219974Smav 1288219974Smav if (strcmp(verb, "fail") == 0) { 1289219974Smav g_raid_md_fail_disk_nvidia(md, NULL, disk); 1290219974Smav continue; 1291219974Smav } 1292219974Smav 1293219974Smav pd = (struct g_raid_md_nvidia_perdisk *)disk->d_md_data; 1294219974Smav 1295219974Smav /* Erase metadata on deleting disk. */ 1296219974Smav nvidia_meta_erase(disk->d_consumer); 1297219974Smav 1298219974Smav /* If disk was assigned, just update statuses. */ 1299219974Smav if (pd->pd_disk_pos >= 0) { 1300219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_OFFLINE); 1301220209Smav g_raid_kill_consumer(sc, disk->d_consumer); 1302220209Smav disk->d_consumer = NULL; 1303219974Smav TAILQ_FOREACH(sd, &disk->d_subdisks, sd_next) { 1304219974Smav g_raid_change_subdisk_state(sd, 1305219974Smav G_RAID_SUBDISK_S_NONE); 1306219974Smav g_raid_event_send(sd, G_RAID_SUBDISK_E_DISCONNECTED, 1307219974Smav G_RAID_EVENT_SUBDISK); 1308219974Smav } 1309219974Smav } else { 1310219974Smav /* Otherwise -- delete. */ 1311219974Smav g_raid_change_disk_state(disk, G_RAID_DISK_S_NONE); 1312219974Smav g_raid_destroy_disk(disk); 1313219974Smav } 1314219974Smav } 1315219974Smav 1316219974Smav /* Write updated metadata to remaining disks. */ 1317219974Smav g_raid_md_write_nvidia(md, NULL, NULL, NULL); 1318219974Smav 1319219974Smav /* Check if anything left except placeholders. */ 1320219974Smav if (g_raid_ndisks(sc, -1) == 1321219974Smav g_raid_ndisks(sc, G_RAID_DISK_S_OFFLINE)) 1322219974Smav g_raid_destroy_node(sc, 0); 1323219974Smav else 1324219974Smav g_raid_md_nvidia_refill(sc); 1325219974Smav return (error); 1326219974Smav } 1327219974Smav if (strcmp(verb, "insert") == 0) { 1328219974Smav if (*nargs < 2) { 1329219974Smav gctl_error(req, "Invalid number of arguments."); 1330219974Smav return (-1); 1331219974Smav } 1332219974Smav update = 0; 1333219974Smav for (i = 1; i < *nargs; i++) { 1334219974Smav /* Get disk name. */ 1335219974Smav snprintf(arg, sizeof(arg), "arg%d", i); 1336219974Smav diskname = gctl_get_asciiparam(req, arg); 1337219974Smav if (diskname == NULL) { 1338219974Smav gctl_error(req, "No disk name (%s).", arg); 1339219974Smav error = -3; 1340219974Smav break; 1341219974Smav } 1342219974Smav 1343219974Smav /* Try to find provider with specified name. */ 1344219974Smav g_topology_lock(); 1345219974Smav cp = g_raid_open_consumer(sc, diskname); 1346219974Smav if (cp == NULL) { 1347219974Smav gctl_error(req, "Can't open disk '%s'.", 1348219974Smav diskname); 1349219974Smav g_topology_unlock(); 1350219974Smav error = -4; 1351219974Smav break; 1352219974Smav } 1353219974Smav pp = cp->provider; 1354219974Smav 1355219974Smav pd = malloc(sizeof(*pd), M_MD_NVIDIA, M_WAITOK | M_ZERO); 1356219974Smav pd->pd_disk_pos = -3; 1357219974Smav pd->pd_disk_size = pp->mediasize; 1358219974Smav 1359219974Smav disk = g_raid_create_disk(sc); 1360219974Smav disk->d_consumer = cp; 1361219974Smav disk->d_md_data = (void *)pd; 1362219974Smav cp->private = disk; 1363219974Smav g_topology_unlock(); 1364219974Smav 1365243678Smav g_raid_get_disk_info(disk); 1366219974Smav 1367219974Smav /* Welcome the "new" disk. */ 1368219974Smav update += g_raid_md_nvidia_start_disk(disk); 1369219974Smav if (disk->d_state != G_RAID_DISK_S_SPARE && 1370219974Smav disk->d_state != G_RAID_DISK_S_ACTIVE) { 1371219974Smav gctl_error(req, "Disk '%s' doesn't fit.", 1372219974Smav diskname); 1373219974Smav g_raid_destroy_disk(disk); 1374219974Smav error = -8; 1375219974Smav break; 1376219974Smav } 1377219974Smav } 1378219974Smav 1379219974Smav /* Write new metadata if we changed something. */ 1380219974Smav if (update) 1381219974Smav g_raid_md_write_nvidia(md, NULL, NULL, NULL); 1382219974Smav return (error); 1383219974Smav } 1384219974Smav gctl_error(req, "Command '%s' is not supported.", verb); 1385219974Smav return (-100); 1386219974Smav} 1387219974Smav 1388219974Smavstatic int 1389219974Smavg_raid_md_write_nvidia(struct g_raid_md_object *md, struct g_raid_volume *tvol, 1390219974Smav struct g_raid_subdisk *tsd, struct g_raid_disk *tdisk) 1391219974Smav{ 1392219974Smav struct g_raid_softc *sc; 1393219974Smav struct g_raid_volume *vol; 1394219974Smav struct g_raid_subdisk *sd; 1395219974Smav struct g_raid_disk *disk; 1396219974Smav struct g_raid_md_nvidia_object *mdi; 1397219974Smav struct g_raid_md_nvidia_perdisk *pd; 1398219974Smav struct nvidia_raid_conf *meta; 1399219974Smav int i, spares; 1400219974Smav 1401219974Smav sc = md->mdo_softc; 1402219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 1403219974Smav 1404219974Smav if (sc->sc_stopping == G_RAID_DESTROY_HARD) 1405219974Smav return (0); 1406219974Smav 1407219974Smav /* There is only one volume. */ 1408219974Smav vol = TAILQ_FIRST(&sc->sc_volumes); 1409219974Smav 1410219974Smav /* Fill global fields. */ 1411219974Smav meta = malloc(sizeof(*meta), M_MD_NVIDIA, M_WAITOK | M_ZERO); 1412219974Smav if (mdi->mdio_meta) 1413219974Smav memcpy(meta, mdi->mdio_meta, sizeof(*meta)); 1414220209Smav memcpy(meta->nvidia_id, NVIDIA_MAGIC, sizeof(NVIDIA_MAGIC) - 1); 1415219974Smav meta->config_size = 30; 1416219974Smav meta->version = 0x0064; 1417219974Smav meta->total_sectors = vol->v_mediasize / vol->v_sectorsize; 1418219974Smav meta->sector_size = vol->v_sectorsize; 1419219974Smav nvidia_meta_put_name(meta, vol->v_name); 1420219974Smav meta->magic_0 = NVIDIA_MAGIC0; 1421219974Smav memcpy(&meta->volume_id, &mdi->mdio_volume_id, 16); 1422219974Smav meta->state = NVIDIA_S_IDLE; 1423219974Smav if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID1) 1424219974Smav meta->array_width = 1; 1425219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID1E) 1426219974Smav meta->array_width = vol->v_disks_count / 2; 1427219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID5) 1428219974Smav meta->array_width = vol->v_disks_count - 1; 1429219974Smav else 1430219974Smav meta->array_width = vol->v_disks_count; 1431219974Smav meta->total_disks = vol->v_disks_count; 1432219974Smav meta->orig_array_width = meta->array_width; 1433219974Smav if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID0) 1434219974Smav meta->type = NVIDIA_T_RAID0; 1435219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID1) 1436219974Smav meta->type = NVIDIA_T_RAID1; 1437219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_RAID1E) 1438219974Smav meta->type = NVIDIA_T_RAID01; 1439219974Smav else if (vol->v_raid_level == G_RAID_VOLUME_RL_CONCAT || 1440219974Smav vol->v_raid_level == G_RAID_VOLUME_RL_SINGLE) 1441219974Smav meta->type = NVIDIA_T_CONCAT; 1442235874Smav else if (vol->v_raid_level_qualifier == G_RAID_VOLUME_RLQ_R5LA) 1443235874Smav meta->type = NVIDIA_T_RAID5; 1444219974Smav else 1445219974Smav meta->type = NVIDIA_T_RAID5_SYM; 1446219974Smav meta->strip_sectors = vol->v_strip_size / vol->v_sectorsize; 1447219974Smav meta->strip_bytes = vol->v_strip_size; 1448219974Smav meta->strip_shift = ffs(meta->strip_sectors) - 1; 1449219974Smav meta->strip_mask = meta->strip_sectors - 1; 1450219974Smav meta->stripe_sectors = meta->strip_sectors * meta->orig_array_width; 1451219974Smav meta->stripe_bytes = meta->stripe_sectors * vol->v_sectorsize; 1452219974Smav meta->rebuild_lba = 0; 1453219974Smav meta->orig_type = meta->type; 1454219974Smav meta->orig_total_sectors = meta->total_sectors; 1455219974Smav meta->status = 0; 1456219974Smav 1457219974Smav for (i = 0; i < vol->v_disks_count; i++) { 1458219974Smav sd = &vol->v_subdisks[i]; 1459219974Smav if ((sd->sd_state == G_RAID_SUBDISK_S_STALE || 1460219974Smav sd->sd_state == G_RAID_SUBDISK_S_RESYNC || 1461219974Smav vol->v_dirty) && 1462219974Smav meta->state != NVIDIA_S_REBUILD) 1463219974Smav meta->state = NVIDIA_S_SYNC; 1464219974Smav else if (sd->sd_state == G_RAID_SUBDISK_S_NEW || 1465219974Smav sd->sd_state == G_RAID_SUBDISK_S_REBUILD) 1466219974Smav meta->state = NVIDIA_S_REBUILD; 1467219974Smav } 1468219974Smav 1469219974Smav /* We are done. Print meta data and store them to disks. */ 1470219974Smav if (mdi->mdio_meta != NULL) 1471219974Smav free(mdi->mdio_meta, M_MD_NVIDIA); 1472219974Smav mdi->mdio_meta = meta; 1473219974Smav spares = 0; 1474219974Smav TAILQ_FOREACH(disk, &sc->sc_disks, d_next) { 1475219974Smav pd = (struct g_raid_md_nvidia_perdisk *)disk->d_md_data; 1476219974Smav if (disk->d_state != G_RAID_DISK_S_ACTIVE && 1477219974Smav disk->d_state != G_RAID_DISK_S_SPARE) 1478219974Smav continue; 1479219974Smav if (pd->pd_meta != NULL) { 1480219974Smav free(pd->pd_meta, M_MD_NVIDIA); 1481219974Smav pd->pd_meta = NULL; 1482219974Smav } 1483219974Smav pd->pd_meta = nvidia_meta_copy(meta); 1484219974Smav if ((sd = TAILQ_FIRST(&disk->d_subdisks)) != NULL) { 1485219974Smav /* For RAID0+1 we need to translate order. */ 1486219974Smav pd->pd_meta->disk_number = 1487219974Smav nvidia_meta_translate_disk(meta, sd->sd_pos); 1488219974Smav if (sd->sd_state != G_RAID_SUBDISK_S_ACTIVE) { 1489219974Smav pd->pd_meta->disk_status = 0x100; 1490219974Smav pd->pd_meta->rebuild_lba = 1491219974Smav sd->sd_rebuild_pos / vol->v_sectorsize * 1492219974Smav meta->array_width; 1493219974Smav } 1494219974Smav } else 1495219974Smav pd->pd_meta->disk_number = meta->total_disks + spares++; 1496219974Smav G_RAID_DEBUG(1, "Writing NVIDIA metadata to %s", 1497219974Smav g_raid_get_diskname(disk)); 1498219974Smav g_raid_md_nvidia_print(pd->pd_meta); 1499219974Smav nvidia_meta_write(disk->d_consumer, pd->pd_meta); 1500219974Smav } 1501219974Smav return (0); 1502219974Smav} 1503219974Smav 1504219974Smavstatic int 1505219974Smavg_raid_md_fail_disk_nvidia(struct g_raid_md_object *md, 1506219974Smav struct g_raid_subdisk *tsd, struct g_raid_disk *tdisk) 1507219974Smav{ 1508219974Smav struct g_raid_softc *sc; 1509219974Smav struct g_raid_md_nvidia_perdisk *pd; 1510219974Smav struct g_raid_subdisk *sd; 1511219974Smav 1512219974Smav sc = md->mdo_softc; 1513219974Smav pd = (struct g_raid_md_nvidia_perdisk *)tdisk->d_md_data; 1514219974Smav 1515219974Smav /* We can't fail disk that is not a part of array now. */ 1516219974Smav if (pd->pd_disk_pos < 0) 1517219974Smav return (-1); 1518219974Smav 1519219974Smav /* Erase metadata to prevent disks's later resurrection. */ 1520219974Smav if (tdisk->d_consumer) 1521219974Smav nvidia_meta_erase(tdisk->d_consumer); 1522219974Smav 1523219974Smav /* Change states. */ 1524219974Smav g_raid_change_disk_state(tdisk, G_RAID_DISK_S_FAILED); 1525219974Smav TAILQ_FOREACH(sd, &tdisk->d_subdisks, sd_next) { 1526219974Smav g_raid_change_subdisk_state(sd, 1527219974Smav G_RAID_SUBDISK_S_FAILED); 1528219974Smav g_raid_event_send(sd, G_RAID_SUBDISK_E_FAILED, 1529219974Smav G_RAID_EVENT_SUBDISK); 1530219974Smav } 1531219974Smav 1532219974Smav /* Write updated metadata to remaining disks. */ 1533219974Smav g_raid_md_write_nvidia(md, NULL, NULL, tdisk); 1534219974Smav 1535219974Smav /* Check if anything left except placeholders. */ 1536219974Smav if (g_raid_ndisks(sc, -1) == 1537219974Smav g_raid_ndisks(sc, G_RAID_DISK_S_OFFLINE)) 1538219974Smav g_raid_destroy_node(sc, 0); 1539219974Smav else 1540219974Smav g_raid_md_nvidia_refill(sc); 1541219974Smav return (0); 1542219974Smav} 1543219974Smav 1544219974Smavstatic int 1545219974Smavg_raid_md_free_disk_nvidia(struct g_raid_md_object *md, 1546219974Smav struct g_raid_disk *disk) 1547219974Smav{ 1548219974Smav struct g_raid_md_nvidia_perdisk *pd; 1549219974Smav 1550219974Smav pd = (struct g_raid_md_nvidia_perdisk *)disk->d_md_data; 1551219974Smav if (pd->pd_meta != NULL) { 1552219974Smav free(pd->pd_meta, M_MD_NVIDIA); 1553219974Smav pd->pd_meta = NULL; 1554219974Smav } 1555219974Smav free(pd, M_MD_NVIDIA); 1556219974Smav disk->d_md_data = NULL; 1557219974Smav return (0); 1558219974Smav} 1559219974Smav 1560219974Smavstatic int 1561219974Smavg_raid_md_free_nvidia(struct g_raid_md_object *md) 1562219974Smav{ 1563219974Smav struct g_raid_md_nvidia_object *mdi; 1564219974Smav 1565219974Smav mdi = (struct g_raid_md_nvidia_object *)md; 1566219974Smav if (!mdi->mdio_started) { 1567219974Smav mdi->mdio_started = 0; 1568219974Smav callout_stop(&mdi->mdio_start_co); 1569219974Smav G_RAID_DEBUG1(1, md->mdo_softc, 1570219974Smav "root_mount_rel %p", mdi->mdio_rootmount); 1571219974Smav root_mount_rel(mdi->mdio_rootmount); 1572219974Smav mdi->mdio_rootmount = NULL; 1573219974Smav } 1574219974Smav if (mdi->mdio_meta != NULL) { 1575219974Smav free(mdi->mdio_meta, M_MD_NVIDIA); 1576219974Smav mdi->mdio_meta = NULL; 1577219974Smav } 1578219974Smav return (0); 1579219974Smav} 1580219974Smav 1581240552SmavG_RAID_MD_DECLARE(nvidia, "NVIDIA"); 1582