/* geom_disk.c revision 112002 */
192108Sphk/*- 292108Sphk * Copyright (c) 2002 Poul-Henning Kamp 392108Sphk * Copyright (c) 2002 Networks Associates Technology, Inc. 492108Sphk * All rights reserved. 592108Sphk * 692108Sphk * This software was developed for the FreeBSD Project by Poul-Henning Kamp 792108Sphk * and NAI Labs, the Security Research Division of Network Associates, Inc. 892108Sphk * under DARPA/SPAWAR contract N66001-01-C-8035 ("CBOSS"), as part of the 992108Sphk * DARPA CHATS research program. 1092108Sphk * 1192108Sphk * Redistribution and use in source and binary forms, with or without 1292108Sphk * modification, are permitted provided that the following conditions 1392108Sphk * are met: 1492108Sphk * 1. Redistributions of source code must retain the above copyright 1592108Sphk * notice, this list of conditions and the following disclaimer. 1692108Sphk * 2. Redistributions in binary form must reproduce the above copyright 1792108Sphk * notice, this list of conditions and the following disclaimer in the 1892108Sphk * documentation and/or other materials provided with the distribution. 1992108Sphk * 3. The names of the authors may not be used to endorse or promote 2092108Sphk * products derived from this software without specific prior written 2192108Sphk * permission. 2292108Sphk * 2392108Sphk * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 2492108Sphk * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 2592108Sphk * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 2692108Sphk * ARE DISCLAIMED. 
IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 2792108Sphk * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 2892108Sphk * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 2992108Sphk * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 3092108Sphk * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 3192108Sphk * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 3292108Sphk * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 3392108Sphk * SUCH DAMAGE. 3492108Sphk * 3592108Sphk * $FreeBSD: head/sys/geom/geom_disk.c 112002 2003-03-08 20:00:11Z phk $ 3692108Sphk */ 3792108Sphk 38104519Sphk#include "opt_geom.h" 39104519Sphk 4092108Sphk#include <sys/param.h> 4192108Sphk#include <sys/systm.h> 4292108Sphk#include <sys/kernel.h> 4392108Sphk#include <sys/sysctl.h> 4492108Sphk#include <sys/bio.h> 4592108Sphk#include <sys/conf.h> 4692108Sphk#include <sys/disk.h> 47110119Sphk#include <sys/fcntl.h> 4892108Sphk#include <sys/malloc.h> 4992108Sphk#include <sys/sysctl.h> 50103284Sphk#include <sys/stdint.h> 51111979Sphk#include <sys/devicestat.h> 5292108Sphk#include <machine/md_var.h> 5392108Sphk 5492108Sphk#include <sys/lock.h> 5592108Sphk#include <sys/mutex.h> 5692108Sphk#include <geom/geom.h> 5792108Sphk 58110720Sphkstatic struct mtx g_disk_done_mtx; 59110720Sphk 6092108Sphkstatic g_access_t g_disk_access; 6192108Sphk 6293248Sphkstruct g_class g_disk_class = { 6397075Sphk "DISK", 6492108Sphk NULL, 6592108Sphk NULL, 6698066Sphk G_CLASS_INITIALIZER 6792108Sphk}; 6892108Sphk 69110720Sphkstatic void 70110720Sphkg_disk_init(void) 71110720Sphk{ 72110720Sphk mtx_unlock(&Giant); 73110720Sphk g_add_class(&g_disk_class); 74110720Sphk mtx_init(&g_disk_done_mtx, "g_disk_done", MTX_DEF, 0); 75110720Sphk mtx_lock(&Giant); 76110720Sphk} 77104936Sphk 78110720SphkDECLARE_GEOM_CLASS_INIT(g_disk_class, g_disk, g_disk_init); 79110720Sphk 
80110052Sphkstatic void __inline 81110052Sphkg_disk_lock_giant(struct disk *dp) 82110052Sphk{ 83110119Sphk if (dp->d_flags & DISKFLAG_NOGIANT) 84110119Sphk return; 85110119Sphk mtx_lock(&Giant); 86110052Sphk} 87110052Sphk 88110052Sphkstatic void __inline 89110052Sphkg_disk_unlock_giant(struct disk *dp) 90110052Sphk{ 91110119Sphk if (dp->d_flags & DISKFLAG_NOGIANT) 92110119Sphk return; 93110119Sphk mtx_unlock(&Giant); 94110052Sphk} 95110052Sphk 9692108Sphkstatic int 9792108Sphkg_disk_access(struct g_provider *pp, int r, int w, int e) 9892108Sphk{ 9992108Sphk struct disk *dp; 10092108Sphk int error; 10192108Sphk 10292108Sphk g_trace(G_T_ACCESS, "g_disk_access(%s, %d, %d, %d)", 10392108Sphk pp->name, r, w, e); 10492108Sphk g_topology_assert(); 10592108Sphk r += pp->acr; 10692108Sphk w += pp->acw; 10792108Sphk e += pp->ace; 10892108Sphk dp = pp->geom->softc; 109110119Sphk error = 0; 11092108Sphk if ((pp->acr + pp->acw + pp->ace) == 0 && (r + w + e) > 0) { 111111668Sphk if (dp->d_open != NULL) { 112110119Sphk g_disk_lock_giant(dp); 113111668Sphk error = dp->d_open(dp); 114110119Sphk if (error != 0) 115110119Sphk printf("Opened disk %s -> %d\n", 116110119Sphk pp->name, error); 117110119Sphk g_disk_unlock_giant(dp); 118110119Sphk } 119105551Sphk pp->mediasize = dp->d_mediasize; 120105551Sphk pp->sectorsize = dp->d_sectorsize; 121110119Sphk dp->d_flags |= DISKFLAG_OPEN; 122110727Sphk if (dp->d_maxsize == 0) { 123110727Sphk printf("WARNING: Disk drive %s%d has no d_maxsize\n", 124110727Sphk dp->d_name, dp->d_unit); 125110727Sphk dp->d_maxsize = DFLTPHYS; 126110727Sphk } 12792108Sphk } else if ((pp->acr + pp->acw + pp->ace) > 0 && (r + w + e) == 0) { 128111668Sphk if (dp->d_close != NULL) { 129110119Sphk g_disk_lock_giant(dp); 130111668Sphk error = dp->d_close(dp); 131110119Sphk if (error != 0) 132110119Sphk printf("Closed disk %s -> %d\n", 133110119Sphk pp->name, error); 134110119Sphk g_disk_unlock_giant(dp); 135110119Sphk } 136110119Sphk dp->d_flags &= ~DISKFLAG_OPEN; 
13792108Sphk } 13892108Sphk return (error); 13992108Sphk} 14092108Sphk 14192108Sphkstatic void 14295038Sphkg_disk_kerneldump(struct bio *bp, struct disk *dp) 14395038Sphk{ 14495038Sphk int error; 14595038Sphk struct g_kerneldump *gkd; 14695038Sphk struct dumperinfo di; 147104450Sphk struct g_geom *gp; 14895038Sphk 14995038Sphk gkd = (struct g_kerneldump*)bp->bio_data; 150104450Sphk gp = bp->bio_to->geom; 151104450Sphk g_trace(G_T_TOPOLOGY, "g_disk_kernedump(%s, %jd, %jd)", 152104450Sphk gp->name, (intmax_t)gkd->offset, (intmax_t)gkd->length); 153110119Sphk di.dumper = dp->d_dump; 154111220Sphk di.priv = dp; 155103714Sphk di.blocksize = dp->d_sectorsize; 15695038Sphk di.mediaoffset = gkd->offset; 15795038Sphk di.mediasize = gkd->length; 15895038Sphk error = set_dumper(&di); 159104195Sphk g_io_deliver(bp, error); 16095038Sphk} 16195038Sphk 16295038Sphkstatic void 16392108Sphkg_disk_done(struct bio *bp) 16492108Sphk{ 165111979Sphk struct bio *bp2; 166111979Sphk struct disk *dp; 167111979Sphk devstat_trans_flags flg; 16892108Sphk 169110720Sphk /* See "notes" for why we need a mutex here */ 170110720Sphk /* XXX: will witness accept a mix of Giant/unGiant drivers here ? 
*/ 171110720Sphk mtx_lock(&g_disk_done_mtx); 17292108Sphk bp->bio_completed = bp->bio_length - bp->bio_resid; 173111979Sphk 174111979Sphk bp2 = bp->bio_parent; 175111979Sphk dp = bp2->bio_to->geom->softc; 176111979Sphk if (bp2->bio_error == 0) 177111979Sphk bp2->bio_error = bp->bio_error; 178111979Sphk bp2->bio_completed += bp->bio_completed; 179111979Sphk g_destroy_bio(bp); 180111979Sphk bp2->bio_inbed++; 181111979Sphk if (bp2->bio_children == bp2->bio_inbed) { 182111979Sphk if (bp2->bio_cmd == BIO_DELETE) 183111979Sphk flg = DEVSTAT_FREE; 184111979Sphk else if (bp2->bio_cmd == BIO_READ) 185111979Sphk flg = DEVSTAT_READ; 186111979Sphk else 187111979Sphk flg = DEVSTAT_WRITE; 188111979Sphk devstat_end_transaction(dp->d_devstat, bp2->bio_completed, 189111979Sphk DEVSTAT_TAG_SIMPLE, flg); 190111979Sphk g_io_deliver(bp2, bp2->bio_error); 191111979Sphk } 192110720Sphk mtx_unlock(&g_disk_done_mtx); 19392108Sphk} 19492108Sphk 19592108Sphkstatic void 19692108Sphkg_disk_start(struct bio *bp) 19792108Sphk{ 198110720Sphk struct bio *bp2, *bp3; 19992108Sphk struct disk *dp; 20092403Sphk struct g_ioctl *gio; 20192403Sphk int error; 202110720Sphk off_t off; 20392108Sphk 20492108Sphk dp = bp->bio_to->geom->softc; 205104609Sphk error = EJUSTRETURN; 20692108Sphk switch(bp->bio_cmd) { 207104609Sphk case BIO_DELETE: 208110119Sphk if (!(dp->d_flags & DISKFLAG_CANDELETE)) { 209104609Sphk error = 0; 210104609Sphk break; 211104609Sphk } 212104609Sphk /* fall-through */ 21392108Sphk case BIO_READ: 21492108Sphk case BIO_WRITE: 215110720Sphk off = 0; 216110720Sphk bp3 = NULL; 21792108Sphk bp2 = g_clone_bio(bp); 218110477Sphk if (bp2 == NULL) { 219110477Sphk error = ENOMEM; 220110477Sphk break; 221110477Sphk } 222111979Sphk devstat_start_transaction(dp->d_devstat); 223110720Sphk do { 224110720Sphk bp2->bio_offset += off; 225110720Sphk bp2->bio_length -= off; 226110766Stegge bp2->bio_data += off; 227110720Sphk if (bp2->bio_length > dp->d_maxsize) { 228110720Sphk /* 229110720Sphk * XXX: If we 
have a stripesize we should really 230110720Sphk * use it here. 231110720Sphk */ 232110720Sphk bp2->bio_length = dp->d_maxsize; 233110720Sphk off += dp->d_maxsize; 234110720Sphk /* 235110720Sphk * To avoid a race, we need to grab the next bio 236110720Sphk * before we schedule this one. See "notes". 237110720Sphk */ 238110720Sphk bp3 = g_clone_bio(bp); 239110720Sphk if (bp3 == NULL) 240110720Sphk bp->bio_error = ENOMEM; 241110720Sphk } 242110720Sphk bp2->bio_done = g_disk_done; 243110720Sphk bp2->bio_blkno = bp2->bio_offset >> DEV_BSHIFT; 244110720Sphk bp2->bio_pblkno = bp2->bio_offset / dp->d_sectorsize; 245110720Sphk bp2->bio_bcount = bp2->bio_length; 246110720Sphk bp2->bio_disk = dp; 247110720Sphk g_disk_lock_giant(dp); 248110720Sphk dp->d_strategy(bp2); 249110720Sphk g_disk_unlock_giant(dp); 250110720Sphk bp2 = bp3; 251110720Sphk bp3 = NULL; 252110720Sphk } while (bp2 != NULL); 25392108Sphk break; 25492108Sphk case BIO_GETATTR: 255105551Sphk if (g_handleattr_int(bp, "GEOM::fwsectors", dp->d_fwsectors)) 25692403Sphk break; 257103714Sphk else if (g_handleattr_int(bp, "GEOM::fwheads", dp->d_fwheads)) 25892403Sphk break; 25998066Sphk else if (g_handleattr_off_t(bp, "GEOM::frontstuff", 0)) 26094287Sphk break; 26195038Sphk else if (!strcmp(bp->bio_attribute, "GEOM::kerneldump")) 26295038Sphk g_disk_kerneldump(bp, dp); 263111668Sphk else if ((dp->d_ioctl != NULL) && 264110119Sphk !strcmp(bp->bio_attribute, "GEOM::ioctl") && 26592403Sphk bp->bio_length == sizeof *gio) { 266104602Sphk gio = (struct g_ioctl *)bp->bio_data; 267111668Sphk gio->dev = dp; 268111668Sphk gio->func = (d_ioctl_t *)(dp->d_ioctl); 269104602Sphk error = EDIRIOCTL; 27092403Sphk } else 27192403Sphk error = ENOIOCTL; 27292403Sphk break; 273104542Sphk case BIO_SETATTR: 274111668Sphk error = ENOIOCTL; 275104542Sphk break; 27692108Sphk default: 27792403Sphk error = EOPNOTSUPP; 27892403Sphk break; 27992403Sphk } 280104609Sphk if (error != EJUSTRETURN) 281104195Sphk g_io_deliver(bp, error); 28292403Sphk 
return; 28392108Sphk} 28492108Sphk 285104936Sphkstatic void 286107953Sphkg_disk_dumpconf(struct sbuf *sb, const char *indent, struct g_geom *gp, struct g_consumer *cp, struct g_provider *pp) 287105537Sphk{ 288105537Sphk struct disk *dp; 289105537Sphk 290105537Sphk dp = gp->softc; 291106101Sphk if (indent == NULL) { 292106101Sphk sbuf_printf(sb, " hd %u", dp->d_fwheads); 293106101Sphk sbuf_printf(sb, " sc %u", dp->d_fwsectors); 294106101Sphk return; 295106101Sphk } 296105539Sphk if (pp != NULL) { 297105537Sphk sbuf_printf(sb, "%s<fwheads>%u</fwheads>\n", 298105537Sphk indent, dp->d_fwheads); 299105537Sphk sbuf_printf(sb, "%s<fwsectors>%u</fwsectors>\n", 300105537Sphk indent, dp->d_fwsectors); 301105537Sphk } 302105537Sphk} 303105537Sphk 304105537Sphkstatic void 305104936Sphkg_disk_create(void *arg) 30692108Sphk{ 30792108Sphk struct g_geom *gp; 30892108Sphk struct g_provider *pp; 309110708Sphk struct disk *dp; 31092108Sphk 311104936Sphk g_topology_assert(); 312110708Sphk dp = arg; 313110708Sphk gp = g_new_geomf(&g_disk_class, "%s%d", dp->d_name, dp->d_unit); 314104936Sphk gp->start = g_disk_start; 315104936Sphk gp->access = g_disk_access; 316110708Sphk gp->softc = dp; 317105537Sphk gp->dumpconf = g_disk_dumpconf; 318110708Sphk dp->d_geom = gp; 319104936Sphk pp = g_new_providerf(gp, "%s", gp->name); 320110708Sphk pp->mediasize = dp->d_mediasize; 321110708Sphk pp->sectorsize = dp->d_sectorsize; 322110708Sphk if (dp->d_flags & DISKFLAG_CANDELETE) 323110708Sphk pp->flags |= G_PF_CANDELETE; 324110710Sphk pp->stripeoffset = dp->d_stripeoffset; 325110710Sphk pp->stripesize = dp->d_stripesize; 326104936Sphk g_error_provider(pp, 0); 327105957Sphk if (bootverbose) 328105957Sphk printf("GEOM: new disk %s\n", gp->name); 329104936Sphk} 330104936Sphk 331104936Sphk 332104936Sphk 333111668Sphkvoid 334111668Sphkdisk_create(int unit, struct disk *dp, int flags, void *unused __unused, void * unused2 __unused) 335104936Sphk{ 336104936Sphk 337110708Sphk dp->d_unit = unit; 338110119Sphk 
dp->d_flags = flags; 339110119Sphk KASSERT(dp->d_strategy != NULL, ("disk_create need d_strategy")); 340110119Sphk KASSERT(dp->d_name != NULL, ("disk_create need d_name")); 341110119Sphk KASSERT(*dp->d_name != 0, ("disk_create need d_name")); 342110317Sphk KASSERT(strlen(dp->d_name) < SPECNAMELEN - 4, ("disk name too long")); 343112002Sphk dp->d_devstat = devstat_new_entry(dp->d_name, dp->d_unit, 344111979Sphk dp->d_sectorsize, DEVSTAT_ALL_SUPPORTED, 345111979Sphk DEVSTAT_TYPE_DIRECT, DEVSTAT_PRIORITY_MAX); 346110708Sphk g_call_me(g_disk_create, dp); 34792108Sphk} 34892108Sphk 34992108Sphkvoid 350111216Sphkdisk_destroy(struct disk *dp) 35192108Sphk{ 35292108Sphk struct g_geom *gp; 35392108Sphk 354110419Sphk gp = dp->d_geom; 35592108Sphk gp->flags |= G_GEOM_WITHER; 356110119Sphk gp->softc = NULL; 35792108Sphk g_orphan_provider(LIST_FIRST(&gp->provider), ENXIO); 358111979Sphk devstat_remove_entry(dp->d_devstat); 35992108Sphk} 36092108Sphk 361104451Sphkstatic void 362104451Sphkg_kern_disks(void *p) 363104451Sphk{ 364104451Sphk struct sbuf *sb; 365104451Sphk struct g_geom *gp; 366104451Sphk char *sp; 367104451Sphk 368104451Sphk sb = p; 369104451Sphk sp = ""; 370104451Sphk g_topology_assert(); 371104451Sphk LIST_FOREACH(gp, &g_disk_class.geom, geom) { 372104451Sphk sbuf_printf(sb, "%s%s", sp, gp->name); 373104451Sphk sp = " "; 374104451Sphk } 375104451Sphk sbuf_finish(sb); 376104451Sphk wakeup(sb); 377104451Sphk} 378104451Sphk 379104451Sphkstatic int 380104451Sphksysctl_disks(SYSCTL_HANDLER_ARGS) 381104451Sphk{ 382104451Sphk int error; 383104451Sphk struct sbuf *sb; 384104451Sphk 385104451Sphk sb = sbuf_new(NULL, NULL, 0, SBUF_AUTOEXTEND); 386104451Sphk sbuf_clear(sb); 387104451Sphk g_call_me(g_kern_disks, sb); 388104451Sphk do { 389104451Sphk tsleep(sb, PZERO, "kern.disks", hz); 390104451Sphk } while(!sbuf_done(sb)); 391105350Sphk error = SYSCTL_OUT(req, sbuf_data(sb), sbuf_len(sb) + 1); 392104451Sphk sbuf_delete(sb); 393104451Sphk return error; 394104451Sphk} 
395104451Sphk 396104451SphkSYSCTL_PROC(_kern, OID_AUTO, disks, CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_NOLOCK, 0, 0, 397104451Sphk sysctl_disks, "A", "names of available disks"); 398104519Sphk 399