kern_conf.c revision 120529
1/*- 2 * Copyright (c) 1999-2002 Poul-Henning Kamp 3 * All rights reserved. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions 7 * are met: 8 * 1. Redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer. 10 * 2. Redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution. 13 * 14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 15 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 16 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 17 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 19 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 20 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 21 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 22 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 23 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 24 * SUCH DAMAGE. 25 */ 26 27#include <sys/cdefs.h> 28__FBSDID("$FreeBSD: head/sys/kern/kern_conf.c 120529 2003-09-27 21:50:00Z phk $"); 29 30#include <sys/param.h> 31#include <sys/kernel.h> 32#include <sys/systm.h> 33#include <sys/bio.h> 34#include <sys/lock.h> 35#include <sys/mutex.h> 36#include <sys/sysctl.h> 37#include <sys/module.h> 38#include <sys/malloc.h> 39#include <sys/conf.h> 40#include <sys/vnode.h> 41#include <sys/queue.h> 42#include <sys/poll.h> 43#include <sys/ctype.h> 44#include <machine/stdarg.h> 45 46static MALLOC_DEFINE(M_DEVT, "dev_t", "dev_t storage"); 47 48/* Built at compile time from sys/conf/majors */ 49extern unsigned char reserved_majors[256]; 50 51/* 52 * This is the number of hash-buckets. Experiements with 'real-life' 53 * udev_t's show that a prime halfway between two powers of two works 54 * best. 55 */ 56#define DEVT_HASH 83 57 58/* The number of dev_t's we can create before malloc(9) kick in. */ 59#define DEVT_STASH 50 60 61static struct cdev devt_stash[DEVT_STASH]; 62 63static LIST_HEAD(, cdev) dev_hash[DEVT_HASH]; 64 65static LIST_HEAD(, cdev) dev_free; 66 67static int ready_for_devs; 68 69static int free_devt; 70SYSCTL_INT(_debug, OID_AUTO, free_devt, CTLFLAG_RW, &free_devt, 0, ""); 71 72int 73nullop(void) 74{ 75 76 return (0); 77} 78 79int 80eopnotsupp(void) 81{ 82 83 return (EOPNOTSUPP); 84} 85 86static int 87enxio(void) 88{ 89 return (ENXIO); 90} 91 92static int 93enodev(void) 94{ 95 return (ENODEV); 96} 97 98/* Define a dead_cdevsw for use when devices leave unexpectedly. */ 99 100#define dead_open (d_open_t *)enxio 101#define dead_close (d_close_t *)enxio 102#define dead_read (d_read_t *)enxio 103#define dead_write (d_write_t *)enxio 104#define dead_ioctl (d_ioctl_t *)enxio 105#define dead_poll (d_poll_t *)enodev 106#define dead_mmap (d_mmap_t *)enodev 107 108static void 109dead_strategy(struct bio *bp) 110{ 111 112 biofinish(bp, NULL, ENXIO); 113} 114 115#define dead_dump (dumper_t *)enxio 116#define dead_kqfilter (d_kqfilter_t *)enxio 117 118static struct cdevsw dead_cdevsw = { 119 .d_open = dead_open, 120 .d_close = dead_close, 121 .d_read = dead_read, 122 .d_write = dead_write, 123 .d_ioctl = dead_ioctl, 124 .d_poll = dead_poll, 125 .d_mmap = dead_mmap, 126 .d_strategy = dead_strategy, 127 .d_name = "dead", 128 .d_maj = 255, 129 .d_dump = dead_dump, 130 .d_kqfilter = dead_kqfilter 131}; 132 133/* Default methods if driver does not specify method */ 134 135#define null_open (d_open_t *)nullop 136#define null_close (d_close_t *)nullop 137#define no_read (d_read_t *)enodev 138#define no_write (d_write_t *)enodev 139#define no_ioctl (d_ioctl_t *)enodev 140#define no_mmap (d_mmap_t *)enodev 141 142static int 143no_kqfilter(dev_t dev __unused, struct knote *kn __unused) 144{ 145 146 return (1); 147} 148 149static void 150no_strategy(struct bio *bp) 151{ 152 153 biofinish(bp, NULL, ENODEV); 154} 155 156static int 157no_poll(dev_t dev __unused, int events, struct thread *td __unused) 158{ 159 /* 160 * Return true for read/write. If the user asked for something 161 * special, return POLLNVAL, so that clients have a way of 162 * determining reliably whether or not the extended 163 * functionality is present without hard-coding knowledge 164 * of specific filesystem implementations. 165 * Stay in sync with vop_nopoll(). 166 */ 167 if (events & ~POLLSTANDARD) 168 return (POLLNVAL); 169 170 return (events & (POLLIN | POLLOUT | POLLRDNORM | POLLWRNORM)); 171} 172 173#define no_dump (dumper_t *)enodev 174 175struct cdevsw * 176devsw(dev_t dev) 177{ 178 if (dev->si_devsw) 179 return (dev->si_devsw); 180 return (&dead_cdevsw); 181} 182 183/* 184 * dev_t and u_dev_t primitives 185 */ 186 187int 188major(dev_t x) 189{ 190 if (x == NODEV) 191 return NOUDEV; 192 return((x->si_udev >> 8) & 0xff); 193} 194 195int 196minor(dev_t x) 197{ 198 if (x == NODEV) 199 return NOUDEV; 200 return(x->si_udev & 0xffff00ff); 201} 202 203int 204dev2unit(dev_t x) 205{ 206 int i; 207 208 if (x == NODEV) 209 return NOUDEV; 210 i = minor(x); 211 return ((i & 0xff) | (i >> 8)); 212} 213 214int 215unit2minor(int unit) 216{ 217 218 KASSERT(unit <= 0xffffff, ("Invalid unit (%d) in unit2minor", unit)); 219 return ((unit & 0xff) | ((unit << 8) & ~0xffff)); 220} 221 222static dev_t 223allocdev(void) 224{ 225 static int stashed; 226 struct cdev *si; 227 228 if (LIST_FIRST(&dev_free)) { 229 si = LIST_FIRST(&dev_free); 230 LIST_REMOVE(si, si_hash); 231 } else if (stashed >= DEVT_STASH) { 232 MALLOC(si, struct cdev *, sizeof(*si), M_DEVT, 233 M_USE_RESERVE | M_ZERO | M_WAITOK); 234 } else { 235 si = devt_stash + stashed++; 236 bzero(si, sizeof *si); 237 si->si_flags |= SI_STASHED; 238 } 239 si->__si_namebuf[0] = '\0'; 240 si->si_name = si->__si_namebuf; 241 LIST_INIT(&si->si_children); 242 TAILQ_INIT(&si->si_snapshots); 243 return (si); 244} 245 246dev_t 247makedev(int x, int y) 248{ 249 struct cdev *si; 250 udev_t udev; 251 int hash; 252 253 if (x == umajor(NOUDEV) && y == uminor(NOUDEV)) 254 panic("makedev of NOUDEV"); 255 udev = (x << 8) | y; 256 hash = udev % DEVT_HASH; 257 LIST_FOREACH(si, &dev_hash[hash], si_hash) { 258 if (si->si_udev == udev) 259 return (si); 260 } 261 si = allocdev(); 262 si->si_udev = udev; 263 LIST_INSERT_HEAD(&dev_hash[hash], si, si_hash); 264 return (si); 265} 266 267void 268freedev(dev_t dev) 269{ 270 271 if (!free_devt) 272 return; 273 if (SLIST_FIRST(&dev->si_hlist)) 274 return; 275 if (dev->si_devsw || dev->si_drv1 || dev->si_drv2) 276 return; 277 LIST_REMOVE(dev, si_hash); 278 if (dev->si_flags & SI_STASHED) { 279 bzero(dev, sizeof(*dev)); 280 dev->si_flags |= SI_STASHED; 281 LIST_INSERT_HEAD(&dev_free, dev, si_hash); 282 } else { 283 FREE(dev, M_DEVT); 284 } 285} 286 287udev_t 288dev2udev(dev_t x) 289{ 290 if (x == NODEV) 291 return NOUDEV; 292 return (x->si_udev); 293} 294 295dev_t 296udev2dev(udev_t x, int b) 297{ 298 299 if (x == NOUDEV) 300 return (NODEV); 301 switch (b) { 302 case 0: 303 return makedev(umajor(x), uminor(x)); 304 case 1: 305 return (NODEV); 306 default: 307 Debugger("udev2dev(...,X)"); 308 return NODEV; 309 } 310} 311 312int 313uminor(udev_t dev) 314{ 315 return(dev & 0xffff00ff); 316} 317 318int 319umajor(udev_t dev) 320{ 321 return((dev & 0xff00) >> 8); 322} 323 324udev_t 325makeudev(int x, int y) 326{ 327 return ((x << 8) | y); 328} 329 330dev_t 331make_dev(struct cdevsw *devsw, int minor, uid_t uid, gid_t gid, int perms, const char *fmt, ...) 332{ 333 dev_t dev; 334 va_list ap; 335 int i; 336 337 KASSERT((minor & ~0xffff00ff) == 0, 338 ("Invalid minor (0x%x) in make_dev", minor)); 339 340 if (devsw->d_open == NULL) devsw->d_open = null_open; 341 if (devsw->d_close == NULL) devsw->d_close = null_close; 342 if (devsw->d_read == NULL) devsw->d_read = no_read; 343 if (devsw->d_write == NULL) devsw->d_write = no_write; 344 if (devsw->d_ioctl == NULL) devsw->d_ioctl = no_ioctl; 345 if (devsw->d_poll == NULL) devsw->d_poll = no_poll; 346 if (devsw->d_mmap == NULL) devsw->d_mmap = no_mmap; 347 if (devsw->d_strategy == NULL) devsw->d_strategy = no_strategy; 348 if (devsw->d_dump == NULL) devsw->d_dump = no_dump; 349 if (devsw->d_kqfilter == NULL) devsw->d_kqfilter = no_kqfilter; 350 351 if (devsw->d_maj == MAJOR_AUTO) { 352 for (i = NUMCDEVSW - 1; i > 0; i--) 353 if (reserved_majors[i] != i) 354 break; 355 KASSERT(i > 0, ("Out of major numbers (%s)", devsw->d_name)); 356 devsw->d_maj = i; 357 reserved_majors[i] = i; 358 } else { 359 if (devsw->d_maj == 256) /* XXX: tty_cons.c is magic */ 360 devsw->d_maj = 0; 361 KASSERT(devsw->d_maj >= 0 && devsw->d_maj < 256, 362 ("Invalid major (%d) in make_dev", devsw->d_maj)); 363 if (reserved_majors[devsw->d_maj] != devsw->d_maj) { 364 printf("WARNING: driver \"%s\" used %s %d\n", 365 devsw->d_name, "unreserved major device number", 366 devsw->d_maj); 367 reserved_majors[devsw->d_maj] = devsw->d_maj; 368 } 369 } 370 371 if (!ready_for_devs) { 372 printf("WARNING: Driver mistake: make_dev(%s) called before SI_SUB_DRIVERS\n", 373 fmt); 374 /* XXX panic here once drivers are cleaned up */ 375 } 376 377 dev = makedev(devsw->d_maj, minor); 378 if (dev->si_flags & SI_CHEAPCLONE && 379 dev->si_flags & SI_NAMED && 380 dev->si_devsw == devsw) { 381 /* 382 * This is allowed as it removes races and generally 383 * simplifies cloning devices. 384 */ 385 return (dev); 386 } 387 if (dev->si_flags & SI_NAMED) { 388 printf( "WARNING: Driver mistake: repeat make_dev(\"%s\")\n", 389 dev->si_name); 390 panic("don't do that"); 391 } 392 va_start(ap, fmt); 393 i = vsnrprintf(dev->__si_namebuf, sizeof dev->__si_namebuf, 32, fmt, ap); 394 if (i > (sizeof dev->__si_namebuf - 1)) { 395 printf("WARNING: Device name truncated! (%s)", 396 dev->__si_namebuf); 397 } 398 va_end(ap); 399 dev->si_devsw = devsw; 400 dev->si_uid = uid; 401 dev->si_gid = gid; 402 dev->si_mode = perms; 403 dev->si_flags |= SI_NAMED; 404 405 devfs_create(dev); 406 return (dev); 407} 408 409int 410dev_named(dev_t pdev, const char *name) 411{ 412 dev_t cdev; 413 414 if (strcmp(devtoname(pdev), name) == 0) 415 return (1); 416 LIST_FOREACH(cdev, &pdev->si_children, si_siblings) 417 if (strcmp(devtoname(cdev), name) == 0) 418 return (1); 419 return (0); 420} 421 422void 423dev_depends(dev_t pdev, dev_t cdev) 424{ 425 426 cdev->si_parent = pdev; 427 cdev->si_flags |= SI_CHILD; 428 LIST_INSERT_HEAD(&pdev->si_children, cdev, si_siblings); 429} 430 431dev_t 432make_dev_alias(dev_t pdev, const char *fmt, ...) 433{ 434 dev_t dev; 435 va_list ap; 436 int i; 437 438 dev = allocdev(); 439 dev->si_flags |= SI_ALIAS; 440 dev->si_flags |= SI_NAMED; 441 dev_depends(pdev, dev); 442 va_start(ap, fmt); 443 i = vsnrprintf(dev->__si_namebuf, sizeof dev->__si_namebuf, 32, fmt, ap); 444 if (i > (sizeof dev->__si_namebuf - 1)) { 445 printf("WARNING: Device name truncated! (%s)", 446 dev->__si_namebuf); 447 } 448 va_end(ap); 449 450 devfs_create(dev); 451 return (dev); 452} 453 454void 455revoke_and_destroy_dev(dev_t dev) 456{ 457 struct vnode *vp; 458 459 GIANT_REQUIRED; 460 461 vp = SLIST_FIRST(&dev->si_hlist); 462 if (vp != NULL) 463 VOP_REVOKE(vp, REVOKEALL); 464 destroy_dev(dev); 465} 466 467void 468destroy_dev(dev_t dev) 469{ 470 471 if (!(dev->si_flags & SI_NAMED)) { 472 printf( "WARNING: Driver mistake: destroy_dev on %d/%d\n", 473 major(dev), minor(dev)); 474 panic("don't do that"); 475 } 476 477 devfs_destroy(dev); 478 if (dev->si_flags & SI_CHILD) { 479 LIST_REMOVE(dev, si_siblings); 480 dev->si_flags &= ~SI_CHILD; 481 } 482 while (!LIST_EMPTY(&dev->si_children)) 483 destroy_dev(LIST_FIRST(&dev->si_children)); 484 dev->si_drv1 = 0; 485 dev->si_drv2 = 0; 486 dev->si_devsw = 0; 487 bzero(&dev->__si_u, sizeof(dev->__si_u)); 488 dev->si_flags &= ~SI_NAMED; 489 dev->si_flags &= ~SI_ALIAS; 490 freedev(dev); 491} 492 493const char * 494devtoname(dev_t dev) 495{ 496 char *p; 497 int mynor; 498 499 if (dev->si_name[0] == '#' || dev->si_name[0] == '\0') { 500 p = dev->si_name; 501 if (devsw(dev)) 502 sprintf(p, "#%s/", devsw(dev)->d_name); 503 else 504 sprintf(p, "#%d/", major(dev)); 505 p += strlen(p); 506 mynor = minor(dev); 507 if (mynor < 0 || mynor > 255) 508 sprintf(p, "%#x", (u_int)mynor); 509 else 510 sprintf(p, "%d", mynor); 511 } 512 return (dev->si_name); 513} 514 515int 516dev_stdclone(char *name, char **namep, const char *stem, int *unit) 517{ 518 int u, i; 519 520 i = strlen(stem); 521 if (bcmp(stem, name, i) != 0) 522 return (0); 523 if (!isdigit(name[i])) 524 return (0); 525 u = 0; 526 if (name[i] == '0' && isdigit(name[i+1])) 527 return (0); 528 while (isdigit(name[i])) { 529 u *= 10; 530 u += name[i++] - '0'; 531 } 532 if (u > 0xffffff) 533 return (0); 534 *unit = u; 535 if (namep) 536 *namep = &name[i]; 537 if (name[i]) 538 return (2); 539 return (1); 540} 541 542/* 543 * Helper sysctl for devname(3). We're given a {u}dev_t and return 544 * the name, if any, registered by the device driver. 545 */ 546static int 547sysctl_devname(SYSCTL_HANDLER_ARGS) 548{ 549 int error; 550 udev_t ud; 551 dev_t dev; 552 553 error = SYSCTL_IN(req, &ud, sizeof (ud)); 554 if (error) 555 return (error); 556 if (ud == NOUDEV) 557 return(EINVAL); 558 dev = makedev(umajor(ud), uminor(ud)); 559 if (dev->si_name[0] == '\0') 560 error = ENOENT; 561 else 562 error = SYSCTL_OUT(req, dev->si_name, strlen(dev->si_name) + 1); 563 freedev(dev); 564 return (error); 565} 566 567SYSCTL_PROC(_kern, OID_AUTO, devname, CTLTYPE_OPAQUE|CTLFLAG_RW|CTLFLAG_ANYBODY, 568 NULL, 0, sysctl_devname, "", "devname(3) handler"); 569 570/* 571 * Set ready_for_devs; prior to this point, device creation is not allowed. 572 */ 573static void 574dev_set_ready(void *junk) 575{ 576 ready_for_devs = 1; 577} 578 579SYSINIT(dev_ready, SI_SUB_DEVFS, SI_ORDER_FIRST, dev_set_ready, NULL); 580