kern_conf.c revision 144385
1/*-
2 * Copyright (c) 1999-2002 Poul-Henning Kamp
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in the
12 *    documentation and/or other materials provided with the distribution.
13 *
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24 * SUCH DAMAGE.
25 */
26
27#include <sys/cdefs.h>
28__FBSDID("$FreeBSD: head/sys/kern/kern_conf.c 144385 2005-03-31 10:29:57Z phk $");
29
30#include <sys/param.h>
31#include <sys/kernel.h>
32#include <sys/systm.h>
33#include <sys/bio.h>
34#include <sys/lock.h>
35#include <sys/mutex.h>
36#include <sys/sysctl.h>
37#include <sys/module.h>
38#include <sys/malloc.h>
39#include <sys/conf.h>
40#include <sys/vnode.h>
41#include <sys/queue.h>
42#include <sys/poll.h>
43#include <sys/ctype.h>
44#include <sys/tty.h>
45#include <machine/stdarg.h>
46
47static MALLOC_DEFINE(M_DEVT, "cdev", "cdev storage");
48
49/* Built at compile time from sys/conf/majors */
50
51static struct mtx devmtx;
52static void freedev(struct cdev *dev);
53static void destroy_devl(struct cdev *dev);
54
55void
56dev_lock(void)
57{
58	if (!mtx_initialized(&devmtx))
59		mtx_init(&devmtx, "cdev", NULL, MTX_DEF);
60	mtx_lock(&devmtx);
61}
62
63void
64dev_unlock(void)
65{
66
67	mtx_unlock(&devmtx);
68}
69
70void
71dev_ref(struct cdev *dev)
72{
73
74	mtx_assert(&devmtx, MA_NOTOWNED);
75	mtx_lock(&devmtx);
76	dev->si_refcount++;
77	mtx_unlock(&devmtx);
78}
79
80void
81dev_refl(struct cdev *dev)
82{
83
84	mtx_assert(&devmtx, MA_OWNED);
85	dev->si_refcount++;
86}
87
88void
89dev_rel(struct cdev *dev)
90{
91	int flag = 0;
92
93	mtx_assert(&devmtx, MA_NOTOWNED);
94	dev_lock();
95	dev->si_refcount--;
96	KASSERT(dev->si_refcount >= 0,
97	    ("dev_rel(%s) gave negative count", devtoname(dev)));
98	if (dev->si_usecount == 0 &&
99	    (dev->si_flags & SI_CHEAPCLONE) && (dev->si_flags & SI_NAMED))
100	if (dev->si_devsw == NULL && dev->si_refcount == 0) {
101		LIST_REMOVE(dev, si_list);
102		flag = 1;
103	}
104	dev_unlock();
105	if (flag)
106		freedev(dev);
107}
108
109struct cdevsw *
110dev_refthread(struct cdev *dev)
111{
112	struct cdevsw *csw;
113
114	mtx_assert(&devmtx, MA_NOTOWNED);
115	dev_lock();
116	csw = dev->si_devsw;
117	if (csw != NULL)
118		dev->si_threadcount++;
119	dev_unlock();
120	return (csw);
121}
122
123void
124dev_relthread(struct cdev *dev)
125{
126
127	mtx_assert(&devmtx, MA_NOTOWNED);
128	dev_lock();
129	dev->si_threadcount--;
130	dev_unlock();
131}
132
133int
134nullop(void)
135{
136
137	return (0);
138}
139
140int
141eopnotsupp(void)
142{
143
144	return (EOPNOTSUPP);
145}
146
147static int
148enxio(void)
149{
150	return (ENXIO);
151}
152
153static int
154enodev(void)
155{
156	return (ENODEV);
157}
158
159/* Define a dead_cdevsw for use when devices leave unexpectedly. */
160
161#define dead_open	(d_open_t *)enxio
162#define dead_close	(d_close_t *)enxio
163#define dead_read	(d_read_t *)enxio
164#define dead_write	(d_write_t *)enxio
165#define dead_ioctl	(d_ioctl_t *)enxio
166#define dead_poll	(d_poll_t *)enodev
167#define dead_mmap	(d_mmap_t *)enodev
168
169static void
170dead_strategy(struct bio *bp)
171{
172
173	biofinish(bp, NULL, ENXIO);
174}
175
176#define dead_dump	(dumper_t *)enxio
177#define dead_kqfilter	(d_kqfilter_t *)enxio
178
179static struct cdevsw dead_cdevsw = {
180	.d_version =	D_VERSION,
181	.d_flags =	D_NEEDGIANT, /* XXX: does dead_strategy need this ? */
182	.d_open =	dead_open,
183	.d_close =	dead_close,
184	.d_read =	dead_read,
185	.d_write =	dead_write,
186	.d_ioctl =	dead_ioctl,
187	.d_poll =	dead_poll,
188	.d_mmap =	dead_mmap,
189	.d_strategy =	dead_strategy,
190	.d_name =	"dead",
191	.d_dump =	dead_dump,
192	.d_kqfilter =	dead_kqfilter
193};
194
195/* Default methods if driver does not specify method */
196
197#define null_open	(d_open_t *)nullop
198#define null_close	(d_close_t *)nullop
199#define no_read		(d_read_t *)enodev
200#define no_write	(d_write_t *)enodev
201#define no_ioctl	(d_ioctl_t *)enodev
202#define no_mmap		(d_mmap_t *)enodev
203#define no_kqfilter	(d_kqfilter_t *)enodev
204
205static void
206no_strategy(struct bio *bp)
207{
208
209	biofinish(bp, NULL, ENODEV);
210}
211
212static int
213no_poll(struct cdev *dev __unused, int events, struct thread *td __unused)
214{
215	/*
216	 * Return true for read/write.  If the user asked for something
217	 * special, return POLLNVAL, so that clients have a way of
218	 * determining reliably whether or not the extended
219	 * functionality is present without hard-coding knowledge
220	 * of specific filesystem implementations.
221	 * Stay in sync with vop_nopoll().
222	 */
223	if (events & ~POLLSTANDARD)
224		return (POLLNVAL);
225
226	return (events & (POLLIN | POLLOUT | POLLRDNORM | POLLWRNORM));
227}
228
229#define no_dump		(dumper_t *)enodev
230
231/*
232 * struct cdev * and u_dev_t primitives
233 */
234
235int
236minor(struct cdev *x)
237{
238	if (x == NULL)
239		return NODEV;
240	return(x->si_drv0 & MAXMINOR);
241}
242
243int
244dev2unit(struct cdev *x)
245{
246
247	if (x == NULL)
248		return NODEV;
249	return (minor2unit(minor(x)));
250}
251
252u_int
253minor2unit(u_int _minor)
254{
255
256	KASSERT((_minor & ~MAXMINOR) == 0, ("Illegal minor %x", _minor));
257	return ((_minor & 0xff) | ((_minor >> 8) & 0xffff00));
258}
259
260int
261unit2minor(int unit)
262{
263
264	KASSERT(unit <= 0xffffff, ("Invalid unit (%d) in unit2minor", unit));
265	return ((unit & 0xff) | ((unit << 8) & ~0xffff));
266}
267
268static struct cdev *
269allocdev(void)
270{
271	struct cdev *si;
272
273	si = malloc(sizeof *si, M_DEVT, M_USE_RESERVE | M_ZERO | M_WAITOK);
274	si->si_name = si->__si_namebuf;
275	LIST_INIT(&si->si_children);
276	LIST_INIT(&si->si_alist);
277	return (si);
278}
279
280static struct cdev *
281newdev(struct cdevsw *csw, int y, struct cdev *si)
282{
283	struct cdev *si2;
284	dev_t	udev;
285
286	mtx_assert(&devmtx, MA_OWNED);
287	udev = y;
288	LIST_FOREACH(si2, &csw->d_devs, si_list) {
289		if (si2->si_drv0 == udev) {
290			freedev(si);
291			return (si2);
292		}
293	}
294	si->si_drv0 = udev;
295	LIST_INSERT_HEAD(&csw->d_devs, si, si_list);
296	return (si);
297}
298
299static void
300freedev(struct cdev *dev)
301{
302
303	free(dev, M_DEVT);
304}
305
306int
307uminor(dev_t dev)
308{
309	return (dev & MAXMINOR);
310}
311
312int
313umajor(dev_t dev)
314{
315	return ((dev & ~MAXMINOR) >> 8);
316}
317
318static void
319fini_cdevsw(struct cdevsw *devsw)
320{
321
322	devsw->d_flags &= ~D_INIT;
323}
324
325static void
326prep_cdevsw(struct cdevsw *devsw)
327{
328
329	dev_lock();
330
331	if (devsw->d_version != D_VERSION_01) {
332		printf(
333		    "WARNING: Device driver \"%s\" has wrong version %s\n",
334		    devsw->d_name, "and is disabled.  Recompile KLD module.");
335		devsw->d_open = dead_open;
336		devsw->d_close = dead_close;
337		devsw->d_read = dead_read;
338		devsw->d_write = dead_write;
339		devsw->d_ioctl = dead_ioctl;
340		devsw->d_poll = dead_poll;
341		devsw->d_mmap = dead_mmap;
342		devsw->d_strategy = dead_strategy;
343		devsw->d_dump = dead_dump;
344		devsw->d_kqfilter = dead_kqfilter;
345	}
346
347	if (devsw->d_flags & D_TTY) {
348		if (devsw->d_ioctl == NULL)	devsw->d_ioctl = ttyioctl;
349		if (devsw->d_read == NULL)	devsw->d_read = ttyread;
350		if (devsw->d_write == NULL)	devsw->d_write = ttywrite;
351		if (devsw->d_kqfilter == NULL)	devsw->d_kqfilter = ttykqfilter;
352		if (devsw->d_poll == NULL)	devsw->d_poll = ttypoll;
353	}
354
355	if (devsw->d_open == NULL)	devsw->d_open = null_open;
356	if (devsw->d_close == NULL)	devsw->d_close = null_close;
357	if (devsw->d_read == NULL)	devsw->d_read = no_read;
358	if (devsw->d_write == NULL)	devsw->d_write = no_write;
359	if (devsw->d_ioctl == NULL)	devsw->d_ioctl = no_ioctl;
360	if (devsw->d_poll == NULL)	devsw->d_poll = no_poll;
361	if (devsw->d_mmap == NULL)	devsw->d_mmap = no_mmap;
362	if (devsw->d_strategy == NULL)	devsw->d_strategy = no_strategy;
363	if (devsw->d_dump == NULL)	devsw->d_dump = no_dump;
364	if (devsw->d_kqfilter == NULL)	devsw->d_kqfilter = no_kqfilter;
365
366	LIST_INIT(&devsw->d_devs);
367
368	devsw->d_flags |= D_INIT;
369
370	dev_unlock();
371}
372
373struct cdev *
374make_dev(struct cdevsw *devsw, int minornr, uid_t uid, gid_t gid, int mode, const char *fmt, ...)
375{
376	struct cdev *dev;
377	va_list ap;
378	int i;
379
380	KASSERT((minornr & ~MAXMINOR) == 0,
381	    ("Invalid minor (0x%x) in make_dev", minornr));
382
383	if (!(devsw->d_flags & D_INIT))
384		prep_cdevsw(devsw);
385	dev = allocdev();
386	dev_lock();
387	dev = newdev(devsw, minornr, dev);
388	if (dev->si_flags & SI_CHEAPCLONE &&
389	    dev->si_flags & SI_NAMED &&
390	    dev->si_devsw == devsw) {
391		/*
392		 * This is allowed as it removes races and generally
393		 * simplifies cloning devices.
394		 * XXX: still ??
395		 */
396		dev_unlock();
397		return (dev);
398	}
399	KASSERT(!(dev->si_flags & SI_NAMED),
400	    ("make_dev() by driver %s on pre-existing device (min=%x, name=%s)",
401	    devsw->d_name, minor(dev), devtoname(dev)));
402
403	va_start(ap, fmt);
404	i = vsnrprintf(dev->__si_namebuf, sizeof dev->__si_namebuf, 32, fmt, ap);
405	if (i > (sizeof dev->__si_namebuf - 1)) {
406		printf("WARNING: Device name truncated! (%s)\n",
407		    dev->__si_namebuf);
408	}
409	va_end(ap);
410
411	dev->si_devsw = devsw;
412	dev->si_flags |= SI_NAMED;
413	dev->si_uid = uid;
414	dev->si_gid = gid;
415	dev->si_mode = mode;
416
417	devfs_create(dev);
418	dev_unlock();
419	return (dev);
420}
421
422int
423dev_named(struct cdev *pdev, const char *name)
424{
425	struct cdev *cdev;
426
427	if (strcmp(devtoname(pdev), name) == 0)
428		return (1);
429	LIST_FOREACH(cdev, &pdev->si_children, si_siblings)
430		if (strcmp(devtoname(cdev), name) == 0)
431			return (1);
432	return (0);
433}
434
435void
436dev_depends(struct cdev *pdev, struct cdev *cdev)
437{
438
439	dev_lock();
440	cdev->si_parent = pdev;
441	cdev->si_flags |= SI_CHILD;
442	LIST_INSERT_HEAD(&pdev->si_children, cdev, si_siblings);
443	dev_unlock();
444}
445
446struct cdev *
447make_dev_alias(struct cdev *pdev, const char *fmt, ...)
448{
449	struct cdev *dev;
450	va_list ap;
451	int i;
452
453	dev = allocdev();
454	dev_lock();
455	dev->si_flags |= SI_ALIAS;
456	dev->si_flags |= SI_NAMED;
457	va_start(ap, fmt);
458	i = vsnrprintf(dev->__si_namebuf, sizeof dev->__si_namebuf, 32, fmt, ap);
459	if (i > (sizeof dev->__si_namebuf - 1)) {
460		printf("WARNING: Device name truncated! (%s)\n",
461		    dev->__si_namebuf);
462	}
463	va_end(ap);
464
465	devfs_create(dev);
466	dev_unlock();
467	dev_depends(pdev, dev);
468	return (dev);
469}
470
471static void
472destroy_devl(struct cdev *dev)
473{
474	struct cdevsw *csw;
475
476	mtx_assert(&devmtx, MA_OWNED);
477	KASSERT(dev->si_flags & SI_NAMED,
478	    ("WARNING: Driver mistake: destroy_dev on %d\n", minor(dev)));
479
480	devfs_destroy(dev);
481
482	/* Remove name marking */
483	dev->si_flags &= ~SI_NAMED;
484
485	/* If we are a child, remove us from the parents list */
486	if (dev->si_flags & SI_CHILD) {
487		LIST_REMOVE(dev, si_siblings);
488		dev->si_flags &= ~SI_CHILD;
489	}
490
491	/* Kill our children */
492	while (!LIST_EMPTY(&dev->si_children))
493		destroy_devl(LIST_FIRST(&dev->si_children));
494
495	/* Remove from clone list */
496	if (dev->si_flags & SI_CLONELIST) {
497		LIST_REMOVE(dev, si_clone);
498		dev->si_flags &= ~SI_CLONELIST;
499	}
500
501	csw = dev->si_devsw;
502	dev->si_devsw = NULL;	/* already NULL for SI_ALIAS */
503	while (csw != NULL && csw->d_purge != NULL && dev->si_threadcount) {
504		printf("Purging %lu threads from %s\n",
505		    dev->si_threadcount, devtoname(dev));
506		csw->d_purge(dev);
507		msleep(csw, &devmtx, PRIBIO, "devprg", hz/10);
508	}
509	if (csw != NULL && csw->d_purge != NULL)
510		printf("All threads purged from %s\n", devtoname(dev));
511
512	dev->si_drv1 = 0;
513	dev->si_drv2 = 0;
514	bzero(&dev->__si_u, sizeof(dev->__si_u));
515
516	if (!(dev->si_flags & SI_ALIAS)) {
517		/* Remove from cdevsw list */
518		LIST_REMOVE(dev, si_list);
519
520		/* If cdevsw has no struct cdev *'s, clean it */
521		if (LIST_EMPTY(&csw->d_devs))
522			fini_cdevsw(csw);
523	}
524	dev->si_flags &= ~SI_ALIAS;
525
526	if (dev->si_refcount > 0) {
527		LIST_INSERT_HEAD(&dead_cdevsw.d_devs, dev, si_list);
528	} else {
529		freedev(dev);
530	}
531}
532
533void
534destroy_dev(struct cdev *dev)
535{
536
537	dev_lock();
538	destroy_devl(dev);
539	dev_unlock();
540}
541
542const char *
543devtoname(struct cdev *dev)
544{
545	char *p;
546	struct cdevsw *csw;
547	int mynor;
548
549	if (dev->si_name[0] == '#' || dev->si_name[0] == '\0') {
550		p = dev->si_name;
551		csw = dev_refthread(dev);
552		if (csw != NULL) {
553			sprintf(p, "(%s)", csw->d_name);
554			dev_relthread(dev);
555		}
556		p += strlen(p);
557		mynor = minor(dev);
558		if (mynor < 0 || mynor > 255)
559			sprintf(p, "/%#x", (u_int)mynor);
560		else
561			sprintf(p, "/%d", mynor);
562	}
563	return (dev->si_name);
564}
565
566int
567dev_stdclone(char *name, char **namep, const char *stem, int *unit)
568{
569	int u, i;
570
571	i = strlen(stem);
572	if (bcmp(stem, name, i) != 0)
573		return (0);
574	if (!isdigit(name[i]))
575		return (0);
576	u = 0;
577	if (name[i] == '0' && isdigit(name[i+1]))
578		return (0);
579	while (isdigit(name[i])) {
580		u *= 10;
581		u += name[i++] - '0';
582	}
583	if (u > 0xffffff)
584		return (0);
585	*unit = u;
586	if (namep)
587		*namep = &name[i];
588	if (name[i])
589		return (2);
590	return (1);
591}
592
593/*
594 * Helper functions for cloning device drivers.
595 *
596 * The objective here is to make it unnecessary for the device drivers to
597 * use rman or similar to manage their unit number space.  Due to the way
598 * we do "on-demand" devices, using rman or other "private" methods
599 * will be very tricky to lock down properly once we lock down this file.
600 *
601 * Instead we give the drivers these routines which puts the struct cdev *'s
602 * that are to be managed on their own list, and gives the driver the ability
603 * to ask for the first free unit number or a given specified unit number.
604 *
605 * In addition these routines support paired devices (pty, nmdm and similar)
606 * by respecting a number of "flag" bits in the minor number.
607 *
608 */
609
610struct clonedevs {
611	LIST_HEAD(,cdev)	head;
612};
613
614void
615clone_setup(struct clonedevs **cdp)
616{
617
618	*cdp = malloc(sizeof **cdp, M_DEVBUF, M_WAITOK | M_ZERO);
619	LIST_INIT(&(*cdp)->head);
620}
621
622int
623clone_create(struct clonedevs **cdp, struct cdevsw *csw, int *up, struct cdev **dp, u_int extra)
624{
625	struct clonedevs *cd;
626	struct cdev *dev, *ndev, *dl, *de;
627	int unit, low, u;
628
629	KASSERT(*cdp != NULL,
630	    ("clone_setup() not called in driver \"%s\"", csw->d_name));
631	KASSERT(!(extra & CLONE_UNITMASK),
632	    ("Illegal extra bits (0x%x) in clone_create", extra));
633	KASSERT(*up <= CLONE_UNITMASK,
634	    ("Too high unit (0x%x) in clone_create", *up));
635
636	if (!(csw->d_flags & D_INIT))
637		prep_cdevsw(csw);
638
639	/*
640	 * Search the list for a lot of things in one go:
641	 *   A preexisting match is returned immediately.
642	 *   The lowest free unit number if we are passed -1, and the place
643	 *	 in the list where we should insert that new element.
644	 *   The place to insert a specified unit number, if applicable
645	 *       the end of the list.
646	 */
647	unit = *up;
648	ndev = allocdev();
649	dev_lock();
650	low = extra;
651	de = dl = NULL;
652	cd = *cdp;
653	LIST_FOREACH(dev, &cd->head, si_clone) {
654		KASSERT(dev->si_flags & SI_CLONELIST,
655		    ("Dev %p(%s) should be on clonelist", dev, dev->si_name));
656		u = dev2unit(dev);
657		if (u == (unit | extra)) {
658			*dp = dev;
659			freedev(ndev);
660			dev_unlock();
661			return (0);
662		}
663		if (unit == -1 && u == low) {
664			low++;
665			de = dev;
666			continue;
667		}
668		if (u > (unit | extra)) {
669			dl = dev;
670			break;
671		}
672	}
673	if (unit == -1)
674		unit = low & CLONE_UNITMASK;
675	dev = newdev(csw, unit2minor(unit | extra), ndev);
676	if (dev->si_flags & SI_CLONELIST) {
677		printf("dev %p (%s) is on clonelist\n", dev, dev->si_name);
678		printf("unit=%d\n", unit);
679		LIST_FOREACH(dev, &cd->head, si_clone) {
680			printf("\t%p %s\n", dev, dev->si_name);
681		}
682		panic("foo");
683	}
684	KASSERT(!(dev->si_flags & SI_CLONELIST),
685	    ("Dev %p(%s) should not be on clonelist", dev, dev->si_name));
686	if (dl != NULL)
687		LIST_INSERT_BEFORE(dl, dev, si_clone);
688	else if (de != NULL)
689		LIST_INSERT_AFTER(de, dev, si_clone);
690	else
691		LIST_INSERT_HEAD(&cd->head, dev, si_clone);
692	dev->si_flags |= SI_CLONELIST;
693	*up = unit;
694	dev_unlock();
695	return (1);
696}
697
698/*
699 * Kill everything still on the list.  The driver should already have
700 * disposed of any softc hung of the struct cdev *'s at this time.
701 */
702void
703clone_cleanup(struct clonedevs **cdp)
704{
705	struct cdev *dev, *tdev;
706	struct clonedevs *cd;
707
708	cd = *cdp;
709	if (cd == NULL)
710		return;
711	dev_lock();
712	LIST_FOREACH_SAFE(dev, &cd->head, si_clone, tdev) {
713		KASSERT(dev->si_flags & SI_CLONELIST,
714		    ("Dev %p(%s) should be on clonelist", dev, dev->si_name));
715		KASSERT(dev->si_flags & SI_NAMED,
716		    ("Driver has goofed in cloning underways udev %x", dev->si_drv0));
717		destroy_devl(dev);
718	}
719	dev_unlock();
720	free(cd, M_DEVBUF);
721	*cdp = NULL;
722}
723