vm_machdep.c revision 122780
136865Sdfr/*-
236865Sdfr * Copyright (c) 1982, 1986 The Regents of the University of California.
336865Sdfr * Copyright (c) 1989, 1990 William Jolitz
436865Sdfr * Copyright (c) 1994 John Dyson
536865Sdfr * All rights reserved.
636865Sdfr *
736865Sdfr * This code is derived from software contributed to Berkeley by
836865Sdfr * the Systems Programming Group of the University of Utah Computer
936865Sdfr * Science Department, and William Jolitz.
1036865Sdfr *
1136865Sdfr * Redistribution and use in source and binary forms, with or without
1236865Sdfr * modification, are permitted provided that the following conditions
1336865Sdfr * are met:
1436865Sdfr * 1. Redistributions of source code must retain the above copyright
1536865Sdfr *    notice, this list of conditions and the following disclaimer.
1636865Sdfr * 2. Redistributions in binary form must reproduce the above copyright
1736865Sdfr *    notice, this list of conditions and the following disclaimer in the
1836865Sdfr *    documentation and/or other materials provided with the distribution.
1936865Sdfr * 3. All advertising materials mentioning features or use of this software
2036865Sdfr *    must display the following acknowledgement:
2136865Sdfr *	This product includes software developed by the University of
2236865Sdfr *	California, Berkeley and its contributors.
2336865Sdfr * 4. Neither the name of the University nor the names of its contributors
2436865Sdfr *    may be used to endorse or promote products derived from this software
2536865Sdfr *    without specific prior written permission.
2636865Sdfr *
2736865Sdfr * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
2836865Sdfr * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
2936865Sdfr * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
3036865Sdfr * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
3136865Sdfr * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
3236865Sdfr * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
3336865Sdfr * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
3436865Sdfr * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
3536865Sdfr * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
3636865Sdfr * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
3736865Sdfr * SUCH DAMAGE.
3836865Sdfr *
3936865Sdfr *	from: @(#)vm_machdep.c	7.3 (Berkeley) 5/13/91
4036865Sdfr *	Utah $Hdr: vm_machdep.c 1.16.1.1 89/06/23$
4150477Speter * $FreeBSD: head/sys/powerpc/aim/vm_machdep.c 122780 2003-11-16 06:11:26Z alc $
4236865Sdfr */
4336865Sdfr/*
4436865Sdfr * Copyright (c) 1994, 1995, 1996 Carnegie-Mellon University.
4536865Sdfr * All rights reserved.
4636865Sdfr *
4736865Sdfr * Author: Chris G. Demetriou
4836865Sdfr *
4936865Sdfr * Permission to use, copy, modify and distribute this software and
5036865Sdfr * its documentation is hereby granted, provided that both the copyright
5136865Sdfr * notice and this permission notice appear in all copies of the
5236865Sdfr * software, derivative works or modified versions, and any portions
5336865Sdfr * thereof, and that both notices appear in supporting documentation.
5436865Sdfr *
5536865Sdfr * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
5636865Sdfr * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
5736865Sdfr * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
5836865Sdfr *
5936865Sdfr * Carnegie Mellon requests users of this software to return to
6036865Sdfr *
6136865Sdfr *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
6236865Sdfr *  School of Computer Science
6336865Sdfr *  Carnegie Mellon University
6436865Sdfr *  Pittsburgh PA 15213-3890
6536865Sdfr *
6636865Sdfr * any improvements or extensions that they make and grant Carnegie the
6736865Sdfr * rights to redistribute these changes.
6836865Sdfr */
6936865Sdfr
70118239Speter#include "opt_kstack_pages.h"
71118239Speter
7236865Sdfr#include <sys/param.h>
7336865Sdfr#include <sys/systm.h>
7436865Sdfr#include <sys/proc.h>
7536865Sdfr#include <sys/malloc.h>
7660041Sphk#include <sys/bio.h>
7736865Sdfr#include <sys/buf.h>
7885201Smp#include <sys/ktr.h>
7985201Smp#include <sys/lock.h>
8067365Sjhb#include <sys/mutex.h>
8136865Sdfr#include <sys/vnode.h>
8236865Sdfr#include <sys/vmmeter.h>
8336865Sdfr#include <sys/kernel.h>
84119563Salc#include <sys/mbuf.h>
85122780Salc#include <sys/sf_buf.h>
8636865Sdfr#include <sys/sysctl.h>
8754207Speter#include <sys/unistd.h>
8836865Sdfr
8936865Sdfr#include <machine/clock.h>
9036865Sdfr#include <machine/cpu.h>
9141499Sdfr#include <machine/fpu.h>
9297397Sbenno#include <machine/frame.h>
9336865Sdfr#include <machine/md_var.h>
9436865Sdfr
9578342Sbenno#include <dev/ofw/openfirm.h>
9678342Sbenno
9736865Sdfr#include <vm/vm.h>
9836865Sdfr#include <vm/vm_param.h>
9936865Sdfr#include <vm/vm_kern.h>
10036865Sdfr#include <vm/vm_page.h>
10136865Sdfr#include <vm/vm_map.h>
10236865Sdfr#include <vm/vm_extern.h>
10336865Sdfr
10436865Sdfr#include <sys/user.h>
10536865Sdfr
106119563Salcstatic void	sf_buf_init(void *arg);
107119563SalcSYSINIT(sock_sf, SI_SUB_MBUF, SI_ORDER_ANY, sf_buf_init, NULL)
108119563Salc
10936865Sdfr/*
110119563Salc * Expanded sf_freelist head. Really an SLIST_HEAD() in disguise, with the
111119563Salc * sf_freelist head with the sf_lock mutex.
112119563Salc */
113119563Salcstatic struct {
114119563Salc	SLIST_HEAD(, sf_buf) sf_head;
115119563Salc	struct mtx sf_lock;
116119563Salc} sf_freelist;
117119563Salc
118119563Salcstatic u_int	sf_buf_alloc_want;
119119563Salc
120119563Salc/*
12136865Sdfr * Finish a fork operation, with process p2 nearly set up.
12236865Sdfr * Copy and update the pcb, set up the stack so that the child
12336865Sdfr * ready to run and return to user mode.
12436865Sdfr */
12536865Sdfrvoid
12690361Sjuliancpu_fork(struct thread *td1, struct proc *p2, struct thread *td2, int flags)
12736865Sdfr{
12884977Sbenno	struct	proc *p1;
12984977Sbenno	struct	trapframe *tf;
13084977Sbenno	struct	callframe *cf;
13190643Sbenno	struct	pcb *pcb;
13284977Sbenno
13391467Sbenno	KASSERT(td1 == curthread || td1 == &thread0,
13490643Sbenno	    ("cpu_fork: p1 not curproc and not proc0"));
13584977Sbenno	CTR3(KTR_PROC, "cpu_fork: called td1=%08x p2=%08x flags=%x", (u_int)td1, (u_int)p2, flags);
13684977Sbenno
13784977Sbenno	if ((flags & RFPROC) == 0)
13884977Sbenno		return;
13984977Sbenno
14084977Sbenno	p1 = td1->td_proc;
14184977Sbenno
14291467Sbenno	pcb = (struct pcb *)((td2->td_kstack + KSTACK_PAGES * PAGE_SIZE -
14391467Sbenno	    sizeof(struct pcb)) & ~0x2fU);
14490643Sbenno	td2->td_pcb = pcb;
14584977Sbenno
14690643Sbenno	/* Copy the pcb */
14790643Sbenno	bcopy(td1->td_pcb, pcb, sizeof(struct pcb));
14884977Sbenno
14984977Sbenno	/*
15090643Sbenno	 * Create a fresh stack for the new process.
15184977Sbenno	 * Copy the trap frame for the return to user mode as if from a
15284977Sbenno	 * syscall.  This copies most of the user mode register values.
15384977Sbenno	 */
15490643Sbenno	tf = (struct trapframe *)pcb - 1;
15590643Sbenno	bcopy(td1->td_frame, tf, sizeof(*tf));
15684977Sbenno
15797397Sbenno	/* Set up trap frame. */
15897397Sbenno	tf->fixreg[FIRSTARG] = 0;
15997397Sbenno	tf->fixreg[FIRSTARG + 1] = 0;
16097397Sbenno	tf->cr &= ~0x10000000;
16190643Sbenno
16290643Sbenno	td2->td_frame = tf;
16390643Sbenno
16490643Sbenno	cf = (struct callframe *)tf - 1;
16591467Sbenno	cf->cf_func = (register_t)fork_return;
16691467Sbenno	cf->cf_arg0 = (register_t)td2;
16791467Sbenno	cf->cf_arg1 = (register_t)tf;
16884977Sbenno
16991467Sbenno	pcb->pcb_sp = (register_t)cf;
17091467Sbenno	pcb->pcb_lr = (register_t)fork_trampoline;
171105611Sgrehan	pcb->pcb_usr = kernel_pmap->pm_sr[USER_SR];
17284977Sbenno
17390643Sbenno	/*
17490643Sbenno 	 * Now cpu_switch() can schedule the new process.
17590643Sbenno	 */
17636865Sdfr}
17736865Sdfr
17836865Sdfr/*
17936865Sdfr * Intercept the return address from a freshly forked process that has NOT
18036865Sdfr * been scheduled yet.
18136865Sdfr *
18236865Sdfr * This is needed to make kernel threads stay in kernel mode.
18336865Sdfr */
18436865Sdfrvoid
18583682Smpcpu_set_fork_handler(td, func, arg)
18683682Smp	struct thread *td;
18792842Salfred	void (*func)(void *);
18848391Speter	void *arg;
18936865Sdfr{
19084977Sbenno	struct	callframe *cf;
19184977Sbenno
19284977Sbenno	CTR3(KTR_PROC, "cpu_set_fork_handler: called with td=%08x func=%08x arg=%08x",
19384977Sbenno	    (u_int)td, (u_int)func, (u_int)arg);
19484977Sbenno
19591467Sbenno	cf = (struct callframe *)td->td_pcb->pcb_sp;
19684977Sbenno
19791467Sbenno	cf->cf_func = (register_t)func;
19891467Sbenno	cf->cf_arg0 = (register_t)arg;
19936865Sdfr}
20036865Sdfr
/*
 * cpu_exit is called as the last action during exit.
 *
 * This implementation is an empty stub: it performs no machine-dependent
 * work for the exiting thread td.
 */
void
cpu_exit(struct thread *td)
{
}
21336865Sdfr
/*
 * Machine-dependent scheduler exit hook for thread td.
 * Empty stub: nothing is done here.
 */
void
cpu_sched_exit(struct thread *td)
{
}
21998765Sjake
/*
 * Temporary helper: hand the CPU from thread old to thread new through
 * cpu_switch(), and panic if control ever comes back to this point.
 */
void
cpu_throw(struct thread *old, struct thread *new)
{
	cpu_switch(old, new);

	/* Reaching this line means the switch above returned. */
	panic("cpu_throw() didn't");
}
22836865Sdfr
/*
 * Reset back to firmware by calling OF_exit().
 */
void
cpu_reset(void)
{
	OF_exit();
}
23736865Sdfr
23836865Sdfr/*
239119563Salc * Allocate a pool of sf_bufs (sendfile(2) or "super-fast" if you prefer. :-))
240119563Salc */
241119563Salcstatic void
242119563Salcsf_buf_init(void *arg)
243119563Salc{
244119563Salc	struct sf_buf *sf_bufs;
245119563Salc	vm_offset_t sf_base;
246119563Salc	int i;
247119563Salc
248119563Salc	mtx_init(&sf_freelist.sf_lock, "sf_bufs list lock", NULL, MTX_DEF);
249119563Salc	mtx_lock(&sf_freelist.sf_lock);
250119563Salc	SLIST_INIT(&sf_freelist.sf_head);
251119563Salc	sf_base = kmem_alloc_nofault(kernel_map, nsfbufs * PAGE_SIZE);
252119563Salc	sf_bufs = malloc(nsfbufs * sizeof(struct sf_buf), M_TEMP,
253119563Salc	    M_NOWAIT | M_ZERO);
254119563Salc	for (i = 0; i < nsfbufs; i++) {
255119563Salc		sf_bufs[i].kva = sf_base + i * PAGE_SIZE;
256119563Salc		SLIST_INSERT_HEAD(&sf_freelist.sf_head, &sf_bufs[i], free_list);
257119563Salc	}
258119563Salc	sf_buf_alloc_want = 0;
259119563Salc	mtx_unlock(&sf_freelist.sf_lock);
260119563Salc}
261119563Salc
262119563Salc/*
263119563Salc * Get an sf_buf from the freelist. Will block if none are available.
264119563Salc */
265119563Salcstruct sf_buf *
266119563Salcsf_buf_alloc(struct vm_page *m)
267119563Salc{
268119563Salc	struct sf_buf *sf;
269119563Salc	int error;
270119563Salc
271119563Salc	mtx_lock(&sf_freelist.sf_lock);
272119563Salc	while ((sf = SLIST_FIRST(&sf_freelist.sf_head)) == NULL) {
273119563Salc		sf_buf_alloc_want++;
274119563Salc		error = msleep(&sf_freelist, &sf_freelist.sf_lock, PVM|PCATCH,
275119563Salc		    "sfbufa", 0);
276119563Salc		sf_buf_alloc_want--;
277119563Salc
278119563Salc		/*
279119563Salc		 * If we got a signal, don't risk going back to sleep.
280119563Salc		 */
281119563Salc		if (error)
282119563Salc			break;
283119563Salc	}
284119563Salc	if (sf != NULL) {
285119563Salc		SLIST_REMOVE_HEAD(&sf_freelist.sf_head, free_list);
286119563Salc		sf->m = m;
287119563Salc		pmap_qenter(sf->kva, &sf->m, 1);
288119563Salc	}
289119563Salc	mtx_unlock(&sf_freelist.sf_lock);
290119563Salc	return (sf);
291119563Salc}
292119563Salc
293119563Salc/*
294119563Salc * Detatch mapped page and release resources back to the system.
295119563Salc */
296119563Salcvoid
297119563Salcsf_buf_free(void *addr, void *args)
298119563Salc{
299119563Salc	struct sf_buf *sf;
300119563Salc	struct vm_page *m;
301119563Salc
302119563Salc	sf = args;
303119563Salc	pmap_qremove((vm_offset_t)addr, 1);
304119563Salc	m = sf->m;
305119563Salc	vm_page_lock_queues();
306119563Salc	vm_page_unwire(m, 0);
307119563Salc	/*
308119563Salc	 * Check for the object going away on us. This can
309119563Salc	 * happen since we don't hold a reference to it.
310119563Salc	 * If so, we're responsible for freeing the page.
311119563Salc	 */
312119563Salc	if (m->wire_count == 0 && m->object == NULL)
313119563Salc		vm_page_free(m);
314119563Salc	vm_page_unlock_queues();
315119563Salc	sf->m = NULL;
316119563Salc	mtx_lock(&sf_freelist.sf_lock);
317119563Salc	SLIST_INSERT_HEAD(&sf_freelist.sf_head, sf, free_list);
318119563Salc	if (sf_buf_alloc_want > 0)
319119563Salc		wakeup_one(&sf_freelist);
320119563Salc	mtx_unlock(&sf_freelist.sf_lock);
321119563Salc}
322119563Salc
/*
 * Software interrupt handler for queued VM system processing.
 *
 * The only work it would do (the busdma hook) is compiled out with #if 0,
 * so the handler currently does nothing.  The dummy argument is unused.
 */
void
swi_vm(void *dummy)
{
#if 0 /* XXX: Don't have busdma stuff yet */
	if (busdma_swi_pending != 0)
		busdma_swi();
#endif
}
33436865Sdfr
33536865Sdfr/*
33636865Sdfr * Tell whether this address is in some physical memory region.
33736865Sdfr * Currently used by the kernel coredump code in order to avoid
33836865Sdfr * dumping the ``ISA memory hole'' which could cause indefinite hangs,
33936865Sdfr * or other unpredictable behaviour.
34036865Sdfr */
34136865Sdfr
34236865Sdfr
34336865Sdfrint
34436865Sdfris_physical_memory(addr)
34536865Sdfr	vm_offset_t addr;
34636865Sdfr{
34736865Sdfr	/*
34836865Sdfr	 * stuff other tests for known memory-mapped devices (PCI?)
34936865Sdfr	 * here
35036865Sdfr	 */
35136865Sdfr
35236865Sdfr	return 1;
35336865Sdfr}
35499659Sbenno
/*
 * KSE functions
 */

/*
 * Machine-dependent hook for a thread that is exiting.
 * Empty stub: no work is done for td here.
 */
void
cpu_thread_exit(struct thread *td)
{
}
36299659Sbenno
/*
 * Machine-dependent thread clean-up hook.
 * Empty stub: no work is done for td here.
 */
void
cpu_thread_clean(struct thread *td)
{
}
367107180Smux
/*
 * Machine-dependent thread set-up hook.
 * Empty stub: no work is done for td here.
 */
void
cpu_thread_setup(struct thread *td)
{
}
37299659Sbenno
/*
 * Machine-dependent hook for swapping a thread in.
 * Empty stub: no work is done for td here.
 */
void
cpu_thread_swapin(struct thread *td)
{
}
37799659Sbenno
/*
 * Machine-dependent hook for swapping a thread out.
 * Empty stub: no work is done for td here.
 */
void
cpu_thread_swapout(struct thread *td)
{
}
382119004Smarcel
/*
 * Machine-dependent upcall set-up taking a thread td and a second
 * thread td0.
 * Empty stub: neither thread is touched here.
 */
void
cpu_set_upcall(struct thread *td, struct thread *td0)
{
}
38799659Sbenno
/*
 * Machine-dependent upcall set-up taking a thread td and a KSE upcall ku.
 * Empty stub: neither argument is touched here.
 */
void
cpu_set_upcall_kse(struct thread *td, struct kse_upcall *ku)
{
}
392