ia32_syscall.c revision 114987
1114987Speter/*- 2114987Speter * Copyright (C) 1994, David Greenman 3114987Speter * Copyright (c) 1990, 1993 4114987Speter * The Regents of the University of California. All rights reserved. 5114987Speter * 6114987Speter * This code is derived from software contributed to Berkeley by 7114987Speter * the University of Utah, and William Jolitz. 8114987Speter * 9114987Speter * Redistribution and use in source and binary forms, with or without 10114987Speter * modification, are permitted provided that the following conditions 11114987Speter * are met: 12114987Speter * 1. Redistributions of source code must retain the above copyright 13114987Speter * notice, this list of conditions and the following disclaimer. 14114987Speter * 2. Redistributions in binary form must reproduce the above copyright 15114987Speter * notice, this list of conditions and the following disclaimer in the 16114987Speter * documentation and/or other materials provided with the distribution. 17114987Speter * 3. All advertising materials mentioning features or use of this software 18114987Speter * must display the following acknowledgement: 19114987Speter * This product includes software developed by the University of 20114987Speter * California, Berkeley and its contributors. 21114987Speter * 4. Neither the name of the University nor the names of its contributors 22114987Speter * may be used to endorse or promote products derived from this software 23114987Speter * without specific prior written permission. 24114987Speter * 25114987Speter * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 26114987Speter * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 27114987Speter * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 28114987Speter * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 29114987Speter * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 30114987Speter * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 31114987Speter * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 32114987Speter * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 33114987Speter * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 34114987Speter * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 35114987Speter * SUCH DAMAGE. 36114987Speter * 37114987Speter * $FreeBSD: head/sys/amd64/ia32/ia32_syscall.c 114987 2003-05-14 04:10:49Z peter $ 38114987Speter */ 39114987Speter 40114987Speter/* 41114987Speter * 386 Trap and System call handling 42114987Speter */ 43114987Speter 44114987Speter#include "opt_clock.h" 45114987Speter#include "opt_cpu.h" 46114987Speter#include "opt_isa.h" 47114987Speter#include "opt_ktrace.h" 48114987Speter 49114987Speter#include <sys/param.h> 50114987Speter#include <sys/bus.h> 51114987Speter#include <sys/systm.h> 52114987Speter#include <sys/proc.h> 53114987Speter#include <sys/pioctl.h> 54114987Speter#include <sys/kernel.h> 55114987Speter#include <sys/ktr.h> 56114987Speter#include <sys/lock.h> 57114987Speter#include <sys/mutex.h> 58114987Speter#include <sys/resourcevar.h> 59114987Speter#include <sys/signalvar.h> 60114987Speter#include <sys/syscall.h> 61114987Speter#include <sys/sysctl.h> 62114987Speter#include <sys/sysent.h> 63114987Speter#include <sys/uio.h> 64114987Speter#include <sys/vmmeter.h> 65114987Speter#ifdef KTRACE 66114987Speter#include <sys/ktrace.h> 67114987Speter#endif 68114987Speter 69114987Speter#include <vm/vm.h> 70114987Speter#include <vm/vm_param.h> 71114987Speter#include <vm/pmap.h> 72114987Speter#include <vm/vm_kern.h> 73114987Speter#include <vm/vm_map.h> 74114987Speter#include <vm/vm_page.h> 75114987Speter#include <vm/vm_extern.h> 76114987Speter 77114987Speter#include <machine/cpu.h> 78114987Speter#include <machine/md_var.h> 79114987Speter 80114987Speter#include <amd64/isa/icu.h> 81114987Speter#include <amd64/isa/intr_machdep.h> 82114987Speter 83114987Speter#define IDTVEC(name) __CONCAT(X,name) 84114987Speter 85114987Speterextern inthand_t IDTVEC(int0x80_syscall), IDTVEC(rsvd); 86114987Speter 87114987Spetervoid ia32_syscall(struct trapframe frame); /* Called from asm code */ 88114987Speter 89114987Spetervoid 90114987Speteria32_syscall(struct trapframe frame) 91114987Speter{ 92114987Speter caddr_t params; 93114987Speter int i; 94114987Speter struct sysent *callp; 95114987Speter struct thread *td = curthread; 96114987Speter struct proc *p = td->td_proc; 97114987Speter register_t orig_tf_rflags; 98114987Speter u_int sticks; 99114987Speter int error; 100114987Speter int narg; 101114987Speter u_int32_t args[8]; 102114987Speter u_int64_t args64[8]; 103114987Speter u_int code; 104114987Speter 105114987Speter /* 106114987Speter * note: PCPU_LAZY_INC() can only be used if we can afford 107114987Speter * occassional inaccuracy in the count. 108114987Speter */ 109114987Speter cnt.v_syscall++; 110114987Speter 111114987Speter sticks = td->td_sticks; 112114987Speter td->td_frame = &frame; 113114987Speter if (td->td_ucred != p->p_ucred) 114114987Speter cred_update_thread(td); 115114987Speter params = (caddr_t)frame.tf_rsp + sizeof(u_int32_t); 116114987Speter code = frame.tf_rax; 117114987Speter orig_tf_rflags = frame.tf_rflags; 118114987Speter 119114987Speter if (p->p_sysent->sv_prepsyscall) { 120114987Speter /* 121114987Speter * The prep code is MP aware. 122114987Speter */ 123114987Speter (*p->p_sysent->sv_prepsyscall)(&frame, args, &code, ¶ms); 124114987Speter } else { 125114987Speter /* 126114987Speter * Need to check if this is a 32 bit or 64 bit syscall. 127114987Speter * fuword is MP aware. 128114987Speter */ 129114987Speter if (code == SYS_syscall) { 130114987Speter /* 131114987Speter * Code is first argument, followed by actual args. 132114987Speter */ 133114987Speter code = fuword32(params); 134114987Speter params += sizeof(int); 135114987Speter } else if (code == SYS___syscall) { 136114987Speter /* 137114987Speter * Like syscall, but code is a quad, so as to maintain 138114987Speter * quad alignment for the rest of the arguments. 139114987Speter * We use a 32-bit fetch in case params is not 140114987Speter * aligned. 141114987Speter */ 142114987Speter code = fuword32(params); 143114987Speter params += sizeof(quad_t); 144114987Speter } 145114987Speter } 146114987Speter 147114987Speter if (p->p_sysent->sv_mask) 148114987Speter code &= p->p_sysent->sv_mask; 149114987Speter 150114987Speter if (code >= p->p_sysent->sv_size) 151114987Speter callp = &p->p_sysent->sv_table[0]; 152114987Speter else 153114987Speter callp = &p->p_sysent->sv_table[code]; 154114987Speter 155114987Speter narg = callp->sy_narg & SYF_ARGMASK; 156114987Speter 157114987Speter /* 158114987Speter * copyin and the ktrsyscall()/ktrsysret() code is MP-aware 159114987Speter */ 160114987Speter if (params != NULL && narg != 0) 161114987Speter error = copyin(params, (caddr_t)args, 162114987Speter (u_int)(narg * sizeof(int))); 163114987Speter else 164114987Speter error = 0; 165114987Speter 166114987Speter for (i = 0; i < narg; i++) 167114987Speter args64[i] = args[i]; 168114987Speter 169114987Speter#ifdef KTRACE 170114987Speter if (KTRPOINT(td, KTR_SYSCALL)) 171114987Speter ktrsyscall(code, narg, args64); 172114987Speter#endif 173114987Speter /* 174114987Speter * Try to run the syscall without Giant if the syscall 175114987Speter * is MP safe. 176114987Speter */ 177114987Speter if ((callp->sy_narg & SYF_MPSAFE) == 0) 178114987Speter mtx_lock(&Giant); 179114987Speter 180114987Speter if (error == 0) { 181114987Speter td->td_retval[0] = 0; 182114987Speter td->td_retval[1] = frame.tf_rdx; 183114987Speter 184114987Speter STOPEVENT(p, S_SCE, narg); 185114987Speter 186114987Speter error = (*callp->sy_call)(td, args64); 187114987Speter } 188114987Speter 189114987Speter switch (error) { 190114987Speter case 0: 191114987Speter frame.tf_rax = td->td_retval[0]; 192114987Speter frame.tf_rdx = td->td_retval[1]; 193114987Speter frame.tf_rflags &= ~PSL_C; 194114987Speter break; 195114987Speter 196114987Speter case ERESTART: 197114987Speter /* 198114987Speter * Reconstruct pc, assuming lcall $X,y is 7 bytes, 199114987Speter * int 0x80 is 2 bytes. We saved this in tf_err. 200114987Speter */ 201114987Speter frame.tf_rip -= frame.tf_err; 202114987Speter break; 203114987Speter 204114987Speter case EJUSTRETURN: 205114987Speter break; 206114987Speter 207114987Speter default: 208114987Speter if (p->p_sysent->sv_errsize) { 209114987Speter if (error >= p->p_sysent->sv_errsize) 210114987Speter error = -1; /* XXX */ 211114987Speter else 212114987Speter error = p->p_sysent->sv_errtbl[error]; 213114987Speter } 214114987Speter frame.tf_rax = error; 215114987Speter frame.tf_rflags |= PSL_C; 216114987Speter break; 217114987Speter } 218114987Speter 219114987Speter /* 220114987Speter * Release Giant if we previously set it. 221114987Speter */ 222114987Speter if ((callp->sy_narg & SYF_MPSAFE) == 0) 223114987Speter mtx_unlock(&Giant); 224114987Speter 225114987Speter /* 226114987Speter * Traced syscall. 227114987Speter */ 228114987Speter if (orig_tf_rflags & PSL_T) { 229114987Speter frame.tf_rflags &= ~PSL_T; 230114987Speter trapsignal(td, SIGTRAP, 0); 231114987Speter } 232114987Speter 233114987Speter /* 234114987Speter * Handle reschedule and other end-of-syscall issues 235114987Speter */ 236114987Speter userret(td, &frame, sticks); 237114987Speter 238114987Speter#ifdef KTRACE 239114987Speter if (KTRPOINT(td, KTR_SYSRET)) 240114987Speter ktrsysret(code, error, td->td_retval[0]); 241114987Speter#endif 242114987Speter 243114987Speter /* 244114987Speter * This works because errno is findable through the 245114987Speter * register set. If we ever support an emulation where this 246114987Speter * is not the case, this code will need to be revisited. 247114987Speter */ 248114987Speter STOPEVENT(p, S_SCX, code); 249114987Speter 250114987Speter#ifdef DIAGNOSTIC 251114987Speter cred_free_thread(td); 252114987Speter#endif 253114987Speter WITNESS_WARN(WARN_PANIC, NULL, "System call %s returning", 254114987Speter (code >= 0 && code < SYS_MAXSYSCALL) ? syscallnames[code] : "???"); 255114987Speter mtx_assert(&sched_lock, MA_NOTOWNED); 256114987Speter mtx_assert(&Giant, MA_NOTOWNED); 257114987Speter} 258114987Speter 259114987Speter 260114987Speterstatic void 261114987Speteria32_syscall_enable(void *dummy) 262114987Speter{ 263114987Speter 264114987Speter setidt(0x80, &IDTVEC(int0x80_syscall), SDT_SYSIGT, SEL_UPL, 0); 265114987Speter} 266114987Speter 267114987Speterstatic void 268114987Speteria32_syscall_disable(void *dummy) 269114987Speter{ 270114987Speter 271114987Speter setidt(0x80, &IDTVEC(rsvd), SDT_SYSIGT, SEL_KPL, 0); 272114987Speter} 273114987Speter 274114987SpeterSYSINIT(ia32_syscall, SI_SUB_EXEC, SI_ORDER_ANY, ia32_syscall_enable, NULL); 275114987SpeterSYSUNINIT(ia32_syscall, SI_SUB_EXEC, SI_ORDER_ANY, ia32_syscall_disable, NULL); 276