1/*-
2 * Copyright (c) 1993, David Greenman
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in the
12 *    documentation and/or other materials provided with the distribution.
13 *
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24 * SUCH DAMAGE.
25 */
26
27#include <sys/cdefs.h>
28__FBSDID("$FreeBSD$");
29
30#include <sys/param.h>
31#include <sys/exec.h>
32#include <sys/imgact.h>
33#include <sys/imgact_aout.h>
34#include <sys/kernel.h>
35#include <sys/limits.h>
36#include <sys/lock.h>
37#include <sys/malloc.h>
38#include <sys/mutex.h>
39#include <sys/proc.h>
40#include <sys/racct.h>
41#include <sys/resourcevar.h>
42#include <sys/signalvar.h>
43#include <sys/syscall.h>
44#include <sys/sysent.h>
45#include <sys/systm.h>
46#include <sys/vnode.h>
47
48#include <machine/frame.h>
49#include <machine/md_var.h>
50
51#include <vm/vm.h>
52#include <vm/pmap.h>
53#include <vm/vm_map.h>
54#include <vm/vm_object.h>
55#include <vm/vm_param.h>
56
57#ifdef __amd64__
58#include <compat/freebsd32/freebsd32_signal.h>
59#include <compat/freebsd32/freebsd32_util.h>
60#include <compat/freebsd32/freebsd32_proto.h>
61#include <compat/freebsd32/freebsd32_syscall.h>
62#include <compat/ia32/ia32_signal.h>
63#endif
64
65static int	exec_aout_imgact(struct image_params *imgp);
66static int	aout_fixup(register_t **stack_base, struct image_params *imgp);
67
68#if defined(__i386__)
69struct sysentvec aout_sysvec = {
70	.sv_size	= SYS_MAXSYSCALL,
71	.sv_table	= sysent,
72	.sv_mask	= 0,
73	.sv_sigsize	= 0,
74	.sv_sigtbl	= NULL,
75	.sv_errsize	= 0,
76	.sv_errtbl	= NULL,
77	.sv_transtrap	= NULL,
78	.sv_fixup	= aout_fixup,
79	.sv_sendsig	= sendsig,
80	.sv_sigcode	= sigcode,
81	.sv_szsigcode	= &szsigcode,
82	.sv_prepsyscall	= NULL,
83	.sv_name	= "FreeBSD a.out",
84	.sv_coredump	= NULL,
85	.sv_imgact_try	= NULL,
86	.sv_minsigstksz	= MINSIGSTKSZ,
87	.sv_pagesize	= PAGE_SIZE,
88	.sv_minuser	= VM_MIN_ADDRESS,
89	.sv_maxuser	= VM_MAXUSER_ADDRESS,
90	.sv_usrstack	= USRSTACK,
91	.sv_psstrings	= PS_STRINGS,
92	.sv_stackprot	= VM_PROT_ALL,
93	.sv_copyout_strings	= exec_copyout_strings,
94	.sv_setregs	= exec_setregs,
95	.sv_fixlimit	= NULL,
96	.sv_maxssiz	= NULL,
97	.sv_flags	= SV_ABI_FREEBSD | SV_AOUT | SV_IA32 | SV_ILP32,
98	.sv_set_syscall_retval = cpu_set_syscall_retval,
99	.sv_fetch_syscall_args = cpu_fetch_syscall_args,
100	.sv_syscallnames = syscallnames,
101	.sv_schedtail	= NULL,
102};
103
104#elif defined(__amd64__)
105
106#define	AOUT32_USRSTACK	0xbfc00000
107#define	AOUT32_PS_STRINGS \
108    (AOUT32_USRSTACK - sizeof(struct freebsd32_ps_strings))
109#define	AOUT32_MINUSER	FREEBSD32_MINUSER
110
111extern const char *freebsd32_syscallnames[];
112extern u_long ia32_maxssiz;
113
114struct sysentvec aout_sysvec = {
115	.sv_size	= FREEBSD32_SYS_MAXSYSCALL,
116	.sv_table	= freebsd32_sysent,
117	.sv_mask	= 0,
118	.sv_sigsize	= 0,
119	.sv_sigtbl	= NULL,
120	.sv_errsize	= 0,
121	.sv_errtbl	= NULL,
122	.sv_transtrap	= NULL,
123	.sv_fixup	= aout_fixup,
124	.sv_sendsig	= ia32_sendsig,
125	.sv_sigcode	= ia32_sigcode,
126	.sv_szsigcode	= &sz_ia32_sigcode,
127	.sv_prepsyscall	= NULL,
128	.sv_name	= "FreeBSD a.out",
129	.sv_coredump	= NULL,
130	.sv_imgact_try	= NULL,
131	.sv_minsigstksz	= MINSIGSTKSZ,
132	.sv_pagesize	= IA32_PAGE_SIZE,
133	.sv_minuser	= AOUT32_MINUSER,
134	.sv_maxuser	= AOUT32_USRSTACK,
135	.sv_usrstack	= AOUT32_USRSTACK,
136	.sv_psstrings	= AOUT32_PS_STRINGS,
137	.sv_stackprot	= VM_PROT_ALL,
138	.sv_copyout_strings	= freebsd32_copyout_strings,
139	.sv_setregs	= ia32_setregs,
140	.sv_fixlimit	= ia32_fixlimit,
141	.sv_maxssiz	= &ia32_maxssiz,
142	.sv_flags	= SV_ABI_FREEBSD | SV_AOUT | SV_IA32 | SV_ILP32,
143	.sv_set_syscall_retval = ia32_set_syscall_retval,
144	.sv_fetch_syscall_args = ia32_fetch_syscall_args,
145	.sv_syscallnames = freebsd32_syscallnames,
146};
147#else
148#error "Port me"
149#endif
150
151static int
152aout_fixup(register_t **stack_base, struct image_params *imgp)
153{
154
155	*(char **)stack_base -= sizeof(uint32_t);
156	return (suword32(*stack_base, imgp->args->argc));
157}
158
159static int
160exec_aout_imgact(struct image_params *imgp)
161{
162	const struct exec *a_out = (const struct exec *) imgp->image_header;
163	struct vmspace *vmspace;
164	vm_map_t map;
165	vm_object_t object;
166	vm_offset_t text_end, data_end;
167	unsigned long virtual_offset;
168	unsigned long file_offset;
169	unsigned long bss_size;
170	int error;
171
172	/*
173	 * Linux and *BSD binaries look very much alike,
174	 * only the machine id is different:
175	 * 0x64 for Linux, 0x86 for *BSD, 0x00 for BSDI.
176	 * NetBSD is in network byte order.. ugh.
177	 */
178	if (((a_out->a_magic >> 16) & 0xff) != 0x86 &&
179	    ((a_out->a_magic >> 16) & 0xff) != 0 &&
180	    ((((int)ntohl(a_out->a_magic)) >> 16) & 0xff) != 0x86)
181                return -1;
182
183	/*
184	 * Set file/virtual offset based on a.out variant.
185	 *	We do two cases: host byte order and network byte order
186	 *	(for NetBSD compatibility)
187	 */
188	switch ((int)(a_out->a_magic & 0xffff)) {
189	case ZMAGIC:
190		virtual_offset = 0;
191		if (a_out->a_text) {
192			file_offset = PAGE_SIZE;
193		} else {
194			/* Bill's "screwball mode" */
195			file_offset = 0;
196		}
197		break;
198	case QMAGIC:
199		virtual_offset = PAGE_SIZE;
200		file_offset = 0;
201		/* Pass PS_STRINGS for BSD/OS binaries only. */
202		if (N_GETMID(*a_out) == MID_ZERO)
203			imgp->ps_strings = aout_sysvec.sv_psstrings;
204		break;
205	default:
206		/* NetBSD compatibility */
207		switch ((int)(ntohl(a_out->a_magic) & 0xffff)) {
208		case ZMAGIC:
209		case QMAGIC:
210			virtual_offset = PAGE_SIZE;
211			file_offset = 0;
212			break;
213		default:
214			return (-1);
215		}
216	}
217
218	bss_size = roundup(a_out->a_bss, PAGE_SIZE);
219
220	/*
221	 * Check various fields in header for validity/bounds.
222	 */
223	if (/* entry point must lay with text region */
224	    a_out->a_entry < virtual_offset ||
225	    a_out->a_entry >= virtual_offset + a_out->a_text ||
226
227	    /* text and data size must each be page rounded */
228	    a_out->a_text & PAGE_MASK || a_out->a_data & PAGE_MASK
229
230#ifdef __amd64__
231	    ||
232	    /* overflows */
233	    virtual_offset + a_out->a_text + a_out->a_data + bss_size > UINT_MAX
234#endif
235	    )
236		return (-1);
237
238	/* text + data can't exceed file size */
239	if (a_out->a_data + a_out->a_text > imgp->attr->va_size)
240		return (EFAULT);
241
242	/*
243	 * text/data/bss must not exceed limits
244	 */
245	PROC_LOCK(imgp->proc);
246	if (/* text can't exceed maximum text size */
247	    a_out->a_text > maxtsiz ||
248
249	    /* data + bss can't exceed rlimit */
250	    a_out->a_data + bss_size > lim_cur(imgp->proc, RLIMIT_DATA) ||
251	    racct_set(imgp->proc, RACCT_DATA, a_out->a_data + bss_size) != 0) {
252			PROC_UNLOCK(imgp->proc);
253			return (ENOMEM);
254	}
255	PROC_UNLOCK(imgp->proc);
256
257	/*
258	 * Avoid a possible deadlock if the current address space is destroyed
259	 * and that address space maps the locked vnode.  In the common case,
260	 * the locked vnode's v_usecount is decremented but remains greater
261	 * than zero.  Consequently, the vnode lock is not needed by vrele().
262	 * However, in cases where the vnode lock is external, such as nullfs,
263	 * v_usecount may become zero.
264	 */
265	VOP_UNLOCK(imgp->vp, 0);
266
267	/*
268	 * Destroy old process VM and create a new one (with a new stack)
269	 */
270	error = exec_new_vmspace(imgp, &aout_sysvec);
271
272	vn_lock(imgp->vp, LK_EXCLUSIVE | LK_RETRY);
273	if (error)
274		return (error);
275
276	/*
277	 * The vm space can be changed by exec_new_vmspace
278	 */
279	vmspace = imgp->proc->p_vmspace;
280
281	object = imgp->object;
282	map = &vmspace->vm_map;
283	vm_map_lock(map);
284	vm_object_reference(object);
285
286	text_end = virtual_offset + a_out->a_text;
287	error = vm_map_insert(map, object,
288		file_offset,
289		virtual_offset, text_end,
290		VM_PROT_READ | VM_PROT_EXECUTE, VM_PROT_ALL,
291		MAP_COPY_ON_WRITE | MAP_PREFAULT);
292	if (error) {
293		vm_map_unlock(map);
294		vm_object_deallocate(object);
295		return (error);
296	}
297	data_end = text_end + a_out->a_data;
298	if (a_out->a_data) {
299		vm_object_reference(object);
300		error = vm_map_insert(map, object,
301			file_offset + a_out->a_text,
302			text_end, data_end,
303			VM_PROT_ALL, VM_PROT_ALL,
304			MAP_COPY_ON_WRITE | MAP_PREFAULT);
305		if (error) {
306			vm_map_unlock(map);
307			vm_object_deallocate(object);
308			return (error);
309		}
310	}
311
312	if (bss_size) {
313		error = vm_map_insert(map, NULL, 0,
314			data_end, data_end + bss_size,
315			VM_PROT_ALL, VM_PROT_ALL, 0);
316		if (error) {
317			vm_map_unlock(map);
318			return (error);
319		}
320	}
321	vm_map_unlock(map);
322
323	/* Fill in process VM information */
324	vmspace->vm_tsize = a_out->a_text >> PAGE_SHIFT;
325	vmspace->vm_dsize = (a_out->a_data + bss_size) >> PAGE_SHIFT;
326	vmspace->vm_taddr = (caddr_t) (uintptr_t) virtual_offset;
327	vmspace->vm_daddr = (caddr_t) (uintptr_t)
328			    (virtual_offset + a_out->a_text);
329
330	/* Fill in image_params */
331	imgp->interpreted = 0;
332	imgp->entry_addr = a_out->a_entry;
333
334	imgp->proc->p_sysent = &aout_sysvec;
335
336	return (0);
337}
338
339/*
340 * Tell kern_execve.c about it, with a little help from the linker.
341 */
342static struct execsw aout_execsw = { exec_aout_imgact, "a.out" };
343EXEC_SET(aout, aout_execsw);
344