xref: /f-stack/freebsd/i386/linux/linux_sysvec.c (revision 22ce4aff)
1a9643ea8Slogwang /*-
2*22ce4affSfengbojiang  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3*22ce4affSfengbojiang  *
4a9643ea8Slogwang  * Copyright (c) 1994-1996 Søren Schmidt
5a9643ea8Slogwang  * All rights reserved.
6a9643ea8Slogwang  *
7a9643ea8Slogwang  * Redistribution and use in source and binary forms, with or without
8a9643ea8Slogwang  * modification, are permitted provided that the following conditions
9a9643ea8Slogwang  * are met:
10a9643ea8Slogwang  * 1. Redistributions of source code must retain the above copyright
11*22ce4affSfengbojiang  *    notice, this list of conditions and the following disclaimer.
12a9643ea8Slogwang  * 2. Redistributions in binary form must reproduce the above copyright
13a9643ea8Slogwang  *    notice, this list of conditions and the following disclaimer in the
14a9643ea8Slogwang  *    documentation and/or other materials provided with the distribution.
15a9643ea8Slogwang  *
16*22ce4affSfengbojiang  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17*22ce4affSfengbojiang  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18*22ce4affSfengbojiang  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19*22ce4affSfengbojiang  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20*22ce4affSfengbojiang  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21*22ce4affSfengbojiang  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22*22ce4affSfengbojiang  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23*22ce4affSfengbojiang  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24*22ce4affSfengbojiang  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25*22ce4affSfengbojiang  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26*22ce4affSfengbojiang  * SUCH DAMAGE.
27a9643ea8Slogwang  */
28a9643ea8Slogwang 
29a9643ea8Slogwang #include <sys/cdefs.h>
30a9643ea8Slogwang __FBSDID("$FreeBSD$");
31a9643ea8Slogwang 
32a9643ea8Slogwang #include <sys/param.h>
33a9643ea8Slogwang #include <sys/systm.h>
34a9643ea8Slogwang #include <sys/exec.h>
35a9643ea8Slogwang #include <sys/fcntl.h>
36a9643ea8Slogwang #include <sys/imgact.h>
37a9643ea8Slogwang #include <sys/imgact_aout.h>
38a9643ea8Slogwang #include <sys/imgact_elf.h>
39a9643ea8Slogwang #include <sys/kernel.h>
40a9643ea8Slogwang #include <sys/lock.h>
41a9643ea8Slogwang #include <sys/malloc.h>
42a9643ea8Slogwang #include <sys/module.h>
43a9643ea8Slogwang #include <sys/mutex.h>
44a9643ea8Slogwang #include <sys/proc.h>
45a9643ea8Slogwang #include <sys/signalvar.h>
46a9643ea8Slogwang #include <sys/syscallsubr.h>
47a9643ea8Slogwang #include <sys/sysctl.h>
48a9643ea8Slogwang #include <sys/sysent.h>
49a9643ea8Slogwang #include <sys/sysproto.h>
50a9643ea8Slogwang #include <sys/vnode.h>
51a9643ea8Slogwang 
52a9643ea8Slogwang #include <vm/vm.h>
53a9643ea8Slogwang #include <vm/pmap.h>
54a9643ea8Slogwang #include <vm/vm_extern.h>
55a9643ea8Slogwang #include <vm/vm_map.h>
56a9643ea8Slogwang #include <vm/vm_object.h>
57a9643ea8Slogwang #include <vm/vm_page.h>
58a9643ea8Slogwang #include <vm/vm_param.h>
59a9643ea8Slogwang 
60a9643ea8Slogwang #include <machine/cpu.h>
61a9643ea8Slogwang #include <machine/cputypes.h>
62a9643ea8Slogwang #include <machine/md_var.h>
63a9643ea8Slogwang #include <machine/pcb.h>
64*22ce4affSfengbojiang #include <machine/trap.h>
65a9643ea8Slogwang 
66a9643ea8Slogwang #include <i386/linux/linux.h>
67a9643ea8Slogwang #include <i386/linux/linux_proto.h>
68a9643ea8Slogwang #include <compat/linux/linux_emul.h>
69a9643ea8Slogwang #include <compat/linux/linux_ioctl.h>
70a9643ea8Slogwang #include <compat/linux/linux_mib.h>
71a9643ea8Slogwang #include <compat/linux/linux_misc.h>
72a9643ea8Slogwang #include <compat/linux/linux_signal.h>
73a9643ea8Slogwang #include <compat/linux/linux_util.h>
74a9643ea8Slogwang #include <compat/linux/linux_vdso.h>
75a9643ea8Slogwang 
76a9643ea8Slogwang MODULE_VERSION(linux, 1);
77a9643ea8Slogwang 
78a9643ea8Slogwang #define	LINUX_PS_STRINGS	(LINUX_USRSTACK - sizeof(struct ps_strings))
79a9643ea8Slogwang 
80a9643ea8Slogwang static int linux_szsigcode;
81a9643ea8Slogwang static vm_object_t linux_shared_page_obj;
82a9643ea8Slogwang static char *linux_shared_page_mapping;
83a9643ea8Slogwang extern char _binary_linux_locore_o_start;
84a9643ea8Slogwang extern char _binary_linux_locore_o_end;
85a9643ea8Slogwang 
86a9643ea8Slogwang extern struct sysent linux_sysent[LINUX_SYS_MAXSYSCALL];
87a9643ea8Slogwang 
88a9643ea8Slogwang SET_DECLARE(linux_ioctl_handler_set, struct linux_ioctl_handler);
89a9643ea8Slogwang 
90*22ce4affSfengbojiang static int	linux_fixup(uintptr_t *stack_base,
91a9643ea8Slogwang 		    struct image_params *iparams);
92*22ce4affSfengbojiang static int	linux_fixup_elf(uintptr_t *stack_base,
93a9643ea8Slogwang 		    struct image_params *iparams);
94a9643ea8Slogwang static void     linux_sendsig(sig_t catcher, ksiginfo_t *ksi, sigset_t *mask);
95*22ce4affSfengbojiang static void	linux_exec_setregs(struct thread *td,
96*22ce4affSfengbojiang 		    struct image_params *imgp, uintptr_t stack);
97*22ce4affSfengbojiang static int	linux_copyout_strings(struct image_params *imgp,
98*22ce4affSfengbojiang 		    uintptr_t *stack_base);
99*22ce4affSfengbojiang static bool	linux_trans_osrel(const Elf_Note *note, int32_t *osrel);
100a9643ea8Slogwang static void	linux_vdso_install(void *param);
101a9643ea8Slogwang static void	linux_vdso_deinstall(void *param);
102a9643ea8Slogwang 
103a9643ea8Slogwang static int linux_szplatform;
104a9643ea8Slogwang const char *linux_kplatform;
105a9643ea8Slogwang 
/*
 * Translation from FreeBSD trap numbers (T_*, used as the array index)
 * to the trap numbers stored in the sc_trapno field of a Linux signal
 * context.  FreeBSD traps that have no entry map to LINUX_T_UNKNOWN.
 *
 * The table is only ever read, so it is const-qualified.
 */
#define	LINUX_T_UNKNOWN		255
static const int _bsd_to_linux_trapcode[] = {
	LINUX_T_UNKNOWN,	/* 0 */
	6,			/* 1  T_PRIVINFLT */
	LINUX_T_UNKNOWN,	/* 2 */
	3,			/* 3  T_BPTFLT */
	LINUX_T_UNKNOWN,	/* 4 */
	LINUX_T_UNKNOWN,	/* 5 */
	16,			/* 6  T_ARITHTRAP */
	254,			/* 7  T_ASTFLT */
	LINUX_T_UNKNOWN,	/* 8 */
	13,			/* 9  T_PROTFLT */
	1,			/* 10 T_TRCTRAP */
	LINUX_T_UNKNOWN,	/* 11 */
	14,			/* 12 T_PAGEFLT */
	LINUX_T_UNKNOWN,	/* 13 */
	17,			/* 14 T_ALIGNFLT */
	LINUX_T_UNKNOWN,	/* 15 */
	LINUX_T_UNKNOWN,	/* 16 */
	LINUX_T_UNKNOWN,	/* 17 */
	0,			/* 18 T_DIVIDE */
	2,			/* 19 T_NMI */
	4,			/* 20 T_OFLOW */
	5,			/* 21 T_BOUND */
	7,			/* 22 T_DNA */
	8,			/* 23 T_DOUBLEFLT */
	9,			/* 24 T_FPOPFLT */
	10,			/* 25 T_TSSFLT */
	11,			/* 26 T_SEGNPFLT */
	12,			/* 27 T_STKFLT */
	18,			/* 28 T_MCHK */
	19,			/* 29 T_XMMFLT */
	15			/* 30 T_RESERVED */
};

/*
 * Map FreeBSD trap number `code' to its Linux counterpart; anything
 * beyond the end of the table yields LINUX_T_UNKNOWN.
 *
 * NOTE: `code' is evaluated twice, so do not pass an expression with
 * side effects.  Negative int arguments also end up as LINUX_T_UNKNOWN,
 * assuming nitems() yields an unsigned (sizeof-based) count so that the
 * comparison is performed unsigned.
 */
#define	bsd_to_linux_trapcode(code)					\
	((code) < nitems(_bsd_to_linux_trapcode) ?			\
	    _bsd_to_linux_trapcode[(code)] :				\
	    LINUX_T_UNKNOWN)
144a9643ea8Slogwang 
/*
 * Symbols declared through LINUX_VDSO_SYM_INTPTR (macro defined outside
 * this file; presumably they resolve to addresses inside the Linux
 * vDSO -- confirm in compat/linux/linux_vdso.h).  In this file
 * linux_sigcode and linux_rt_sigcode are loaded into %eip when a signal
 * handler is dispatched, and linux_vsyscall is exported to the new image
 * as LINUX_AT_SYSINFO.
 */
LINUX_VDSO_SYM_INTPTR(linux_sigcode);
LINUX_VDSO_SYM_INTPTR(linux_rt_sigcode);
LINUX_VDSO_SYM_INTPTR(linux_vsyscall);
148a9643ea8Slogwang 
149a9643ea8Slogwang /*
150a9643ea8Slogwang  * If FreeBSD & Linux have a difference of opinion about what a trap
151a9643ea8Slogwang  * means, deal with it here.
152a9643ea8Slogwang  *
153a9643ea8Slogwang  * MPSAFE
154a9643ea8Slogwang  */
155a9643ea8Slogwang static int
linux_translate_traps(int signal,int trap_code)156*22ce4affSfengbojiang linux_translate_traps(int signal, int trap_code)
157a9643ea8Slogwang {
158a9643ea8Slogwang 	if (signal != SIGBUS)
159a9643ea8Slogwang 		return (signal);
160a9643ea8Slogwang 	switch (trap_code) {
161a9643ea8Slogwang 	case T_PROTFLT:
162a9643ea8Slogwang 	case T_TSSFLT:
163a9643ea8Slogwang 	case T_DOUBLEFLT:
164a9643ea8Slogwang 	case T_PAGEFLT:
165a9643ea8Slogwang 		return (SIGSEGV);
166a9643ea8Slogwang 	default:
167a9643ea8Slogwang 		return (signal);
168a9643ea8Slogwang 	}
169a9643ea8Slogwang }
170a9643ea8Slogwang 
171a9643ea8Slogwang static int
linux_fixup(uintptr_t * stack_base,struct image_params * imgp)172*22ce4affSfengbojiang linux_fixup(uintptr_t *stack_base, struct image_params *imgp)
173a9643ea8Slogwang {
174*22ce4affSfengbojiang 	register_t *base, *argv, *envp;
175a9643ea8Slogwang 
176*22ce4affSfengbojiang 	base = (register_t *)*stack_base;
177*22ce4affSfengbojiang 	argv = base;
178*22ce4affSfengbojiang 	envp = base + (imgp->args->argc + 1);
179*22ce4affSfengbojiang 	base--;
180*22ce4affSfengbojiang 	suword(base, (intptr_t)envp);
181*22ce4affSfengbojiang 	base--;
182*22ce4affSfengbojiang 	suword(base, (intptr_t)argv);
183*22ce4affSfengbojiang 	base--;
184*22ce4affSfengbojiang 	suword(base, imgp->args->argc);
185*22ce4affSfengbojiang 	*stack_base = (uintptr_t)base;
186a9643ea8Slogwang 	return (0);
187a9643ea8Slogwang }
188a9643ea8Slogwang 
189a9643ea8Slogwang static int
linux_copyout_auxargs(struct image_params * imgp,uintptr_t base)190*22ce4affSfengbojiang linux_copyout_auxargs(struct image_params *imgp, uintptr_t base)
191a9643ea8Slogwang {
192a9643ea8Slogwang 	struct proc *p;
193a9643ea8Slogwang 	Elf32_Auxargs *args;
194*22ce4affSfengbojiang 	Elf32_Auxinfo *argarray, *pos;
195a9643ea8Slogwang 	Elf32_Addr *uplatform;
196a9643ea8Slogwang 	struct ps_strings *arginfo;
197*22ce4affSfengbojiang 	int error, issetugid;
198a9643ea8Slogwang 
199a9643ea8Slogwang 	p = imgp->proc;
200a9643ea8Slogwang 	issetugid = imgp->proc->p_flag & P_SUGID ? 1 : 0;
201a9643ea8Slogwang 	arginfo = (struct ps_strings *)p->p_sysent->sv_psstrings;
202a9643ea8Slogwang 	uplatform = (Elf32_Addr *)((caddr_t)arginfo - linux_szplatform);
203a9643ea8Slogwang 	args = (Elf32_Auxargs *)imgp->auxargs;
204*22ce4affSfengbojiang 	argarray = pos = malloc(LINUX_AT_COUNT * sizeof(*pos), M_TEMP,
205*22ce4affSfengbojiang 	    M_WAITOK | M_ZERO);
206a9643ea8Slogwang 
207a9643ea8Slogwang 	AUXARGS_ENTRY(pos, LINUX_AT_SYSINFO_EHDR,
208a9643ea8Slogwang 	    imgp->proc->p_sysent->sv_shared_page_base);
209a9643ea8Slogwang 	AUXARGS_ENTRY(pos, LINUX_AT_SYSINFO, linux_vsyscall);
210a9643ea8Slogwang 	AUXARGS_ENTRY(pos, LINUX_AT_HWCAP, cpu_feature);
211a9643ea8Slogwang 
212a9643ea8Slogwang 	/*
213a9643ea8Slogwang 	 * Do not export AT_CLKTCK when emulating Linux kernel prior to 2.4.0,
214a9643ea8Slogwang 	 * as it has appeared in the 2.4.0-rc7 first time.
215a9643ea8Slogwang 	 * Being exported, AT_CLKTCK is returned by sysconf(_SC_CLK_TCK),
216a9643ea8Slogwang 	 * glibc falls back to the hard-coded CLK_TCK value when aux entry
217a9643ea8Slogwang 	 * is not present.
218a9643ea8Slogwang 	 * Also see linux_times() implementation.
219a9643ea8Slogwang 	 */
220a9643ea8Slogwang 	if (linux_kernver(curthread) >= LINUX_KERNVER_2004000)
221a9643ea8Slogwang 		AUXARGS_ENTRY(pos, LINUX_AT_CLKTCK, stclohz);
222a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_PHDR, args->phdr);
223a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_PHENT, args->phent);
224a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_PHNUM, args->phnum);
225a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_PAGESZ, args->pagesz);
226a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_FLAGS, args->flags);
227a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_ENTRY, args->entry);
228a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_BASE, args->base);
229a9643ea8Slogwang 	AUXARGS_ENTRY(pos, LINUX_AT_SECURE, issetugid);
230a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_UID, imgp->proc->p_ucred->cr_ruid);
231a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_EUID, imgp->proc->p_ucred->cr_svuid);
232a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_GID, imgp->proc->p_ucred->cr_rgid);
233a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_EGID, imgp->proc->p_ucred->cr_svgid);
234a9643ea8Slogwang 	AUXARGS_ENTRY(pos, LINUX_AT_PLATFORM, PTROUT(uplatform));
235*22ce4affSfengbojiang 	AUXARGS_ENTRY_PTR(pos, LINUX_AT_RANDOM, imgp->canary);
236a9643ea8Slogwang 	if (imgp->execpathp != 0)
237*22ce4affSfengbojiang 		AUXARGS_ENTRY_PTR(pos, LINUX_AT_EXECFN, imgp->execpathp);
238a9643ea8Slogwang 	if (args->execfd != -1)
239a9643ea8Slogwang 		AUXARGS_ENTRY(pos, AT_EXECFD, args->execfd);
240a9643ea8Slogwang 	AUXARGS_ENTRY(pos, AT_NULL, 0);
241a9643ea8Slogwang 
242a9643ea8Slogwang 	free(imgp->auxargs, M_TEMP);
243a9643ea8Slogwang 	imgp->auxargs = NULL;
244*22ce4affSfengbojiang 	KASSERT(pos - argarray <= LINUX_AT_COUNT, ("Too many auxargs"));
245a9643ea8Slogwang 
246*22ce4affSfengbojiang 	error = copyout(argarray, (void *)base,
247*22ce4affSfengbojiang 	    sizeof(*argarray) * LINUX_AT_COUNT);
248*22ce4affSfengbojiang 	free(argarray, M_TEMP);
249*22ce4affSfengbojiang 	return (error);
250*22ce4affSfengbojiang }
251*22ce4affSfengbojiang 
252*22ce4affSfengbojiang static int
linux_fixup_elf(uintptr_t * stack_base,struct image_params * imgp)253*22ce4affSfengbojiang linux_fixup_elf(uintptr_t *stack_base, struct image_params *imgp)
254*22ce4affSfengbojiang {
255*22ce4affSfengbojiang 	register_t *base;
256*22ce4affSfengbojiang 
257*22ce4affSfengbojiang 	base = (register_t *)*stack_base;
258*22ce4affSfengbojiang 	base--;
259*22ce4affSfengbojiang 	if (suword(base, (register_t)imgp->args->argc) == -1)
260*22ce4affSfengbojiang 		return (EFAULT);
261*22ce4affSfengbojiang 	*stack_base = (uintptr_t)base;
262a9643ea8Slogwang 	return (0);
263a9643ea8Slogwang }
264a9643ea8Slogwang 
265a9643ea8Slogwang /*
266a9643ea8Slogwang  * Copied from kern/kern_exec.c
267a9643ea8Slogwang  */
268*22ce4affSfengbojiang static int
linux_copyout_strings(struct image_params * imgp,uintptr_t * stack_base)269*22ce4affSfengbojiang linux_copyout_strings(struct image_params *imgp, uintptr_t *stack_base)
270a9643ea8Slogwang {
271*22ce4affSfengbojiang 	int argc, envc, error;
272a9643ea8Slogwang 	char **vectp;
273*22ce4affSfengbojiang 	char *stringp;
274*22ce4affSfengbojiang 	uintptr_t destp, ustringp;
275a9643ea8Slogwang 	struct ps_strings *arginfo;
276a9643ea8Slogwang 	char canary[LINUX_AT_RANDOM_LEN];
277a9643ea8Slogwang 	size_t execpath_len;
278a9643ea8Slogwang 	struct proc *p;
279a9643ea8Slogwang 
280*22ce4affSfengbojiang 	/* Calculate string base and vector table pointers. */
281a9643ea8Slogwang 	p = imgp->proc;
282a9643ea8Slogwang 	if (imgp->execpath != NULL && imgp->auxargs != NULL)
283a9643ea8Slogwang 		execpath_len = strlen(imgp->execpath) + 1;
284a9643ea8Slogwang 	else
285a9643ea8Slogwang 		execpath_len = 0;
286a9643ea8Slogwang 	arginfo = (struct ps_strings *)p->p_sysent->sv_psstrings;
287*22ce4affSfengbojiang 	destp = (uintptr_t)arginfo;
288a9643ea8Slogwang 
289*22ce4affSfengbojiang 	/* Install LINUX_PLATFORM. */
290*22ce4affSfengbojiang 	destp -= linux_szplatform;
291*22ce4affSfengbojiang 	destp = rounddown2(destp, sizeof(void *));
292*22ce4affSfengbojiang 	error = copyout(linux_kplatform, (void *)destp, linux_szplatform);
293*22ce4affSfengbojiang 	if (error != 0)
294*22ce4affSfengbojiang 		return (error);
295a9643ea8Slogwang 
296a9643ea8Slogwang 	if (execpath_len != 0) {
297*22ce4affSfengbojiang 		destp -= execpath_len;
298*22ce4affSfengbojiang 		destp = rounddown2(destp, sizeof(void *));
299*22ce4affSfengbojiang 		imgp->execpathp = (void *)destp;
300*22ce4affSfengbojiang 		error = copyout(imgp->execpath, imgp->execpathp, execpath_len);
301*22ce4affSfengbojiang 		if (error != 0)
302*22ce4affSfengbojiang 			return (error);
303a9643ea8Slogwang 	}
304a9643ea8Slogwang 
305*22ce4affSfengbojiang 	/* Prepare the canary for SSP. */
306a9643ea8Slogwang 	arc4rand(canary, sizeof(canary), 0);
307*22ce4affSfengbojiang 	destp -= roundup(sizeof(canary), sizeof(void *));
308*22ce4affSfengbojiang 	imgp->canary = (void *)destp;
309*22ce4affSfengbojiang 	error = copyout(canary, imgp->canary, sizeof(canary));
310*22ce4affSfengbojiang 	if (error != 0)
311*22ce4affSfengbojiang 		return (error);
312a9643ea8Slogwang 
313*22ce4affSfengbojiang 	/* Allocate room for the argument and environment strings. */
314*22ce4affSfengbojiang 	destp -= ARG_MAX - imgp->args->stringspace;
315*22ce4affSfengbojiang 	destp = rounddown2(destp, sizeof(void *));
316*22ce4affSfengbojiang 	ustringp = destp;
317*22ce4affSfengbojiang 
318a9643ea8Slogwang 	if (imgp->auxargs) {
319a9643ea8Slogwang 		/*
320*22ce4affSfengbojiang 		 * Allocate room on the stack for the ELF auxargs
321*22ce4affSfengbojiang 		 * array.  It has LINUX_AT_COUNT entries.
322a9643ea8Slogwang 		 */
323*22ce4affSfengbojiang 		destp -= LINUX_AT_COUNT * sizeof(Elf32_Auxinfo);
324*22ce4affSfengbojiang 		destp = rounddown2(destp, sizeof(void *));
325a9643ea8Slogwang 	}
326a9643ea8Slogwang 
327*22ce4affSfengbojiang 	vectp = (char **)destp;
328*22ce4affSfengbojiang 
329a9643ea8Slogwang 	/*
330*22ce4affSfengbojiang 	 * Allocate room for the argv[] and env vectors including the
331*22ce4affSfengbojiang 	 * terminating NULL pointers.
332a9643ea8Slogwang 	 */
333*22ce4affSfengbojiang 	vectp -= imgp->args->argc + 1 + imgp->args->envc + 1;
334*22ce4affSfengbojiang 
335*22ce4affSfengbojiang 	/* vectp also becomes our initial stack base. */
336*22ce4affSfengbojiang 	*stack_base = (uintptr_t)vectp;
337a9643ea8Slogwang 
338a9643ea8Slogwang 	stringp = imgp->args->begin_argv;
339a9643ea8Slogwang 	argc = imgp->args->argc;
340a9643ea8Slogwang 	envc = imgp->args->envc;
341a9643ea8Slogwang 
342*22ce4affSfengbojiang 	/* Copy out strings - arguments and environment. */
343*22ce4affSfengbojiang 	error = copyout(stringp, (void *)ustringp,
344*22ce4affSfengbojiang 	    ARG_MAX - imgp->args->stringspace);
345*22ce4affSfengbojiang 	if (error != 0)
346*22ce4affSfengbojiang 		return (error);
347a9643ea8Slogwang 
348*22ce4affSfengbojiang 	/* Fill in "ps_strings" struct for ps, w, etc. */
349*22ce4affSfengbojiang 	if (suword(&arginfo->ps_argvstr, (long)(intptr_t)vectp) != 0 ||
350*22ce4affSfengbojiang 	    suword(&arginfo->ps_nargvstr, argc) != 0)
351*22ce4affSfengbojiang 		return (EFAULT);
352a9643ea8Slogwang 
353*22ce4affSfengbojiang 	/* Fill in argument portion of vector table. */
354a9643ea8Slogwang 	for (; argc > 0; --argc) {
355*22ce4affSfengbojiang 		if (suword(vectp++, ustringp) != 0)
356*22ce4affSfengbojiang 			return (EFAULT);
357a9643ea8Slogwang 		while (*stringp++ != 0)
358*22ce4affSfengbojiang 			ustringp++;
359*22ce4affSfengbojiang 		ustringp++;
360a9643ea8Slogwang 	}
361a9643ea8Slogwang 
362*22ce4affSfengbojiang 	/* A null vector table pointer separates the argp's from the envp's. */
363*22ce4affSfengbojiang 	if (suword(vectp++, 0) != 0)
364*22ce4affSfengbojiang 		return (EFAULT);
365a9643ea8Slogwang 
366*22ce4affSfengbojiang 	if (suword(&arginfo->ps_envstr, (long)(intptr_t)vectp) != 0 ||
367*22ce4affSfengbojiang 	    suword(&arginfo->ps_nenvstr, envc) != 0)
368*22ce4affSfengbojiang 		return (EFAULT);
369a9643ea8Slogwang 
370*22ce4affSfengbojiang 	/* Fill in environment portion of vector table. */
371a9643ea8Slogwang 	for (; envc > 0; --envc) {
372*22ce4affSfengbojiang 		if (suword(vectp++, ustringp) != 0)
373*22ce4affSfengbojiang 			return (EFAULT);
374a9643ea8Slogwang 		while (*stringp++ != 0)
375*22ce4affSfengbojiang 			ustringp++;
376*22ce4affSfengbojiang 		ustringp++;
377a9643ea8Slogwang 	}
378a9643ea8Slogwang 
379*22ce4affSfengbojiang 	/* The end of the vector table is a null pointer. */
380*22ce4affSfengbojiang 	if (suword(vectp, 0) != 0)
381*22ce4affSfengbojiang 		return (EFAULT);
382a9643ea8Slogwang 
383*22ce4affSfengbojiang 	if (imgp->auxargs) {
384*22ce4affSfengbojiang 		vectp++;
385*22ce4affSfengbojiang 		error = imgp->sysent->sv_copyout_auxargs(imgp,
386*22ce4affSfengbojiang 		    (uintptr_t)vectp);
387*22ce4affSfengbojiang 		if (error != 0)
388*22ce4affSfengbojiang 			return (error);
389*22ce4affSfengbojiang 	}
390*22ce4affSfengbojiang 
391*22ce4affSfengbojiang 	return (0);
392a9643ea8Slogwang }
393a9643ea8Slogwang 
394a9643ea8Slogwang static void
linux_rt_sendsig(sig_t catcher,ksiginfo_t * ksi,sigset_t * mask)395a9643ea8Slogwang linux_rt_sendsig(sig_t catcher, ksiginfo_t *ksi, sigset_t *mask)
396a9643ea8Slogwang {
397a9643ea8Slogwang 	struct thread *td = curthread;
398a9643ea8Slogwang 	struct proc *p = td->td_proc;
399a9643ea8Slogwang 	struct sigacts *psp;
400a9643ea8Slogwang 	struct trapframe *regs;
401a9643ea8Slogwang 	struct l_rt_sigframe *fp, frame;
402a9643ea8Slogwang 	int sig, code;
403a9643ea8Slogwang 	int oonstack;
404a9643ea8Slogwang 
405a9643ea8Slogwang 	sig = ksi->ksi_signo;
406a9643ea8Slogwang 	code = ksi->ksi_code;
407a9643ea8Slogwang 	PROC_LOCK_ASSERT(p, MA_OWNED);
408a9643ea8Slogwang 	psp = p->p_sigacts;
409a9643ea8Slogwang 	mtx_assert(&psp->ps_mtx, MA_OWNED);
410a9643ea8Slogwang 	regs = td->td_frame;
411a9643ea8Slogwang 	oonstack = sigonstack(regs->tf_esp);
412a9643ea8Slogwang 
413*22ce4affSfengbojiang 	/* Allocate space for the signal handler context. */
414a9643ea8Slogwang 	if ((td->td_pflags & TDP_ALTSTACK) && !oonstack &&
415a9643ea8Slogwang 	    SIGISMEMBER(psp->ps_sigonstack, sig)) {
416a9643ea8Slogwang 		fp = (struct l_rt_sigframe *)((uintptr_t)td->td_sigstk.ss_sp +
417a9643ea8Slogwang 		    td->td_sigstk.ss_size - sizeof(struct l_rt_sigframe));
418a9643ea8Slogwang 	} else
419a9643ea8Slogwang 		fp = (struct l_rt_sigframe *)regs->tf_esp - 1;
420a9643ea8Slogwang 	mtx_unlock(&psp->ps_mtx);
421a9643ea8Slogwang 
422*22ce4affSfengbojiang 	/* Build the argument list for the signal handler. */
423a9643ea8Slogwang 	sig = bsd_to_linux_signal(sig);
424a9643ea8Slogwang 
425a9643ea8Slogwang 	bzero(&frame, sizeof(frame));
426a9643ea8Slogwang 
427a9643ea8Slogwang 	frame.sf_handler = catcher;
428a9643ea8Slogwang 	frame.sf_sig = sig;
429a9643ea8Slogwang 	frame.sf_siginfo = &fp->sf_si;
430a9643ea8Slogwang 	frame.sf_ucontext = &fp->sf_sc;
431a9643ea8Slogwang 
432*22ce4affSfengbojiang 	/* Fill in POSIX parts. */
433a9643ea8Slogwang 	ksiginfo_to_lsiginfo(ksi, &frame.sf_si, sig);
434a9643ea8Slogwang 
435*22ce4affSfengbojiang 	/* Build the signal context to be used by sigreturn. */
436a9643ea8Slogwang 	frame.sf_sc.uc_flags = 0;		/* XXX ??? */
437a9643ea8Slogwang 	frame.sf_sc.uc_link = NULL;		/* XXX ??? */
438a9643ea8Slogwang 
439a9643ea8Slogwang 	frame.sf_sc.uc_stack.ss_sp = td->td_sigstk.ss_sp;
440a9643ea8Slogwang 	frame.sf_sc.uc_stack.ss_size = td->td_sigstk.ss_size;
441a9643ea8Slogwang 	frame.sf_sc.uc_stack.ss_flags = (td->td_pflags & TDP_ALTSTACK)
442a9643ea8Slogwang 	    ? ((oonstack) ? LINUX_SS_ONSTACK : 0) : LINUX_SS_DISABLE;
443a9643ea8Slogwang 	PROC_UNLOCK(p);
444a9643ea8Slogwang 
445a9643ea8Slogwang 	bsd_to_linux_sigset(mask, &frame.sf_sc.uc_sigmask);
446a9643ea8Slogwang 
447a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_mask   = frame.sf_sc.uc_sigmask.__mask;
448a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_gs     = rgs();
449a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_fs     = regs->tf_fs;
450a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_es     = regs->tf_es;
451a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_ds     = regs->tf_ds;
452a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_edi    = regs->tf_edi;
453a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_esi    = regs->tf_esi;
454a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_ebp    = regs->tf_ebp;
455a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_ebx    = regs->tf_ebx;
456a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_esp    = regs->tf_esp;
457a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_edx    = regs->tf_edx;
458a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_ecx    = regs->tf_ecx;
459a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_eax    = regs->tf_eax;
460a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_eip    = regs->tf_eip;
461a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_cs     = regs->tf_cs;
462a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_eflags = regs->tf_eflags;
463a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_esp_at_signal = regs->tf_esp;
464a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_ss     = regs->tf_ss;
465a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_err    = regs->tf_err;
466a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_cr2    = (register_t)ksi->ksi_addr;
467a9643ea8Slogwang 	frame.sf_sc.uc_mcontext.sc_trapno = bsd_to_linux_trapcode(code);
468a9643ea8Slogwang 
469a9643ea8Slogwang 	if (copyout(&frame, fp, sizeof(frame)) != 0) {
470a9643ea8Slogwang 		/*
471a9643ea8Slogwang 		 * Process has trashed its stack; give it an illegal
472a9643ea8Slogwang 		 * instruction to halt it in its tracks.
473a9643ea8Slogwang 		 */
474a9643ea8Slogwang 		PROC_LOCK(p);
475a9643ea8Slogwang 		sigexit(td, SIGILL);
476a9643ea8Slogwang 	}
477a9643ea8Slogwang 
478*22ce4affSfengbojiang 	/* Build context to run handler in. */
479a9643ea8Slogwang 	regs->tf_esp = (int)fp;
480a9643ea8Slogwang 	regs->tf_eip = linux_rt_sigcode;
481a9643ea8Slogwang 	regs->tf_eflags &= ~(PSL_T | PSL_VM | PSL_D);
482a9643ea8Slogwang 	regs->tf_cs = _ucodesel;
483a9643ea8Slogwang 	regs->tf_ds = _udatasel;
484a9643ea8Slogwang 	regs->tf_es = _udatasel;
485a9643ea8Slogwang 	regs->tf_fs = _udatasel;
486a9643ea8Slogwang 	regs->tf_ss = _udatasel;
487a9643ea8Slogwang 	PROC_LOCK(p);
488a9643ea8Slogwang 	mtx_lock(&psp->ps_mtx);
489a9643ea8Slogwang }
490a9643ea8Slogwang 
491a9643ea8Slogwang /*
492a9643ea8Slogwang  * Send an interrupt to process.
493a9643ea8Slogwang  *
494a9643ea8Slogwang  * Stack is set up to allow sigcode stored
495a9643ea8Slogwang  * in u. to call routine, followed by kcall
496a9643ea8Slogwang  * to sigreturn routine below.  After sigreturn
497a9643ea8Slogwang  * resets the signal mask, the stack, and the
498a9643ea8Slogwang  * frame pointer, it returns to the user
499a9643ea8Slogwang  * specified pc, psl.
500a9643ea8Slogwang  */
501a9643ea8Slogwang static void
linux_sendsig(sig_t catcher,ksiginfo_t * ksi,sigset_t * mask)502a9643ea8Slogwang linux_sendsig(sig_t catcher, ksiginfo_t *ksi, sigset_t *mask)
503a9643ea8Slogwang {
504a9643ea8Slogwang 	struct thread *td = curthread;
505a9643ea8Slogwang 	struct proc *p = td->td_proc;
506a9643ea8Slogwang 	struct sigacts *psp;
507a9643ea8Slogwang 	struct trapframe *regs;
508a9643ea8Slogwang 	struct l_sigframe *fp, frame;
509a9643ea8Slogwang 	l_sigset_t lmask;
510a9643ea8Slogwang 	int sig, code;
511a9643ea8Slogwang 	int oonstack;
512a9643ea8Slogwang 
513a9643ea8Slogwang 	PROC_LOCK_ASSERT(p, MA_OWNED);
514a9643ea8Slogwang 	psp = p->p_sigacts;
515a9643ea8Slogwang 	sig = ksi->ksi_signo;
516a9643ea8Slogwang 	code = ksi->ksi_code;
517a9643ea8Slogwang 	mtx_assert(&psp->ps_mtx, MA_OWNED);
518a9643ea8Slogwang 	if (SIGISMEMBER(psp->ps_siginfo, sig)) {
519a9643ea8Slogwang 		/* Signal handler installed with SA_SIGINFO. */
520a9643ea8Slogwang 		linux_rt_sendsig(catcher, ksi, mask);
521a9643ea8Slogwang 		return;
522a9643ea8Slogwang 	}
523a9643ea8Slogwang 	regs = td->td_frame;
524a9643ea8Slogwang 	oonstack = sigonstack(regs->tf_esp);
525a9643ea8Slogwang 
526*22ce4affSfengbojiang 	/* Allocate space for the signal handler context. */
527a9643ea8Slogwang 	if ((td->td_pflags & TDP_ALTSTACK) && !oonstack &&
528a9643ea8Slogwang 	    SIGISMEMBER(psp->ps_sigonstack, sig)) {
529a9643ea8Slogwang 		fp = (struct l_sigframe *)((uintptr_t)td->td_sigstk.ss_sp +
530a9643ea8Slogwang 		    td->td_sigstk.ss_size - sizeof(struct l_sigframe));
531a9643ea8Slogwang 	} else
532a9643ea8Slogwang 		fp = (struct l_sigframe *)regs->tf_esp - 1;
533a9643ea8Slogwang 	mtx_unlock(&psp->ps_mtx);
534a9643ea8Slogwang 	PROC_UNLOCK(p);
535a9643ea8Slogwang 
536*22ce4affSfengbojiang 	/* Build the argument list for the signal handler. */
537a9643ea8Slogwang 	sig = bsd_to_linux_signal(sig);
538a9643ea8Slogwang 
539a9643ea8Slogwang 	bzero(&frame, sizeof(frame));
540a9643ea8Slogwang 
541a9643ea8Slogwang 	frame.sf_handler = catcher;
542a9643ea8Slogwang 	frame.sf_sig = sig;
543a9643ea8Slogwang 
544a9643ea8Slogwang 	bsd_to_linux_sigset(mask, &lmask);
545a9643ea8Slogwang 
546*22ce4affSfengbojiang 	/* Build the signal context to be used by sigreturn. */
547a9643ea8Slogwang 	frame.sf_sc.sc_mask   = lmask.__mask;
548a9643ea8Slogwang 	frame.sf_sc.sc_gs     = rgs();
549a9643ea8Slogwang 	frame.sf_sc.sc_fs     = regs->tf_fs;
550a9643ea8Slogwang 	frame.sf_sc.sc_es     = regs->tf_es;
551a9643ea8Slogwang 	frame.sf_sc.sc_ds     = regs->tf_ds;
552a9643ea8Slogwang 	frame.sf_sc.sc_edi    = regs->tf_edi;
553a9643ea8Slogwang 	frame.sf_sc.sc_esi    = regs->tf_esi;
554a9643ea8Slogwang 	frame.sf_sc.sc_ebp    = regs->tf_ebp;
555a9643ea8Slogwang 	frame.sf_sc.sc_ebx    = regs->tf_ebx;
556a9643ea8Slogwang 	frame.sf_sc.sc_esp    = regs->tf_esp;
557a9643ea8Slogwang 	frame.sf_sc.sc_edx    = regs->tf_edx;
558a9643ea8Slogwang 	frame.sf_sc.sc_ecx    = regs->tf_ecx;
559a9643ea8Slogwang 	frame.sf_sc.sc_eax    = regs->tf_eax;
560a9643ea8Slogwang 	frame.sf_sc.sc_eip    = regs->tf_eip;
561a9643ea8Slogwang 	frame.sf_sc.sc_cs     = regs->tf_cs;
562a9643ea8Slogwang 	frame.sf_sc.sc_eflags = regs->tf_eflags;
563a9643ea8Slogwang 	frame.sf_sc.sc_esp_at_signal = regs->tf_esp;
564a9643ea8Slogwang 	frame.sf_sc.sc_ss     = regs->tf_ss;
565a9643ea8Slogwang 	frame.sf_sc.sc_err    = regs->tf_err;
566a9643ea8Slogwang 	frame.sf_sc.sc_cr2    = (register_t)ksi->ksi_addr;
567a9643ea8Slogwang 	frame.sf_sc.sc_trapno = bsd_to_linux_trapcode(ksi->ksi_trapno);
568a9643ea8Slogwang 
569a9643ea8Slogwang 	frame.sf_extramask[0] = lmask.__mask;
570a9643ea8Slogwang 
571a9643ea8Slogwang 	if (copyout(&frame, fp, sizeof(frame)) != 0) {
572a9643ea8Slogwang 		/*
573a9643ea8Slogwang 		 * Process has trashed its stack; give it an illegal
574a9643ea8Slogwang 		 * instruction to halt it in its tracks.
575a9643ea8Slogwang 		 */
576a9643ea8Slogwang 		PROC_LOCK(p);
577a9643ea8Slogwang 		sigexit(td, SIGILL);
578a9643ea8Slogwang 	}
579a9643ea8Slogwang 
580*22ce4affSfengbojiang 	/* Build context to run handler in. */
581a9643ea8Slogwang 	regs->tf_esp = (int)fp;
582a9643ea8Slogwang 	regs->tf_eip = linux_sigcode;
583a9643ea8Slogwang 	regs->tf_eflags &= ~(PSL_T | PSL_VM | PSL_D);
584a9643ea8Slogwang 	regs->tf_cs = _ucodesel;
585a9643ea8Slogwang 	regs->tf_ds = _udatasel;
586a9643ea8Slogwang 	regs->tf_es = _udatasel;
587a9643ea8Slogwang 	regs->tf_fs = _udatasel;
588a9643ea8Slogwang 	regs->tf_ss = _udatasel;
589a9643ea8Slogwang 	PROC_LOCK(p);
590a9643ea8Slogwang 	mtx_lock(&psp->ps_mtx);
591a9643ea8Slogwang }
592a9643ea8Slogwang 
593a9643ea8Slogwang /*
594a9643ea8Slogwang  * System call to cleanup state after a signal
595a9643ea8Slogwang  * has been taken.  Reset signal mask and
596a9643ea8Slogwang  * stack state from context left by sendsig (above).
597a9643ea8Slogwang  * Return to previous pc and psl as specified by
598a9643ea8Slogwang  * context left by sendsig. Check carefully to
599a9643ea8Slogwang  * make sure that the user has not modified the
600a9643ea8Slogwang  * psl to gain improper privileges or to cause
601a9643ea8Slogwang  * a machine fault.
602a9643ea8Slogwang  */
603a9643ea8Slogwang int
linux_sigreturn(struct thread * td,struct linux_sigreturn_args * args)604a9643ea8Slogwang linux_sigreturn(struct thread *td, struct linux_sigreturn_args *args)
605a9643ea8Slogwang {
606a9643ea8Slogwang 	struct l_sigframe frame;
607a9643ea8Slogwang 	struct trapframe *regs;
608a9643ea8Slogwang 	l_sigset_t lmask;
609a9643ea8Slogwang 	sigset_t bmask;
610a9643ea8Slogwang 	int eflags;
611a9643ea8Slogwang 	ksiginfo_t ksi;
612a9643ea8Slogwang 
613a9643ea8Slogwang 	regs = td->td_frame;
614a9643ea8Slogwang 
615a9643ea8Slogwang 	/*
616a9643ea8Slogwang 	 * The trampoline code hands us the sigframe.
617a9643ea8Slogwang 	 * It is unsafe to keep track of it ourselves, in the event that a
618a9643ea8Slogwang 	 * program jumps out of a signal handler.
619a9643ea8Slogwang 	 */
620a9643ea8Slogwang 	if (copyin(args->sfp, &frame, sizeof(frame)) != 0)
621a9643ea8Slogwang 		return (EFAULT);
622a9643ea8Slogwang 
623*22ce4affSfengbojiang 	/* Check for security violations. */
624a9643ea8Slogwang #define	EFLAGS_SECURE(ef, oef)	((((ef) ^ (oef)) & ~PSL_USERCHANGE) == 0)
625a9643ea8Slogwang 	eflags = frame.sf_sc.sc_eflags;
626a9643ea8Slogwang 	if (!EFLAGS_SECURE(eflags, regs->tf_eflags))
627a9643ea8Slogwang 		return (EINVAL);
628a9643ea8Slogwang 
629a9643ea8Slogwang 	/*
630a9643ea8Slogwang 	 * Don't allow users to load a valid privileged %cs.  Let the
631a9643ea8Slogwang 	 * hardware check for invalid selectors, excess privilege in
632a9643ea8Slogwang 	 * other selectors, invalid %eip's and invalid %esp's.
633a9643ea8Slogwang 	 */
634a9643ea8Slogwang #define	CS_SECURE(cs)	(ISPL(cs) == SEL_UPL)
635a9643ea8Slogwang 	if (!CS_SECURE(frame.sf_sc.sc_cs)) {
636a9643ea8Slogwang 		ksiginfo_init_trap(&ksi);
637a9643ea8Slogwang 		ksi.ksi_signo = SIGBUS;
638a9643ea8Slogwang 		ksi.ksi_code = BUS_OBJERR;
639a9643ea8Slogwang 		ksi.ksi_trapno = T_PROTFLT;
640a9643ea8Slogwang 		ksi.ksi_addr = (void *)regs->tf_eip;
641a9643ea8Slogwang 		trapsignal(td, &ksi);
642a9643ea8Slogwang 		return (EINVAL);
643a9643ea8Slogwang 	}
644a9643ea8Slogwang 
645a9643ea8Slogwang 	lmask.__mask = frame.sf_sc.sc_mask;
646a9643ea8Slogwang 	linux_to_bsd_sigset(&lmask, &bmask);
647a9643ea8Slogwang 	kern_sigprocmask(td, SIG_SETMASK, &bmask, NULL, 0);
648a9643ea8Slogwang 
649*22ce4affSfengbojiang 	/* Restore signal context. */
650a9643ea8Slogwang 	/* %gs was restored by the trampoline. */
651a9643ea8Slogwang 	regs->tf_fs     = frame.sf_sc.sc_fs;
652a9643ea8Slogwang 	regs->tf_es     = frame.sf_sc.sc_es;
653a9643ea8Slogwang 	regs->tf_ds     = frame.sf_sc.sc_ds;
654a9643ea8Slogwang 	regs->tf_edi    = frame.sf_sc.sc_edi;
655a9643ea8Slogwang 	regs->tf_esi    = frame.sf_sc.sc_esi;
656a9643ea8Slogwang 	regs->tf_ebp    = frame.sf_sc.sc_ebp;
657a9643ea8Slogwang 	regs->tf_ebx    = frame.sf_sc.sc_ebx;
658a9643ea8Slogwang 	regs->tf_edx    = frame.sf_sc.sc_edx;
659a9643ea8Slogwang 	regs->tf_ecx    = frame.sf_sc.sc_ecx;
660a9643ea8Slogwang 	regs->tf_eax    = frame.sf_sc.sc_eax;
661a9643ea8Slogwang 	regs->tf_eip    = frame.sf_sc.sc_eip;
662a9643ea8Slogwang 	regs->tf_cs     = frame.sf_sc.sc_cs;
663a9643ea8Slogwang 	regs->tf_eflags = eflags;
664a9643ea8Slogwang 	regs->tf_esp    = frame.sf_sc.sc_esp_at_signal;
665a9643ea8Slogwang 	regs->tf_ss     = frame.sf_sc.sc_ss;
666a9643ea8Slogwang 
667a9643ea8Slogwang 	return (EJUSTRETURN);
668a9643ea8Slogwang }
669a9643ea8Slogwang 
670a9643ea8Slogwang /*
671a9643ea8Slogwang  * System call to cleanup state after a signal
672a9643ea8Slogwang  * has been taken.  Reset signal mask and
673a9643ea8Slogwang  * stack state from context left by rt_sendsig (above).
674a9643ea8Slogwang  * Return to previous pc and psl as specified by
675a9643ea8Slogwang  * context left by sendsig. Check carefully to
676a9643ea8Slogwang  * make sure that the user has not modified the
677a9643ea8Slogwang  * psl to gain improper privileges or to cause
678a9643ea8Slogwang  * a machine fault.
679a9643ea8Slogwang  */
680a9643ea8Slogwang int
linux_rt_sigreturn(struct thread * td,struct linux_rt_sigreturn_args * args)681a9643ea8Slogwang linux_rt_sigreturn(struct thread *td, struct linux_rt_sigreturn_args *args)
682a9643ea8Slogwang {
683a9643ea8Slogwang 	struct l_ucontext uc;
684a9643ea8Slogwang 	struct l_sigcontext *context;
685a9643ea8Slogwang 	sigset_t bmask;
686a9643ea8Slogwang 	l_stack_t *lss;
687a9643ea8Slogwang 	stack_t ss;
688a9643ea8Slogwang 	struct trapframe *regs;
689a9643ea8Slogwang 	int eflags;
690a9643ea8Slogwang 	ksiginfo_t ksi;
691a9643ea8Slogwang 
692a9643ea8Slogwang 	regs = td->td_frame;
693a9643ea8Slogwang 
694a9643ea8Slogwang 	/*
695a9643ea8Slogwang 	 * The trampoline code hands us the ucontext.
696a9643ea8Slogwang 	 * It is unsafe to keep track of it ourselves, in the event that a
697a9643ea8Slogwang 	 * program jumps out of a signal handler.
698a9643ea8Slogwang 	 */
699a9643ea8Slogwang 	if (copyin(args->ucp, &uc, sizeof(uc)) != 0)
700a9643ea8Slogwang 		return (EFAULT);
701a9643ea8Slogwang 
702a9643ea8Slogwang 	context = &uc.uc_mcontext;
703a9643ea8Slogwang 
704*22ce4affSfengbojiang 	/* Check for security violations. */
705a9643ea8Slogwang #define	EFLAGS_SECURE(ef, oef)	((((ef) ^ (oef)) & ~PSL_USERCHANGE) == 0)
706a9643ea8Slogwang 	eflags = context->sc_eflags;
707a9643ea8Slogwang 	if (!EFLAGS_SECURE(eflags, regs->tf_eflags))
708a9643ea8Slogwang 		return (EINVAL);
709a9643ea8Slogwang 
710a9643ea8Slogwang 	/*
711a9643ea8Slogwang 	 * Don't allow users to load a valid privileged %cs.  Let the
712a9643ea8Slogwang 	 * hardware check for invalid selectors, excess privilege in
713a9643ea8Slogwang 	 * other selectors, invalid %eip's and invalid %esp's.
714a9643ea8Slogwang 	 */
715a9643ea8Slogwang #define	CS_SECURE(cs)	(ISPL(cs) == SEL_UPL)
716a9643ea8Slogwang 	if (!CS_SECURE(context->sc_cs)) {
717a9643ea8Slogwang 		ksiginfo_init_trap(&ksi);
718a9643ea8Slogwang 		ksi.ksi_signo = SIGBUS;
719a9643ea8Slogwang 		ksi.ksi_code = BUS_OBJERR;
720a9643ea8Slogwang 		ksi.ksi_trapno = T_PROTFLT;
721a9643ea8Slogwang 		ksi.ksi_addr = (void *)regs->tf_eip;
722a9643ea8Slogwang 		trapsignal(td, &ksi);
723a9643ea8Slogwang 		return (EINVAL);
724a9643ea8Slogwang 	}
725a9643ea8Slogwang 
726a9643ea8Slogwang 	linux_to_bsd_sigset(&uc.uc_sigmask, &bmask);
727a9643ea8Slogwang 	kern_sigprocmask(td, SIG_SETMASK, &bmask, NULL, 0);
728a9643ea8Slogwang 
729*22ce4affSfengbojiang 	/* Restore signal context. */
730a9643ea8Slogwang 	/* %gs was restored by the trampoline. */
731a9643ea8Slogwang 	regs->tf_fs     = context->sc_fs;
732a9643ea8Slogwang 	regs->tf_es     = context->sc_es;
733a9643ea8Slogwang 	regs->tf_ds     = context->sc_ds;
734a9643ea8Slogwang 	regs->tf_edi    = context->sc_edi;
735a9643ea8Slogwang 	regs->tf_esi    = context->sc_esi;
736a9643ea8Slogwang 	regs->tf_ebp    = context->sc_ebp;
737a9643ea8Slogwang 	regs->tf_ebx    = context->sc_ebx;
738a9643ea8Slogwang 	regs->tf_edx    = context->sc_edx;
739a9643ea8Slogwang 	regs->tf_ecx    = context->sc_ecx;
740a9643ea8Slogwang 	regs->tf_eax    = context->sc_eax;
741a9643ea8Slogwang 	regs->tf_eip    = context->sc_eip;
742a9643ea8Slogwang 	regs->tf_cs     = context->sc_cs;
743a9643ea8Slogwang 	regs->tf_eflags = eflags;
744a9643ea8Slogwang 	regs->tf_esp    = context->sc_esp_at_signal;
745a9643ea8Slogwang 	regs->tf_ss     = context->sc_ss;
746a9643ea8Slogwang 
747*22ce4affSfengbojiang 	/* Call sigaltstack & ignore results. */
748a9643ea8Slogwang 	lss = &uc.uc_stack;
749a9643ea8Slogwang 	ss.ss_sp = lss->ss_sp;
750a9643ea8Slogwang 	ss.ss_size = lss->ss_size;
751a9643ea8Slogwang 	ss.ss_flags = linux_to_bsd_sigaltstack(lss->ss_flags);
752a9643ea8Slogwang 
753a9643ea8Slogwang 	(void)kern_sigaltstack(td, &ss, NULL);
754a9643ea8Slogwang 
755a9643ea8Slogwang 	return (EJUSTRETURN);
756a9643ea8Slogwang }
757a9643ea8Slogwang 
758a9643ea8Slogwang static int
linux_fetch_syscall_args(struct thread * td)759*22ce4affSfengbojiang linux_fetch_syscall_args(struct thread *td)
760a9643ea8Slogwang {
761a9643ea8Slogwang 	struct proc *p;
762a9643ea8Slogwang 	struct trapframe *frame;
763*22ce4affSfengbojiang 	struct syscall_args *sa;
764a9643ea8Slogwang 
765a9643ea8Slogwang 	p = td->td_proc;
766a9643ea8Slogwang 	frame = td->td_frame;
767*22ce4affSfengbojiang 	sa = &td->td_sa;
768a9643ea8Slogwang 
769a9643ea8Slogwang 	sa->code = frame->tf_eax;
770a9643ea8Slogwang 	sa->args[0] = frame->tf_ebx;
771a9643ea8Slogwang 	sa->args[1] = frame->tf_ecx;
772a9643ea8Slogwang 	sa->args[2] = frame->tf_edx;
773a9643ea8Slogwang 	sa->args[3] = frame->tf_esi;
774a9643ea8Slogwang 	sa->args[4] = frame->tf_edi;
775a9643ea8Slogwang 	sa->args[5] = frame->tf_ebp;	/* Unconfirmed */
776a9643ea8Slogwang 
777a9643ea8Slogwang 	if (sa->code >= p->p_sysent->sv_size)
778a9643ea8Slogwang 		/* nosys */
779a9643ea8Slogwang 		sa->callp = &p->p_sysent->sv_table[p->p_sysent->sv_size - 1];
780a9643ea8Slogwang 	else
781a9643ea8Slogwang 		sa->callp = &p->p_sysent->sv_table[sa->code];
782a9643ea8Slogwang 
783a9643ea8Slogwang 	td->td_retval[0] = 0;
784a9643ea8Slogwang 	td->td_retval[1] = frame->tf_edx;
785a9643ea8Slogwang 
786a9643ea8Slogwang 	return (0);
787a9643ea8Slogwang }
788a9643ea8Slogwang 
789*22ce4affSfengbojiang static void
linux_set_syscall_retval(struct thread * td,int error)790*22ce4affSfengbojiang linux_set_syscall_retval(struct thread *td, int error)
791a9643ea8Slogwang {
792*22ce4affSfengbojiang 	struct trapframe *frame = td->td_frame;
793a9643ea8Slogwang 
794*22ce4affSfengbojiang 	cpu_set_syscall_retval(td, error);
795*22ce4affSfengbojiang 
796*22ce4affSfengbojiang 	if (__predict_false(error != 0)) {
797*22ce4affSfengbojiang 		if (error != ERESTART && error != EJUSTRETURN)
798*22ce4affSfengbojiang 			frame->tf_eax = bsd_to_linux_errno(error);
799a9643ea8Slogwang 	}
800a9643ea8Slogwang }
801a9643ea8Slogwang 
802a9643ea8Slogwang /*
803a9643ea8Slogwang  * exec_setregs may initialize some registers differently than Linux
804a9643ea8Slogwang  * does, thus potentially confusing Linux binaries. If necessary, we
805a9643ea8Slogwang  * override the exec_setregs default(s) here.
806a9643ea8Slogwang  */
807a9643ea8Slogwang static void
linux_exec_setregs(struct thread * td,struct image_params * imgp,uintptr_t stack)808*22ce4affSfengbojiang linux_exec_setregs(struct thread *td, struct image_params *imgp,
809*22ce4affSfengbojiang     uintptr_t stack)
810a9643ea8Slogwang {
811a9643ea8Slogwang 	struct pcb *pcb = td->td_pcb;
812a9643ea8Slogwang 
813a9643ea8Slogwang 	exec_setregs(td, imgp, stack);
814a9643ea8Slogwang 
815*22ce4affSfengbojiang 	/* Linux sets %gs to 0, we default to _udatasel. */
816a9643ea8Slogwang 	pcb->pcb_gs = 0;
817a9643ea8Slogwang 	load_gs(0);
818a9643ea8Slogwang 
819a9643ea8Slogwang 	pcb->pcb_initial_npxcw = __LINUX_NPXCW__;
820a9643ea8Slogwang }
821a9643ea8Slogwang 
822a9643ea8Slogwang static void
linux_get_machine(const char ** dst)823a9643ea8Slogwang linux_get_machine(const char **dst)
824a9643ea8Slogwang {
825a9643ea8Slogwang 
826a9643ea8Slogwang 	switch (cpu_class) {
827a9643ea8Slogwang 	case CPUCLASS_686:
828a9643ea8Slogwang 		*dst = "i686";
829a9643ea8Slogwang 		break;
830a9643ea8Slogwang 	case CPUCLASS_586:
831a9643ea8Slogwang 		*dst = "i586";
832a9643ea8Slogwang 		break;
833a9643ea8Slogwang 	case CPUCLASS_486:
834a9643ea8Slogwang 		*dst = "i486";
835a9643ea8Slogwang 		break;
836a9643ea8Slogwang 	default:
837a9643ea8Slogwang 		*dst = "i386";
838a9643ea8Slogwang 	}
839a9643ea8Slogwang }
840a9643ea8Slogwang 
841a9643ea8Slogwang struct sysentvec linux_sysvec = {
842a9643ea8Slogwang 	.sv_size	= LINUX_SYS_MAXSYSCALL,
843a9643ea8Slogwang 	.sv_table	= linux_sysent,
844*22ce4affSfengbojiang 	.sv_transtrap	= linux_translate_traps,
845a9643ea8Slogwang 	.sv_fixup	= linux_fixup,
846a9643ea8Slogwang 	.sv_sendsig	= linux_sendsig,
847a9643ea8Slogwang 	.sv_sigcode	= &_binary_linux_locore_o_start,
848a9643ea8Slogwang 	.sv_szsigcode	= &linux_szsigcode,
849a9643ea8Slogwang 	.sv_name	= "Linux a.out",
850a9643ea8Slogwang 	.sv_coredump	= NULL,
851*22ce4affSfengbojiang 	.sv_imgact_try	= linux_exec_imgact_try,
852a9643ea8Slogwang 	.sv_minsigstksz	= LINUX_MINSIGSTKSZ,
853a9643ea8Slogwang 	.sv_minuser	= VM_MIN_ADDRESS,
854a9643ea8Slogwang 	.sv_maxuser	= VM_MAXUSER_ADDRESS,
855a9643ea8Slogwang 	.sv_usrstack	= LINUX_USRSTACK,
856a9643ea8Slogwang 	.sv_psstrings	= PS_STRINGS,
857a9643ea8Slogwang 	.sv_stackprot	= VM_PROT_ALL,
858a9643ea8Slogwang 	.sv_copyout_strings = exec_copyout_strings,
859*22ce4affSfengbojiang 	.sv_setregs	= linux_exec_setregs,
860a9643ea8Slogwang 	.sv_fixlimit	= NULL,
861a9643ea8Slogwang 	.sv_maxssiz	= NULL,
862a9643ea8Slogwang 	.sv_flags	= SV_ABI_LINUX | SV_AOUT | SV_IA32 | SV_ILP32,
863*22ce4affSfengbojiang 	.sv_set_syscall_retval = linux_set_syscall_retval,
864a9643ea8Slogwang 	.sv_fetch_syscall_args = linux_fetch_syscall_args,
865a9643ea8Slogwang 	.sv_syscallnames = NULL,
866a9643ea8Slogwang 	.sv_shared_page_base = LINUX_SHAREDPAGE,
867a9643ea8Slogwang 	.sv_shared_page_len = PAGE_SIZE,
868a9643ea8Slogwang 	.sv_schedtail	= linux_schedtail,
869a9643ea8Slogwang 	.sv_thread_detach = linux_thread_detach,
870a9643ea8Slogwang 	.sv_trap	= NULL,
871*22ce4affSfengbojiang 	.sv_onexec	= linux_on_exec,
872*22ce4affSfengbojiang 	.sv_onexit	= linux_on_exit,
873*22ce4affSfengbojiang 	.sv_ontdexit	= linux_thread_dtor,
874a9643ea8Slogwang };
875a9643ea8Slogwang INIT_SYSENTVEC(aout_sysvec, &linux_sysvec);
876a9643ea8Slogwang 
877a9643ea8Slogwang struct sysentvec elf_linux_sysvec = {
878a9643ea8Slogwang 	.sv_size	= LINUX_SYS_MAXSYSCALL,
879a9643ea8Slogwang 	.sv_table	= linux_sysent,
880*22ce4affSfengbojiang 	.sv_transtrap	= linux_translate_traps,
881*22ce4affSfengbojiang 	.sv_fixup	= linux_fixup_elf,
882a9643ea8Slogwang 	.sv_sendsig	= linux_sendsig,
883a9643ea8Slogwang 	.sv_sigcode	= &_binary_linux_locore_o_start,
884a9643ea8Slogwang 	.sv_szsigcode	= &linux_szsigcode,
885*22ce4affSfengbojiang 	.sv_name	= "Linux ELF32",
886a9643ea8Slogwang 	.sv_coredump	= elf32_coredump,
887*22ce4affSfengbojiang 	.sv_imgact_try	= linux_exec_imgact_try,
888a9643ea8Slogwang 	.sv_minsigstksz	= LINUX_MINSIGSTKSZ,
889a9643ea8Slogwang 	.sv_minuser	= VM_MIN_ADDRESS,
890a9643ea8Slogwang 	.sv_maxuser	= VM_MAXUSER_ADDRESS,
891a9643ea8Slogwang 	.sv_usrstack	= LINUX_USRSTACK,
892a9643ea8Slogwang 	.sv_psstrings	= LINUX_PS_STRINGS,
893a9643ea8Slogwang 	.sv_stackprot	= VM_PROT_ALL,
894*22ce4affSfengbojiang 	.sv_copyout_auxargs = linux_copyout_auxargs,
895a9643ea8Slogwang 	.sv_copyout_strings = linux_copyout_strings,
896*22ce4affSfengbojiang 	.sv_setregs	= linux_exec_setregs,
897a9643ea8Slogwang 	.sv_fixlimit	= NULL,
898a9643ea8Slogwang 	.sv_maxssiz	= NULL,
899a9643ea8Slogwang 	.sv_flags	= SV_ABI_LINUX | SV_IA32 | SV_ILP32 | SV_SHP,
900*22ce4affSfengbojiang 	.sv_set_syscall_retval = linux_set_syscall_retval,
901a9643ea8Slogwang 	.sv_fetch_syscall_args = linux_fetch_syscall_args,
902a9643ea8Slogwang 	.sv_syscallnames = NULL,
903a9643ea8Slogwang 	.sv_shared_page_base = LINUX_SHAREDPAGE,
904a9643ea8Slogwang 	.sv_shared_page_len = PAGE_SIZE,
905a9643ea8Slogwang 	.sv_schedtail	= linux_schedtail,
906a9643ea8Slogwang 	.sv_thread_detach = linux_thread_detach,
907a9643ea8Slogwang 	.sv_trap	= NULL,
908*22ce4affSfengbojiang 	.sv_onexec	= linux_on_exec,
909*22ce4affSfengbojiang 	.sv_onexit	= linux_on_exit,
910*22ce4affSfengbojiang 	.sv_ontdexit	= linux_thread_dtor,
911a9643ea8Slogwang };
912a9643ea8Slogwang 
913a9643ea8Slogwang static void
linux_vdso_install(void * param)914a9643ea8Slogwang linux_vdso_install(void *param)
915a9643ea8Slogwang {
916a9643ea8Slogwang 
917a9643ea8Slogwang 	linux_szsigcode = (&_binary_linux_locore_o_end -
918a9643ea8Slogwang 	    &_binary_linux_locore_o_start);
919a9643ea8Slogwang 
920a9643ea8Slogwang 	if (linux_szsigcode > elf_linux_sysvec.sv_shared_page_len)
921a9643ea8Slogwang 		panic("Linux invalid vdso size\n");
922a9643ea8Slogwang 
923a9643ea8Slogwang 	__elfN(linux_vdso_fixup)(&elf_linux_sysvec);
924a9643ea8Slogwang 
925a9643ea8Slogwang 	linux_shared_page_obj = __elfN(linux_shared_page_init)
926a9643ea8Slogwang 	    (&linux_shared_page_mapping);
927a9643ea8Slogwang 
928*22ce4affSfengbojiang 	__elfN(linux_vdso_reloc)(&elf_linux_sysvec);
929a9643ea8Slogwang 
930a9643ea8Slogwang 	bcopy(elf_linux_sysvec.sv_sigcode, linux_shared_page_mapping,
931a9643ea8Slogwang 	    linux_szsigcode);
932a9643ea8Slogwang 	elf_linux_sysvec.sv_shared_page_obj = linux_shared_page_obj;
933a9643ea8Slogwang }
934a9643ea8Slogwang SYSINIT(elf_linux_vdso_init, SI_SUB_EXEC, SI_ORDER_ANY,
935*22ce4affSfengbojiang     linux_vdso_install, NULL);
936a9643ea8Slogwang 
937a9643ea8Slogwang static void
linux_vdso_deinstall(void * param)938a9643ea8Slogwang linux_vdso_deinstall(void *param)
939a9643ea8Slogwang {
940a9643ea8Slogwang 
941a9643ea8Slogwang 	__elfN(linux_shared_page_fini)(linux_shared_page_obj);
942*22ce4affSfengbojiang }
943a9643ea8Slogwang SYSUNINIT(elf_linux_vdso_uninit, SI_SUB_EXEC, SI_ORDER_FIRST,
944*22ce4affSfengbojiang     linux_vdso_deinstall, NULL);
945a9643ea8Slogwang 
946a9643ea8Slogwang static char GNU_ABI_VENDOR[] = "GNU";
947a9643ea8Slogwang static int GNULINUX_ABI_DESC = 0;
948a9643ea8Slogwang 
949*22ce4affSfengbojiang static bool
linux_trans_osrel(const Elf_Note * note,int32_t * osrel)950a9643ea8Slogwang linux_trans_osrel(const Elf_Note *note, int32_t *osrel)
951a9643ea8Slogwang {
952a9643ea8Slogwang 	const Elf32_Word *desc;
953a9643ea8Slogwang 	uintptr_t p;
954a9643ea8Slogwang 
955a9643ea8Slogwang 	p = (uintptr_t)(note + 1);
956a9643ea8Slogwang 	p += roundup2(note->n_namesz, sizeof(Elf32_Addr));
957a9643ea8Slogwang 
958a9643ea8Slogwang 	desc = (const Elf32_Word *)p;
959a9643ea8Slogwang 	if (desc[0] != GNULINUX_ABI_DESC)
960*22ce4affSfengbojiang 		return (false);
961a9643ea8Slogwang 
962a9643ea8Slogwang 	/*
963*22ce4affSfengbojiang 	 * For Linux we encode osrel using the Linux convention of
964*22ce4affSfengbojiang 	 * 	(version << 16) | (major << 8) | (minor)
965*22ce4affSfengbojiang 	 * See macro in linux_mib.h
966a9643ea8Slogwang 	 */
967*22ce4affSfengbojiang 	*osrel = LINUX_KERNVER(desc[1], desc[2], desc[3]);
968a9643ea8Slogwang 
969*22ce4affSfengbojiang 	return (true);
970a9643ea8Slogwang }
971a9643ea8Slogwang 
972a9643ea8Slogwang static Elf_Brandnote linux_brandnote = {
973a9643ea8Slogwang 	.hdr.n_namesz	= sizeof(GNU_ABI_VENDOR),
974a9643ea8Slogwang 	.hdr.n_descsz	= 16,	/* XXX at least 16 */
975a9643ea8Slogwang 	.hdr.n_type	= 1,
976a9643ea8Slogwang 	.vendor		= GNU_ABI_VENDOR,
977a9643ea8Slogwang 	.flags		= BN_TRANSLATE_OSREL,
978a9643ea8Slogwang 	.trans_osrel	= linux_trans_osrel
979a9643ea8Slogwang };
980a9643ea8Slogwang 
981a9643ea8Slogwang static Elf32_Brandinfo linux_brand = {
982a9643ea8Slogwang 	.brand		= ELFOSABI_LINUX,
983a9643ea8Slogwang 	.machine	= EM_386,
984a9643ea8Slogwang 	.compat_3_brand	= "Linux",
985*22ce4affSfengbojiang 	.emul_path	= linux_emul_path,
986a9643ea8Slogwang 	.interp_path	= "/lib/ld-linux.so.1",
987a9643ea8Slogwang 	.sysvec		= &elf_linux_sysvec,
988a9643ea8Slogwang 	.interp_newpath	= NULL,
989a9643ea8Slogwang 	.brand_note	= &linux_brandnote,
990a9643ea8Slogwang 	.flags		= BI_CAN_EXEC_DYN | BI_BRAND_NOTE
991a9643ea8Slogwang };
992a9643ea8Slogwang 
993a9643ea8Slogwang static Elf32_Brandinfo linux_glibc2brand = {
994a9643ea8Slogwang 	.brand		= ELFOSABI_LINUX,
995a9643ea8Slogwang 	.machine	= EM_386,
996a9643ea8Slogwang 	.compat_3_brand	= "Linux",
997*22ce4affSfengbojiang 	.emul_path	= linux_emul_path,
998a9643ea8Slogwang 	.interp_path	= "/lib/ld-linux.so.2",
999a9643ea8Slogwang 	.sysvec		= &elf_linux_sysvec,
1000a9643ea8Slogwang 	.interp_newpath	= NULL,
1001a9643ea8Slogwang 	.brand_note	= &linux_brandnote,
1002a9643ea8Slogwang 	.flags		= BI_CAN_EXEC_DYN | BI_BRAND_NOTE
1003a9643ea8Slogwang };
1004a9643ea8Slogwang 
1005*22ce4affSfengbojiang static Elf32_Brandinfo linux_muslbrand = {
1006*22ce4affSfengbojiang 	.brand		= ELFOSABI_LINUX,
1007*22ce4affSfengbojiang 	.machine	= EM_386,
1008*22ce4affSfengbojiang 	.compat_3_brand	= "Linux",
1009*22ce4affSfengbojiang 	.emul_path	= linux_emul_path,
1010*22ce4affSfengbojiang 	.interp_path	= "/lib/ld-musl-i386.so.1",
1011*22ce4affSfengbojiang 	.sysvec		= &elf_linux_sysvec,
1012*22ce4affSfengbojiang 	.interp_newpath	= NULL,
1013*22ce4affSfengbojiang 	.brand_note	= &linux_brandnote,
1014*22ce4affSfengbojiang 	.flags		= BI_CAN_EXEC_DYN | BI_BRAND_NOTE
1015*22ce4affSfengbojiang };
1016*22ce4affSfengbojiang 
1017a9643ea8Slogwang Elf32_Brandinfo *linux_brandlist[] = {
1018a9643ea8Slogwang 	&linux_brand,
1019a9643ea8Slogwang 	&linux_glibc2brand,
1020*22ce4affSfengbojiang 	&linux_muslbrand,
1021a9643ea8Slogwang 	NULL
1022a9643ea8Slogwang };
1023a9643ea8Slogwang 
1024a9643ea8Slogwang static int
linux_elf_modevent(module_t mod,int type,void * data)1025a9643ea8Slogwang linux_elf_modevent(module_t mod, int type, void *data)
1026a9643ea8Slogwang {
1027a9643ea8Slogwang 	Elf32_Brandinfo **brandinfo;
1028a9643ea8Slogwang 	int error;
1029a9643ea8Slogwang 	struct linux_ioctl_handler **lihp;
1030a9643ea8Slogwang 
1031a9643ea8Slogwang 	error = 0;
1032a9643ea8Slogwang 
1033a9643ea8Slogwang 	switch(type) {
1034a9643ea8Slogwang 	case MOD_LOAD:
1035a9643ea8Slogwang 		for (brandinfo = &linux_brandlist[0]; *brandinfo != NULL;
1036a9643ea8Slogwang 		     ++brandinfo)
1037a9643ea8Slogwang 			if (elf32_insert_brand_entry(*brandinfo) < 0)
1038a9643ea8Slogwang 				error = EINVAL;
1039a9643ea8Slogwang 		if (error == 0) {
1040a9643ea8Slogwang 			SET_FOREACH(lihp, linux_ioctl_handler_set)
1041a9643ea8Slogwang 				linux_ioctl_register_handler(*lihp);
1042a9643ea8Slogwang 			LIST_INIT(&futex_list);
1043a9643ea8Slogwang 			mtx_init(&futex_mtx, "ftllk", NULL, MTX_DEF);
1044a9643ea8Slogwang 			linux_get_machine(&linux_kplatform);
1045a9643ea8Slogwang 			linux_szplatform = roundup(strlen(linux_kplatform) + 1,
1046a9643ea8Slogwang 			    sizeof(char *));
1047*22ce4affSfengbojiang 			linux_dev_shm_create();
1048a9643ea8Slogwang 			linux_osd_jail_register();
1049a9643ea8Slogwang 			stclohz = (stathz ? stathz : hz);
1050a9643ea8Slogwang 			if (bootverbose)
1051a9643ea8Slogwang 				printf("Linux ELF exec handler installed\n");
1052a9643ea8Slogwang 		} else
1053a9643ea8Slogwang 			printf("cannot insert Linux ELF brand handler\n");
1054a9643ea8Slogwang 		break;
1055a9643ea8Slogwang 	case MOD_UNLOAD:
1056a9643ea8Slogwang 		for (brandinfo = &linux_brandlist[0]; *brandinfo != NULL;
1057a9643ea8Slogwang 		     ++brandinfo)
1058a9643ea8Slogwang 			if (elf32_brand_inuse(*brandinfo))
1059a9643ea8Slogwang 				error = EBUSY;
1060a9643ea8Slogwang 		if (error == 0) {
1061a9643ea8Slogwang 			for (brandinfo = &linux_brandlist[0];
1062a9643ea8Slogwang 			     *brandinfo != NULL; ++brandinfo)
1063a9643ea8Slogwang 				if (elf32_remove_brand_entry(*brandinfo) < 0)
1064a9643ea8Slogwang 					error = EINVAL;
1065a9643ea8Slogwang 		}
1066a9643ea8Slogwang 		if (error == 0) {
1067a9643ea8Slogwang 			SET_FOREACH(lihp, linux_ioctl_handler_set)
1068a9643ea8Slogwang 				linux_ioctl_unregister_handler(*lihp);
1069a9643ea8Slogwang 			mtx_destroy(&futex_mtx);
1070*22ce4affSfengbojiang 			linux_dev_shm_destroy();
1071a9643ea8Slogwang 			linux_osd_jail_deregister();
1072a9643ea8Slogwang 			if (bootverbose)
1073a9643ea8Slogwang 				printf("Linux ELF exec handler removed\n");
1074a9643ea8Slogwang 		} else
1075a9643ea8Slogwang 			printf("Could not deinstall ELF interpreter entry\n");
1076a9643ea8Slogwang 		break;
1077a9643ea8Slogwang 	default:
1078a9643ea8Slogwang 		return (EOPNOTSUPP);
1079a9643ea8Slogwang 	}
1080a9643ea8Slogwang 	return (error);
1081a9643ea8Slogwang }
1082a9643ea8Slogwang 
1083a9643ea8Slogwang static moduledata_t linux_elf_mod = {
1084a9643ea8Slogwang 	"linuxelf",
1085a9643ea8Slogwang 	linux_elf_modevent,
1086a9643ea8Slogwang 	0
1087a9643ea8Slogwang };
1088a9643ea8Slogwang 
1089a9643ea8Slogwang DECLARE_MODULE_TIED(linuxelf, linux_elf_mod, SI_SUB_EXEC, SI_ORDER_ANY);
1090a9643ea8Slogwang FEATURE(linux, "Linux 32bit support");
1091