2 * SPDX-License-Identifier: BSD-2-Clause
4 * Copyright (c) 1994-1996 Søren Schmidt
5 * Copyright (c) 2006 Roman Divacky
7 * Copyright (c) 2013 Dmitry Chagin <dchagin@FreeBSD.org>
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
18 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
22 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
34 #include <sys/param.h>
35 #include <sys/fcntl.h>
36 #include <sys/imgact.h>
39 #include <sys/malloc.h>
40 #include <sys/mutex.h>
42 #include <sys/resourcevar.h>
44 #include <sys/syscallsubr.h>
45 #include <sys/sysent.h>
47 #include <compat/linux/linux_emul.h>
48 #include <compat/linux/linux_mib.h>
49 #include <compat/linux/linux_misc.h>
50 #include <compat/linux/linux_persona.h>
51 #include <compat/linux/linux_util.h>
/*
 * SHELLMAGIC: the characters '#' (0x23) and '!' (0x21) packed into one
 * 16-bit constant.  The value chosen depends on BYTE_ORDER: 0x2123 when it
 * is LITTLE_ENDIAN, 0x2321 in the other definition.
 */
53 #if BYTE_ORDER == LITTLE_ENDIAN
54 #define SHELLMAGIC 0x2123 /* #! */
56 #define SHELLMAGIC 0x2321
60 * This returns a reference to the thread emuldata entry (if found)
62 * Hold PROC_LOCK when referencing emuldata from other threads.
/*
 * Look up the Linux per-thread emulation data (struct linux_emuldata)
 * belonging to td.
 * NOTE(review): the lookup statement is not visible in this block;
 * presumably it reads td->td_emuldata, the field linux_proc_init()
 * stores into -- confirm.
 */
64 struct linux_emuldata *
65 em_find(struct thread *td)
67 struct linux_emuldata *em;
75 * This returns a reference to the proc pemuldata entry (if found)
77 * Hold PROC_LOCK when referencing proc pemuldata from other threads.
78 * Hold LINUX_PEM_LOCK when referencing pemuldata members.
80 struct linux_pemuldata *
81 pem_find(struct proc *p)
83 struct linux_pemuldata *pem;
91 * Linux apps generally expect the soft open file limit to be set
92 * to 1024, often iterating over all the file descriptors up to that
93 * limit instead of using closefrom(2). Give them what they want,
94 * unless there already is a resource limit in place.
/*
 * Set the soft RLIMIT_NOFILE limit of process p to
 * linux_default_openfiles.
 *
 * td - thread handed through to kern_proc_setrlimit().
 * p  - process whose limit is read with lim_rlimit_proc() and updated.
 *
 * Two tests precede the update: linux_default_openfiles < 0, and
 * (soft limit != hard limit || soft limit <= linux_default_openfiles).
 * NOTE(review): the statements guarded by those tests are not visible
 * here; presumably each is an early return that leaves the limit
 * untouched, so the update only happens when no separate soft limit is
 * in place and it would lower the value -- confirm.
 */
97 linux_set_default_openfiles(struct thread *td, struct proc *p)
100 int error __diagused;
102 if (linux_default_openfiles < 0)
106 lim_rlimit_proc(p, RLIMIT_NOFILE, &rlim);
108 if (rlim.rlim_cur != rlim.rlim_max ||
109 rlim.rlim_cur <= linux_default_openfiles)
/* Only the soft limit is changed; rlim_max keeps the value just read. */
111 rlim.rlim_cur = linux_default_openfiles;
112 error = kern_proc_setrlimit(td, p, RLIMIT_NOFILE, &rlim);
/* error is examined by this assertion only. */
113 KASSERT(error == 0, ("kern_proc_setrlimit failed"));
117 * The default stack size limit in Linux is 8MB.
/*
 * Set the soft RLIMIT_STACK limit of process p to
 * linux_default_stacksize.
 *
 * td - thread handed through to kern_proc_setrlimit().
 * p  - process whose limit is read with lim_rlimit_proc() and updated.
 *
 * Two tests precede the update: linux_default_stacksize < 0, and
 * (soft limit != hard limit || soft limit <= linux_default_stacksize).
 * NOTE(review): the statements guarded by those tests are not visible
 * here; presumably each is an early return that leaves the limit
 * untouched -- confirm.
 */
120 linux_set_default_stacksize(struct thread *td, struct proc *p)
123 int error __diagused;
125 if (linux_default_stacksize < 0)
129 lim_rlimit_proc(p, RLIMIT_STACK, &rlim);
131 if (rlim.rlim_cur != rlim.rlim_max ||
132 rlim.rlim_cur <= linux_default_stacksize)
/* Only the soft limit is changed; rlim_max keeps the value just read. */
134 rlim.rlim_cur = linux_default_stacksize;
135 error = kern_proc_setrlimit(td, p, RLIMIT_STACK, &rlim);
/* error is examined by this assertion only. */
136 KASSERT(error == 0, ("kern_proc_setrlimit failed"));
/*
 * Create, or reset, the Linux emulation data of a thread and its process.
 *
 * td          - calling thread; passed to the default-limit helpers.
 * newtd       - thread that receives a newly allocated linux_emuldata in
 *               td_emuldata.  linux_on_exec() passes NULL when the
 *               process was already a Linux one.
 * init_thread - NOTE(review): presumably selects the "thread" case
 *               (em_tid = newtd->td_tid) over the "fork" case
 *               (em_tid = p->p_pid plus a new linux_pemuldata with its
 *               pem_sx lock initialised); the test itself is not visible
 *               here -- confirm.
 *
 * Allocating path: em comes from M_TEMP and pem from M_LINUX, both with
 * M_WAITOK | M_ZERO; afterwards the default open-files and stack-size
 * limits are applied to p.
 *
 * "exec" path: the existing em and pem are asserted to be non-NULL, then
 * em_tid is set to p->p_pid, robust_futexes, child_clear_tid and
 * child_set_tid are set to NULL, and pem->oom_score_adj is set to 0.
 * NOTE(review): the condition choosing between the two paths, the
 * assignment of p, and the em/pem lookups are not visible here;
 * presumably the split is on newtd != NULL -- confirm.
 */
140 linux_proc_init(struct thread *td, struct thread *newtd, bool init_thread)
142 struct linux_emuldata *em;
143 struct linux_pemuldata *pem;
150 em = malloc(sizeof(*em), M_TEMP, M_WAITOK | M_ZERO);
152 LINUX_CTR1(proc_init, "thread newtd(%d)",
155 em->em_tid = newtd->td_tid;
157 LINUX_CTR1(proc_init, "fork newtd(%d)", p->p_pid);
159 em->em_tid = p->p_pid;
161 pem = malloc(sizeof(*pem), M_LINUX, M_WAITOK | M_ZERO);
162 sx_init(&pem->pem_sx, "lpemlk");
165 newtd->td_emuldata = em;
167 linux_set_default_openfiles(td, p);
168 linux_set_default_stacksize(td, p);
173 LINUX_CTR1(proc_init, "exec newtd(%d)", p->p_pid);
175 /* lookup the old one */
177 KASSERT(em != NULL, ("proc_init: thread emuldata not found.\n"));
179 em->em_tid = p->p_pid;
181 em->robust_futexes = NULL;
182 em->child_clear_tid = NULL;
183 em->child_set_tid = NULL;
186 KASSERT(pem != NULL, ("proc_init: proc emuldata not found.\n"));
188 pem->oom_score_adj = 0;
/*
 * Exit-time teardown of the Linux emulation state of process p.
 *
 * p - exiting process; the current process ABI is asserted to be
 *     SV_ABI_LINUX.
 *
 * Visible steps, in order: trace the thread/process ids, call the
 * sysent's sv_thread_detach hook on curthread, set p->p_emuldata to
 * NULL, and destroy the pem_sx lock of the detached pemuldata.
 * NOTE(review): how pem is obtained, any test on it, and the release of
 * its memory are not visible here -- confirm.
 */
193 linux_on_exit(struct proc *p)
195 struct linux_pemuldata *pem;
196 struct thread *td = curthread;
198 MPASS(SV_CURPROC_ABI() == SV_ABI_LINUX);
200 LINUX_CTR3(proc_exit, "thread(%d) proc(%d) p %p",
201 td->td_tid, p->p_pid, p);
206 (p->p_sysent->sv_thread_detach)(td);
208 p->p_emuldata = NULL;
210 sx_destroy(&pem->pem_sx);
/*
 * Perform an execve on behalf of a Linux thread and detach the Linux
 * emulation state when the new image is not a Linux binary.
 *
 * td    - thread performing the exec.
 * eargs - image arguments handed to kern_execve().
 *
 * Calls pre_execve(), kern_execve() and post_execve() in that order,
 * then tests "error != EJUSTRETURN".  If SV_CURPROC_ABI() is no longer
 * SV_ABI_LINUX, the ABI root directory is cleared with
 * linux_pwd_onexec_native() and both td->td_emuldata and p->p_emuldata
 * are set to NULL.  The only visible return value is EJUSTRETURN.
 * NOTE(review): the statements guarded by the pre_execve() result and by
 * "error != EJUSTRETURN", the em/pem lookups, and the release of the
 * detached em/pem are not visible here; presumably the guards return
 * error early and the detached structures are freed -- confirm.
 */
215 linux_common_execve(struct thread *td, struct image_args *eargs)
217 struct linux_pemuldata *pem;
218 struct vmspace *oldvmspace;
219 struct linux_emuldata *em;
225 error = pre_execve(td, &oldvmspace);
229 error = kern_execve(td, eargs, NULL, oldvmspace);
/* post_execve() is given the kern_execve() result, whatever it is. */
230 post_execve(td, error, oldvmspace);
231 if (error != EJUSTRETURN)
235 * In a case of transition from Linux binary execing to
236 * FreeBSD binary we destroy Linux emuldata thread & proc entries.
238 if (SV_CURPROC_ABI() != SV_ABI_LINUX) {
240 /* Clear ABI root directory if set. */
241 linux_pwd_onexec_native(td);
245 KASSERT(em != NULL, ("proc_exec: thread emuldata not found.\n"));
246 td->td_emuldata = NULL;
249 KASSERT(pem != NULL, ("proc_exec: proc pemuldata not found.\n"));
250 p->p_emuldata = NULL;
256 return (EJUSTRETURN);
/*
 * Exec hook for an image whose sysent is a Linux ABI (asserted with
 * MPASS on imgp->sysent->sv_flags).
 *
 * p    - process being exec'ed; SV_PROC_ABI(p) selects the path.
 * imgp - image parameters; sysent->sv_flags and stack_prot are read.
 *
 * If p is already a Linux process, linux_proc_init(td, NULL, false)
 * resets the existing emuldata.  When the process is being switched to
 * the emulator instead, linux_proc_init(td, td, false) is called for
 * the exec'ing thread, linux_proc_init(td, othertd, true) is called
 * inside a loop over the threads of td->td_proc, and linux_pwd_onexec()
 * sets the ABI root directory.
 * On amd64 only, an SV_ILP32 process whose image stack protection
 * includes VM_PROT_EXECUTE gets LINUX_READ_IMPLIES_EXEC or'ed into
 * pem->persona.
 * NOTE(review): how td and pem are obtained, whether the thread loop
 * skips td itself, and all return statements (including the one for a
 * non-zero linux_pwd_onexec() result) are not visible here -- confirm.
 */
260 linux_on_exec(struct proc *p, struct image_params *imgp)
263 struct thread *othertd;
264 #if defined(__amd64__)
265 struct linux_pemuldata *pem;
270 MPASS((imgp->sysent->sv_flags & SV_ABI_MASK) == SV_ABI_LINUX);
273 * When execing to Linux binary, we create Linux emuldata
276 if (SV_PROC_ABI(p) == SV_ABI_LINUX) {
278 * Process already was under Linuxolator
279 * before exec. Update emuldata to reflect
280 * single-threaded cleaned state after exec.
282 linux_proc_init(td, NULL, false);
285 * We are switching the process to Linux emulator.
287 linux_proc_init(td, td, false);
290 * Create a transient td_emuldata for all suspended
291 * threads, so that p->p_sysent->sv_thread_detach() ==
292 * linux_thread_detach() can find expected but unused
295 FOREACH_THREAD_IN_PROC(td->td_proc, othertd) {
298 linux_proc_init(td, othertd, true);
301 /* Set ABI root directory. */
302 if ((error = linux_pwd_onexec(td)) != 0)
305 #if defined(__amd64__)
307 * An IA32 executable which has executable stack will have the
308 * READ_IMPLIES_EXEC personality flag set automatically.
310 if (SV_PROC_FLAG(td->td_proc, SV_ILP32) &&
311 imgp->stack_prot & VM_PROT_EXECUTE) {
313 pem->persona |= LINUX_READ_IMPLIES_EXEC;
/*
 * Detach the Linux emulation data from thread td.
 *
 * Sets td->td_emuldata to NULL and traces the em_tid of the detached
 * entry.
 * NOTE(review): the lookup of em, any NULL test on it, and the release
 * of its memory are not visible here -- confirm.
 */
320 linux_thread_dtor(struct thread *td)
322 struct linux_emuldata *em;
327 td->td_emuldata = NULL;
329 LINUX_CTR1(thread_dtor, "thread(%d)", em->em_tid);
/*
 * Store the thread's Linux tid at the address recorded in its emuldata.
 *
 * td - thread whose emuldata (asserted non-NULL) is consulted.
 *
 * When em->child_set_tid is non-NULL, em->em_tid is handed to copyout()
 * with that address as destination and the outcome is traced; when it
 * is NULL only em_tid is traced.
 * NOTE(review): the em lookup and the copyout() length argument are not
 * visible here, and error appears to be consumed by the trace only
 * -- confirm.
 */
335 linux_schedtail(struct thread *td)
337 struct linux_emuldata *em;
346 KASSERT(em != NULL, ("linux_schedtail: thread emuldata not found.\n"));
347 child_set_tid = em->child_set_tid;
349 if (child_set_tid != NULL) {
350 error = copyout(&em->em_tid, child_set_tid,
352 LINUX_CTR4(schedtail, "thread(%d) %p stored %d error %d",
353 td->td_tid, child_set_tid, em->em_tid, error);
355 LINUX_CTR1(schedtail, "thread(%d)", em->em_tid);