/*-
 * Copyright (c) 1999 Poul-Henning Kamp.
 * Copyright (c) 2008 Bjoern A. Zeeb.
 * Copyright (c) 2009 James Gritton.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");

#include "opt_compat.h"
#include "opt_inet6.h"

#include <sys/param.h>
#include <sys/types.h>
#include <sys/kernel.h>
#include <sys/systm.h>
#include <sys/errno.h>
#include <sys/sysproto.h>
#include <sys/malloc.h>
#include <sys/taskqueue.h>
#include <sys/fcntl.h>
#include <sys/jail.h>
#include <sys/lock.h>
#include <sys/mutex.h>
#include <sys/racct.h>
#include <sys/refcount.h>
#include <sys/sysent.h>
#include <sys/namei.h>
#include <sys/mount.h>
#include <sys/queue.h>
#include <sys/socket.h>
#include <sys/syscallsubr.h>
#include <sys/sysctl.h>
#include <sys/vnode.h>

#include <netinet/in.h>
/*
 * Three-way comparison of two IPv4 addresses, with a qsort(3)-compatible
 * signature.
 *
 * ip1, ip2 point at struct in_addr values holding addresses in network
 * byte order (NBO).  Returns 1 if *ip1 sorts after *ip2, -1 if it sorts
 * before, and 0 if both addresses are equal.
 */
int
prison_qcmp_v4(const void *ip1, const void *ip2)
{
	in_addr_t iaa, iab;

	/*
	 * We need to compare in HBO here to get the list sorted as expected
	 * by the result of the code.  Sorting NBO addresses gives you
	 * interesting results.  If you do not understand, do not try.
	 */
	iaa = ntohl(((const struct in_addr *)ip1)->s_addr);
	iab = ntohl(((const struct in_addr *)ip2)->s_addr);

	/*
	 * Do not simply return the difference of the two numbers, the int is
	 * not wide enough.
	 */
	if (iaa > iab)
		return (1);
	else if (iaa < iab)
		return (-1);
	else
		return (0);
}
95 * Restrict a prison's IP address list with its parent's, possibly replacing
96 * it. Return true if the replacement buffer was used (or would have been).
99 prison_restrict_ip4(struct prison *pr, struct in_addr *newip4)
105 if (!(pr->pr_flags & PR_IP4_USER)) {
106 /* This has no user settings, so just copy the parent's list. */
107 if (pr->pr_ip4s < ppr->pr_ip4s) {
109 * There's no room for the parent's list. Use the
110 * new list buffer, which is assumed to be big enough
111 * (if it was passed). If there's no buffer, try to
115 if (newip4 == NULL) {
116 newip4 = malloc(ppr->pr_ip4s * sizeof(*newip4),
121 if (newip4 != NULL) {
122 bcopy(ppr->pr_ip4, newip4,
123 ppr->pr_ip4s * sizeof(*newip4));
124 free(pr->pr_ip4, M_PRISON);
126 pr->pr_ip4s = ppr->pr_ip4s;
130 pr->pr_ip4s = ppr->pr_ip4s;
132 bcopy(ppr->pr_ip4, pr->pr_ip4,
133 pr->pr_ip4s * sizeof(*newip4));
134 else if (pr->pr_ip4 != NULL) {
135 free(pr->pr_ip4, M_PRISON);
138 } else if (pr->pr_ip4s > 0) {
139 /* Remove addresses that aren't in the parent. */
140 for (ij = 0; ij < ppr->pr_ip4s; ij++)
141 if (pr->pr_ip4[0].s_addr == ppr->pr_ip4[ij].s_addr)
143 if (ij < ppr->pr_ip4s)
146 bcopy(pr->pr_ip4 + 1, pr->pr_ip4,
147 --pr->pr_ip4s * sizeof(*pr->pr_ip4));
150 for (ij = 1; ii < pr->pr_ip4s; ) {
151 if (pr->pr_ip4[ii].s_addr == ppr->pr_ip4[0].s_addr) {
155 switch (ij >= ppr->pr_ip4s ? -1 :
156 prison_qcmp_v4(&pr->pr_ip4[ii], &ppr->pr_ip4[ij])) {
158 bcopy(pr->pr_ip4 + ii + 1, pr->pr_ip4 + ii,
159 (--pr->pr_ip4s - ii) * sizeof(*pr->pr_ip4));
170 if (pr->pr_ip4s == 0) {
171 free(pr->pr_ip4, M_PRISON);
179 * Pass back primary IPv4 address of this jail.
181 * If not restricted return success but do not alter the address. Caller has
182 * to make sure to initialize it correctly (e.g. INADDR_ANY).
184 * Returns 0 on success, EAFNOSUPPORT if the jail doesn't allow IPv4.
185 * Address returned in NBO.
188 prison_get_ip4(struct ucred *cred, struct in_addr *ia)
192 KASSERT(cred != NULL, ("%s: cred is NULL", __func__));
193 KASSERT(ia != NULL, ("%s: ia is NULL", __func__));
195 pr = cred->cr_prison;
196 if (!(pr->pr_flags & PR_IP4))
198 mtx_lock(&pr->pr_mtx);
199 if (!(pr->pr_flags & PR_IP4)) {
200 mtx_unlock(&pr->pr_mtx);
203 if (pr->pr_ip4 == NULL) {
204 mtx_unlock(&pr->pr_mtx);
205 return (EAFNOSUPPORT);
208 ia->s_addr = pr->pr_ip4[0].s_addr;
209 mtx_unlock(&pr->pr_mtx);
214 * Return 1 if we should do proper source address selection or are not jailed.
215 * We will return 0 if we should bypass source address selection in favour
216 * of the primary jail IPv4 address. Only in this case *ia will be updated and
218 * Return EAFNOSUPPORT, in case this jail does not allow IPv4.
221 prison_saddrsel_ip4(struct ucred *cred, struct in_addr *ia)
227 KASSERT(cred != NULL, ("%s: cred is NULL", __func__));
228 KASSERT(ia != NULL, ("%s: ia is NULL", __func__));
233 pr = cred->cr_prison;
234 if (pr->pr_flags & PR_IP4_SADDRSEL)
237 lia.s_addr = INADDR_ANY;
238 error = prison_get_ip4(cred, &lia);
241 if (lia.s_addr == INADDR_ANY)
244 ia->s_addr = lia.s_addr;
249 * Return true if pr1 and pr2 have the same IPv4 address restrictions.
252 prison_equal_ip4(struct prison *pr1, struct prison *pr2)
259 * No need to lock since the PR_IP4_USER flag can't be altered for
262 while (pr1 != &prison0 &&
264 !(pr1->pr_flags & PR_VNET) &&
266 !(pr1->pr_flags & PR_IP4_USER))
267 pr1 = pr1->pr_parent;
268 while (pr2 != &prison0 &&
270 !(pr2->pr_flags & PR_VNET) &&
272 !(pr2->pr_flags & PR_IP4_USER))
273 pr2 = pr2->pr_parent;
278 * Make sure our (source) address is set to something meaningful to this
281 * Returns 0 if jail doesn't restrict IPv4 or if address belongs to jail,
282 * EADDRNOTAVAIL if the address doesn't belong, or EAFNOSUPPORT if the jail
283 * doesn't allow IPv4. Address passed in in NBO and returned in NBO.
286 prison_local_ip4(struct ucred *cred, struct in_addr *ia)
292 KASSERT(cred != NULL, ("%s: cred is NULL", __func__));
293 KASSERT(ia != NULL, ("%s: ia is NULL", __func__));
295 pr = cred->cr_prison;
296 if (!(pr->pr_flags & PR_IP4))
298 mtx_lock(&pr->pr_mtx);
299 if (!(pr->pr_flags & PR_IP4)) {
300 mtx_unlock(&pr->pr_mtx);
303 if (pr->pr_ip4 == NULL) {
304 mtx_unlock(&pr->pr_mtx);
305 return (EAFNOSUPPORT);
308 ia0.s_addr = ntohl(ia->s_addr);
310 if (ia0.s_addr == INADDR_ANY) {
312 * In case there is only 1 IPv4 address, bind directly.
314 if (pr->pr_ip4s == 1)
315 ia->s_addr = pr->pr_ip4[0].s_addr;
316 mtx_unlock(&pr->pr_mtx);
320 error = prison_check_ip4_locked(pr, ia);
321 if (error == EADDRNOTAVAIL && ia0.s_addr == INADDR_LOOPBACK) {
322 ia->s_addr = pr->pr_ip4[0].s_addr;
326 mtx_unlock(&pr->pr_mtx);
331 * Rewrite destination address in case we will connect to loopback address.
333 * Returns 0 on success, EAFNOSUPPORT if the jail doesn't allow IPv4.
334 * Address passed in in NBO and returned in NBO.
337 prison_remote_ip4(struct ucred *cred, struct in_addr *ia)
341 KASSERT(cred != NULL, ("%s: cred is NULL", __func__));
342 KASSERT(ia != NULL, ("%s: ia is NULL", __func__));
344 pr = cred->cr_prison;
345 if (!(pr->pr_flags & PR_IP4))
347 mtx_lock(&pr->pr_mtx);
348 if (!(pr->pr_flags & PR_IP4)) {
349 mtx_unlock(&pr->pr_mtx);
352 if (pr->pr_ip4 == NULL) {
353 mtx_unlock(&pr->pr_mtx);
354 return (EAFNOSUPPORT);
357 if (ntohl(ia->s_addr) == INADDR_LOOPBACK &&
358 prison_check_ip4_locked(pr, ia) == EADDRNOTAVAIL) {
359 ia->s_addr = pr->pr_ip4[0].s_addr;
360 mtx_unlock(&pr->pr_mtx);
365 * Return success because nothing had to be changed.
367 mtx_unlock(&pr->pr_mtx);
372 * Check if given address belongs to the jail referenced by cred/prison.
374 * Returns 0 if address belongs to jail,
375 * EADDRNOTAVAIL if the address doesn't belong to the jail.
378 prison_check_ip4_locked(const struct prison *pr, const struct in_addr *ia)
383 * Check the primary IP.
385 if (pr->pr_ip4[0].s_addr == ia->s_addr)
389 * All the other IPs are sorted so we can do a binary search.
395 d = prison_qcmp_v4(&pr->pr_ip4[i+1], ia);
404 return (EADDRNOTAVAIL);
408 prison_check_ip4(const struct ucred *cred, const struct in_addr *ia)
413 KASSERT(cred != NULL, ("%s: cred is NULL", __func__));
414 KASSERT(ia != NULL, ("%s: ia is NULL", __func__));
416 pr = cred->cr_prison;
417 if (!(pr->pr_flags & PR_IP4))
419 mtx_lock(&pr->pr_mtx);
420 if (!(pr->pr_flags & PR_IP4)) {
421 mtx_unlock(&pr->pr_mtx);
424 if (pr->pr_ip4 == NULL) {
425 mtx_unlock(&pr->pr_mtx);
426 return (EAFNOSUPPORT);
429 error = prison_check_ip4_locked(pr, ia);
430 mtx_unlock(&pr->pr_mtx);