1eda14cbcSMatt Macy /*
2eda14cbcSMatt Macy  * Copyright (c) 2007 Pawel Jakub Dawidek <pjd@FreeBSD.org>
3eda14cbcSMatt Macy  * All rights reserved.
4eda14cbcSMatt Macy  *
5eda14cbcSMatt Macy  * Redistribution and use in source and binary forms, with or without
6eda14cbcSMatt Macy  * modification, are permitted provided that the following conditions
7eda14cbcSMatt Macy  * are met:
8eda14cbcSMatt Macy  * 1. Redistributions of source code must retain the above copyright
9eda14cbcSMatt Macy  *    notice, this list of conditions and the following disclaimer.
10eda14cbcSMatt Macy  * 2. Redistributions in binary form must reproduce the above copyright
11eda14cbcSMatt Macy  *    notice, this list of conditions and the following disclaimer in the
12eda14cbcSMatt Macy  *    documentation and/or other materials provided with the distribution.
13eda14cbcSMatt Macy  *
14eda14cbcSMatt Macy  * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
15eda14cbcSMatt Macy  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16eda14cbcSMatt Macy  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17eda14cbcSMatt Macy  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
18eda14cbcSMatt Macy  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19eda14cbcSMatt Macy  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20eda14cbcSMatt Macy  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21eda14cbcSMatt Macy  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22eda14cbcSMatt Macy  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23eda14cbcSMatt Macy  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24eda14cbcSMatt Macy  * SUCH DAMAGE.
25eda14cbcSMatt Macy  */
26eda14cbcSMatt Macy 
27eda14cbcSMatt Macy #include <sys/types.h>
28eda14cbcSMatt Macy #include <sys/param.h>
29eda14cbcSMatt Macy #include <sys/kernel.h>
30eda14cbcSMatt Macy #include <sys/systm.h>
31eda14cbcSMatt Macy #include <sys/proc.h>
32eda14cbcSMatt Macy #include <sys/lock.h>
33eda14cbcSMatt Macy #include <sys/mutex.h>
34eda14cbcSMatt Macy #include <sys/sx.h>
35eda14cbcSMatt Macy #include <sys/malloc.h>
36eda14cbcSMatt Macy #include <sys/queue.h>
37eda14cbcSMatt Macy #include <sys/jail.h>
38eda14cbcSMatt Macy #include <sys/osd.h>
39eda14cbcSMatt Macy #include <sys/priv.h>
40eda14cbcSMatt Macy #include <sys/zone.h>
41eda14cbcSMatt Macy 
42eda14cbcSMatt Macy #include <sys/policy.h>
43eda14cbcSMatt Macy 
/* Malloc type tag passed to every malloc()/free() call in this file. */
static MALLOC_DEFINE(M_ZONES, "zones_data", "Zones data");
45eda14cbcSMatt Macy 
/*
 * Structure to record list of ZFS datasets exported to a zone.
 *
 * Each entry is allocated with room for the NUL-terminated dataset name
 * directly after the list linkage, so zd_dataset is a flexible array member
 * and contributes nothing to sizeof (zone_dataset_t).
 */
typedef struct zone_dataset {
	LIST_ENTRY(zone_dataset) zd_next;	/* linkage in the per-jail list */
	char	zd_dataset[];			/* dataset name, NUL-terminated */
} zone_dataset_t;

/* Head of the per-jail list of exported datasets. */
LIST_HEAD(zone_dataset_head, zone_dataset);

/* Jail OSD slot under which the per-jail list head is stored. */
static int zone_slot;
57eda14cbcSMatt Macy 
58eda14cbcSMatt Macy int
zone_dataset_attach(struct ucred * cred,const char * dataset,int jailid)59eda14cbcSMatt Macy zone_dataset_attach(struct ucred *cred, const char *dataset, int jailid)
60eda14cbcSMatt Macy {
61eda14cbcSMatt Macy 	struct zone_dataset_head *head;
62eda14cbcSMatt Macy 	zone_dataset_t *zd, *zd2;
63eda14cbcSMatt Macy 	struct prison *pr;
64eda14cbcSMatt Macy 	int dofree, error;
65eda14cbcSMatt Macy 
66eda14cbcSMatt Macy 	if ((error = spl_priv_check_cred(cred, PRIV_ZFS_JAIL)) != 0)
67eda14cbcSMatt Macy 		return (error);
68eda14cbcSMatt Macy 
69eda14cbcSMatt Macy 	/* Allocate memory before we grab prison's mutex. */
70eda14cbcSMatt Macy 	zd = malloc(sizeof (*zd) + strlen(dataset) + 1, M_ZONES, M_WAITOK);
71eda14cbcSMatt Macy 
72eda14cbcSMatt Macy 	sx_slock(&allprison_lock);
73eda14cbcSMatt Macy 	pr = prison_find(jailid);	/* Locks &pr->pr_mtx. */
74eda14cbcSMatt Macy 	sx_sunlock(&allprison_lock);
75eda14cbcSMatt Macy 	if (pr == NULL) {
76eda14cbcSMatt Macy 		free(zd, M_ZONES);
77eda14cbcSMatt Macy 		return (ENOENT);
78eda14cbcSMatt Macy 	}
79eda14cbcSMatt Macy 
80eda14cbcSMatt Macy 	head = osd_jail_get(pr, zone_slot);
81eda14cbcSMatt Macy 	if (head != NULL) {
82eda14cbcSMatt Macy 		dofree = 0;
83eda14cbcSMatt Macy 		LIST_FOREACH(zd2, head, zd_next) {
84eda14cbcSMatt Macy 			if (strcmp(dataset, zd2->zd_dataset) == 0) {
85eda14cbcSMatt Macy 				free(zd, M_ZONES);
86eda14cbcSMatt Macy 				error = EEXIST;
87eda14cbcSMatt Macy 				goto end;
88eda14cbcSMatt Macy 			}
89eda14cbcSMatt Macy 		}
90eda14cbcSMatt Macy 	} else {
91eda14cbcSMatt Macy 		dofree = 1;
92eda14cbcSMatt Macy 		prison_hold_locked(pr);
93eda14cbcSMatt Macy 		mtx_unlock(&pr->pr_mtx);
94eda14cbcSMatt Macy 		head = malloc(sizeof (*head), M_ZONES, M_WAITOK);
95eda14cbcSMatt Macy 		LIST_INIT(head);
96eda14cbcSMatt Macy 		mtx_lock(&pr->pr_mtx);
97eda14cbcSMatt Macy 		error = osd_jail_set(pr, zone_slot, head);
98eda14cbcSMatt Macy 		KASSERT(error == 0, ("osd_jail_set() failed (error=%d)",
99eda14cbcSMatt Macy 		    error));
100eda14cbcSMatt Macy 	}
101eda14cbcSMatt Macy 	strcpy(zd->zd_dataset, dataset);
102eda14cbcSMatt Macy 	LIST_INSERT_HEAD(head, zd, zd_next);
103eda14cbcSMatt Macy end:
104eda14cbcSMatt Macy 	if (dofree)
105eda14cbcSMatt Macy 		prison_free_locked(pr);
106eda14cbcSMatt Macy 	else
107eda14cbcSMatt Macy 		mtx_unlock(&pr->pr_mtx);
108eda14cbcSMatt Macy 	return (error);
109eda14cbcSMatt Macy }
110eda14cbcSMatt Macy 
111eda14cbcSMatt Macy int
zone_dataset_detach(struct ucred * cred,const char * dataset,int jailid)112eda14cbcSMatt Macy zone_dataset_detach(struct ucred *cred, const char *dataset, int jailid)
113eda14cbcSMatt Macy {
114eda14cbcSMatt Macy 	struct zone_dataset_head *head;
115eda14cbcSMatt Macy 	zone_dataset_t *zd;
116eda14cbcSMatt Macy 	struct prison *pr;
117eda14cbcSMatt Macy 	int error;
118eda14cbcSMatt Macy 
119eda14cbcSMatt Macy 	if ((error = spl_priv_check_cred(cred, PRIV_ZFS_JAIL)) != 0)
120eda14cbcSMatt Macy 		return (error);
121eda14cbcSMatt Macy 
122eda14cbcSMatt Macy 	sx_slock(&allprison_lock);
123eda14cbcSMatt Macy 	pr = prison_find(jailid);
124eda14cbcSMatt Macy 	sx_sunlock(&allprison_lock);
125eda14cbcSMatt Macy 	if (pr == NULL)
126eda14cbcSMatt Macy 		return (ENOENT);
127eda14cbcSMatt Macy 	head = osd_jail_get(pr, zone_slot);
128eda14cbcSMatt Macy 	if (head == NULL) {
129eda14cbcSMatt Macy 		error = ENOENT;
130eda14cbcSMatt Macy 		goto end;
131eda14cbcSMatt Macy 	}
132eda14cbcSMatt Macy 	LIST_FOREACH(zd, head, zd_next) {
133eda14cbcSMatt Macy 		if (strcmp(dataset, zd->zd_dataset) == 0)
134eda14cbcSMatt Macy 			break;
135eda14cbcSMatt Macy 	}
136eda14cbcSMatt Macy 	if (zd == NULL)
137eda14cbcSMatt Macy 		error = ENOENT;
138eda14cbcSMatt Macy 	else {
139eda14cbcSMatt Macy 		LIST_REMOVE(zd, zd_next);
140eda14cbcSMatt Macy 		free(zd, M_ZONES);
141eda14cbcSMatt Macy 		if (LIST_EMPTY(head))
142eda14cbcSMatt Macy 			osd_jail_del(pr, zone_slot);
143eda14cbcSMatt Macy 		error = 0;
144eda14cbcSMatt Macy 	}
145eda14cbcSMatt Macy end:
146eda14cbcSMatt Macy 	mtx_unlock(&pr->pr_mtx);
147eda14cbcSMatt Macy 	return (error);
148eda14cbcSMatt Macy }
149eda14cbcSMatt Macy 
150eda14cbcSMatt Macy /*
151eda14cbcSMatt Macy  * Returns true if the named dataset is visible in the current zone.
152eda14cbcSMatt Macy  * The 'write' parameter is set to 1 if the dataset is also writable.
153eda14cbcSMatt Macy  */
154eda14cbcSMatt Macy int
zone_dataset_visible(const char * dataset,int * write)155eda14cbcSMatt Macy zone_dataset_visible(const char *dataset, int *write)
156eda14cbcSMatt Macy {
157eda14cbcSMatt Macy 	struct zone_dataset_head *head;
158eda14cbcSMatt Macy 	zone_dataset_t *zd;
159eda14cbcSMatt Macy 	struct prison *pr;
160eda14cbcSMatt Macy 	size_t len;
161eda14cbcSMatt Macy 	int ret = 0;
162eda14cbcSMatt Macy 
163eda14cbcSMatt Macy 	if (dataset[0] == '\0')
164eda14cbcSMatt Macy 		return (0);
165eda14cbcSMatt Macy 	if (INGLOBALZONE(curproc)) {
166eda14cbcSMatt Macy 		if (write != NULL)
167eda14cbcSMatt Macy 			*write = 1;
168eda14cbcSMatt Macy 		return (1);
169eda14cbcSMatt Macy 	}
170eda14cbcSMatt Macy 	pr = curthread->td_ucred->cr_prison;
171eda14cbcSMatt Macy 	mtx_lock(&pr->pr_mtx);
172eda14cbcSMatt Macy 	head = osd_jail_get(pr, zone_slot);
173eda14cbcSMatt Macy 	if (head == NULL)
174eda14cbcSMatt Macy 		goto end;
175eda14cbcSMatt Macy 
176eda14cbcSMatt Macy 	/*
177eda14cbcSMatt Macy 	 * Walk the list once, looking for datasets which match exactly, or
178eda14cbcSMatt Macy 	 * specify a dataset underneath an exported dataset.  If found, return
179eda14cbcSMatt Macy 	 * true and note that it is writable.
180eda14cbcSMatt Macy 	 */
181eda14cbcSMatt Macy 	LIST_FOREACH(zd, head, zd_next) {
182eda14cbcSMatt Macy 		len = strlen(zd->zd_dataset);
183eda14cbcSMatt Macy 		if (strlen(dataset) >= len &&
184*da5137abSMartin Matuska 		    memcmp(dataset, zd->zd_dataset, len) == 0 &&
185eda14cbcSMatt Macy 		    (dataset[len] == '\0' || dataset[len] == '/' ||
186eda14cbcSMatt Macy 		    dataset[len] == '@')) {
187eda14cbcSMatt Macy 			if (write)
188eda14cbcSMatt Macy 				*write = 1;
189eda14cbcSMatt Macy 			ret = 1;
190eda14cbcSMatt Macy 			goto end;
191eda14cbcSMatt Macy 		}
192eda14cbcSMatt Macy 	}
193eda14cbcSMatt Macy 
194eda14cbcSMatt Macy 	/*
195eda14cbcSMatt Macy 	 * Walk the list a second time, searching for datasets which are parents
196eda14cbcSMatt Macy 	 * of exported datasets.  These should be visible, but read-only.
197eda14cbcSMatt Macy 	 *
198eda14cbcSMatt Macy 	 * Note that we also have to support forms such as 'pool/dataset/', with
199eda14cbcSMatt Macy 	 * a trailing slash.
200eda14cbcSMatt Macy 	 */
201eda14cbcSMatt Macy 	LIST_FOREACH(zd, head, zd_next) {
202eda14cbcSMatt Macy 		len = strlen(dataset);
203eda14cbcSMatt Macy 		if (dataset[len - 1] == '/')
204eda14cbcSMatt Macy 			len--;	/* Ignore trailing slash */
205eda14cbcSMatt Macy 		if (len < strlen(zd->zd_dataset) &&
206*da5137abSMartin Matuska 		    memcmp(dataset, zd->zd_dataset, len) == 0 &&
207eda14cbcSMatt Macy 		    zd->zd_dataset[len] == '/') {
208eda14cbcSMatt Macy 			if (write)
209eda14cbcSMatt Macy 				*write = 0;
210eda14cbcSMatt Macy 			ret = 1;
211eda14cbcSMatt Macy 			goto end;
212eda14cbcSMatt Macy 		}
213eda14cbcSMatt Macy 	}
214eda14cbcSMatt Macy end:
215eda14cbcSMatt Macy 	mtx_unlock(&pr->pr_mtx);
216eda14cbcSMatt Macy 	return (ret);
217eda14cbcSMatt Macy }
218eda14cbcSMatt Macy 
219eda14cbcSMatt Macy static void
zone_destroy(void * arg)220eda14cbcSMatt Macy zone_destroy(void *arg)
221eda14cbcSMatt Macy {
222eda14cbcSMatt Macy 	struct zone_dataset_head *head;
223eda14cbcSMatt Macy 	zone_dataset_t *zd;
224eda14cbcSMatt Macy 
225eda14cbcSMatt Macy 	head = arg;
226eda14cbcSMatt Macy 	while ((zd = LIST_FIRST(head)) != NULL) {
227eda14cbcSMatt Macy 		LIST_REMOVE(zd, zd_next);
228eda14cbcSMatt Macy 		free(zd, M_ZONES);
229eda14cbcSMatt Macy 	}
230eda14cbcSMatt Macy 	free(head, M_ZONES);
231eda14cbcSMatt Macy }
232eda14cbcSMatt Macy 
233eda14cbcSMatt Macy uint32_t
zone_get_hostid(void * ptr)234eda14cbcSMatt Macy zone_get_hostid(void *ptr)
235eda14cbcSMatt Macy {
236eda14cbcSMatt Macy 
237eda14cbcSMatt Macy 	KASSERT(ptr == NULL, ("only NULL pointer supported in %s", __func__));
238eda14cbcSMatt Macy 
239eda14cbcSMatt Macy 	return ((uint32_t)curthread->td_ucred->cr_prison->pr_hostid);
240eda14cbcSMatt Macy }
241eda14cbcSMatt Macy 
242eda14cbcSMatt Macy static void
zone_sysinit(void * arg __unused)243eda14cbcSMatt Macy zone_sysinit(void *arg __unused)
244eda14cbcSMatt Macy {
245eda14cbcSMatt Macy 
246eda14cbcSMatt Macy 	zone_slot = osd_jail_register(zone_destroy, NULL);
247eda14cbcSMatt Macy }
248eda14cbcSMatt Macy 
249eda14cbcSMatt Macy static void
zone_sysuninit(void * arg __unused)250eda14cbcSMatt Macy zone_sysuninit(void *arg __unused)
251eda14cbcSMatt Macy {
252eda14cbcSMatt Macy 
253eda14cbcSMatt Macy 	osd_jail_deregister(zone_slot);
254eda14cbcSMatt Macy }
255eda14cbcSMatt Macy 
256eda14cbcSMatt Macy SYSINIT(zone_sysinit, SI_SUB_DRIVERS, SI_ORDER_ANY, zone_sysinit, NULL);
257eda14cbcSMatt Macy SYSUNINIT(zone_sysuninit, SI_SUB_DRIVERS, SI_ORDER_ANY, zone_sysuninit, NULL);
258