xref: /illumos-gate/usr/src/uts/i86xpv/vm/seg_mf.c (revision da6c28aa)
1843e1988Sjohnlev /*
2843e1988Sjohnlev  * CDDL HEADER START
3843e1988Sjohnlev  *
4843e1988Sjohnlev  * The contents of this file are subject to the terms of the
5843e1988Sjohnlev  * Common Development and Distribution License (the "License").
6843e1988Sjohnlev  * You may not use this file except in compliance with the License.
7843e1988Sjohnlev  *
8843e1988Sjohnlev  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9843e1988Sjohnlev  * or http://www.opensolaris.org/os/licensing.
10843e1988Sjohnlev  * See the License for the specific language governing permissions
11843e1988Sjohnlev  * and limitations under the License.
12843e1988Sjohnlev  *
13843e1988Sjohnlev  * When distributing Covered Code, include this CDDL HEADER in each
14843e1988Sjohnlev  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15843e1988Sjohnlev  * If applicable, add the following below this CDDL HEADER, with the
16843e1988Sjohnlev  * fields enclosed by brackets "[]" replaced with your own identifying
17843e1988Sjohnlev  * information: Portions Copyright [yyyy] [name of copyright owner]
18843e1988Sjohnlev  *
19843e1988Sjohnlev  * CDDL HEADER END
20843e1988Sjohnlev  */
21843e1988Sjohnlev 
22843e1988Sjohnlev /*
23843e1988Sjohnlev  * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
24843e1988Sjohnlev  * Use is subject to license terms.
25843e1988Sjohnlev  */
26843e1988Sjohnlev 
27843e1988Sjohnlev /*
28843e1988Sjohnlev  * Machine frame segment driver.  This segment driver allows dom0 processes to
29843e1988Sjohnlev  * map pages of other domains or Xen (e.g. during save/restore).  ioctl()s on
30843e1988Sjohnlev  * the privcmd driver provide the MFN values backing each mapping, and we map
31843e1988Sjohnlev  * them into the process's address space at this time.  Demand-faulting is not
32843e1988Sjohnlev  * supported by this driver due to the requirements upon some of the ioctl()s.
33843e1988Sjohnlev  */
34843e1988Sjohnlev 
35843e1988Sjohnlev #pragma ident	"%Z%%M%	%I%	%E% SMI"
36843e1988Sjohnlev 
37843e1988Sjohnlev #include <sys/types.h>
38843e1988Sjohnlev #include <sys/systm.h>
39843e1988Sjohnlev #include <sys/vmsystm.h>
40843e1988Sjohnlev #include <sys/mman.h>
41843e1988Sjohnlev #include <sys/errno.h>
42843e1988Sjohnlev #include <sys/kmem.h>
43843e1988Sjohnlev #include <sys/cmn_err.h>
44843e1988Sjohnlev #include <sys/vnode.h>
45843e1988Sjohnlev #include <sys/conf.h>
46843e1988Sjohnlev #include <sys/debug.h>
47843e1988Sjohnlev #include <sys/lgrp.h>
48843e1988Sjohnlev #include <sys/hypervisor.h>
49843e1988Sjohnlev 
50843e1988Sjohnlev #include <vm/page.h>
51843e1988Sjohnlev #include <vm/hat.h>
52843e1988Sjohnlev #include <vm/as.h>
53843e1988Sjohnlev #include <vm/seg.h>
54843e1988Sjohnlev 
55843e1988Sjohnlev #include <vm/hat_pte.h>
56843e1988Sjohnlev #include <vm/seg_mf.h>
57843e1988Sjohnlev 
58843e1988Sjohnlev #include <sys/fs/snode.h>
59843e1988Sjohnlev 
/* Yield the s_commonvp field of the snode that VTOS() returns for vp. */
#define	VTOCVP(vp)	(VTOS(vp)->s_commonvp)
61843e1988Sjohnlev 
/* Size in bytes of an array holding n mfn_t entries. */
#define	mfatob(n)	((n) * sizeof (mfn_t))
63843e1988Sjohnlev 
64843e1988Sjohnlev struct segmf_data {
65843e1988Sjohnlev 	kmutex_t	lock;
66843e1988Sjohnlev 	struct vnode	*vp;
67843e1988Sjohnlev 	uchar_t		prot;
68843e1988Sjohnlev 	uchar_t		maxprot;
69843e1988Sjohnlev 	size_t		softlockcnt;
70843e1988Sjohnlev 	domid_t		domid;
71843e1988Sjohnlev 	mfn_t		*mfns;
72843e1988Sjohnlev };
73843e1988Sjohnlev 
74843e1988Sjohnlev static struct seg_ops segmf_ops;
75843e1988Sjohnlev 
76843e1988Sjohnlev static struct segmf_data *
77843e1988Sjohnlev segmf_data_zalloc(struct seg *seg)
78843e1988Sjohnlev {
79843e1988Sjohnlev 	struct segmf_data *data = kmem_zalloc(sizeof (*data), KM_SLEEP);
80843e1988Sjohnlev 
81843e1988Sjohnlev 	mutex_init(&data->lock, "segmf.lock", MUTEX_DEFAULT, NULL);
82843e1988Sjohnlev 	seg->s_ops = &segmf_ops;
83843e1988Sjohnlev 	seg->s_data = data;
84843e1988Sjohnlev 	return (data);
85843e1988Sjohnlev }
86843e1988Sjohnlev 
87843e1988Sjohnlev int
88843e1988Sjohnlev segmf_create(struct seg *seg, void *args)
89843e1988Sjohnlev {
90843e1988Sjohnlev 	struct segmf_crargs *a = args;
91843e1988Sjohnlev 	struct segmf_data *data;
92843e1988Sjohnlev 	struct as *as = seg->s_as;
93843e1988Sjohnlev 	pgcnt_t i, npages = seg_pages(seg);
94843e1988Sjohnlev 	int error;
95843e1988Sjohnlev 
96843e1988Sjohnlev 	hat_map(as->a_hat, seg->s_base, seg->s_size, HAT_MAP);
97843e1988Sjohnlev 
98843e1988Sjohnlev 	data = segmf_data_zalloc(seg);
99843e1988Sjohnlev 	data->vp = specfind(a->dev, VCHR);
100843e1988Sjohnlev 	data->prot = a->prot;
101843e1988Sjohnlev 	data->maxprot = a->maxprot;
102843e1988Sjohnlev 
103843e1988Sjohnlev 	data->mfns = kmem_alloc(mfatob(npages), KM_SLEEP);
104843e1988Sjohnlev 	for (i = 0; i < npages; i++)
105843e1988Sjohnlev 		data->mfns[i] = MFN_INVALID;
106843e1988Sjohnlev 
107843e1988Sjohnlev 	error = VOP_ADDMAP(VTOCVP(data->vp), 0, as, seg->s_base, seg->s_size,
108*da6c28aaSamw 	    data->prot, data->maxprot, MAP_SHARED, CRED(), NULL);
109843e1988Sjohnlev 
110843e1988Sjohnlev 	if (error != 0)
111843e1988Sjohnlev 		hat_unload(as->a_hat,
112843e1988Sjohnlev 		    seg->s_base, seg->s_size, HAT_UNLOAD_UNMAP);
113843e1988Sjohnlev 	return (error);
114843e1988Sjohnlev }
115843e1988Sjohnlev 
116843e1988Sjohnlev /*
117843e1988Sjohnlev  * Duplicate a seg and return new segment in newseg.
118843e1988Sjohnlev  */
119843e1988Sjohnlev static int
120843e1988Sjohnlev segmf_dup(struct seg *seg, struct seg *newseg)
121843e1988Sjohnlev {
122843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
123843e1988Sjohnlev 	struct segmf_data *ndata;
124843e1988Sjohnlev 	pgcnt_t npages = seg_pages(newseg);
125843e1988Sjohnlev 
126843e1988Sjohnlev 	ndata = segmf_data_zalloc(newseg);
127843e1988Sjohnlev 
128843e1988Sjohnlev 	VN_HOLD(data->vp);
129843e1988Sjohnlev 	ndata->vp = data->vp;
130843e1988Sjohnlev 	ndata->prot = data->prot;
131843e1988Sjohnlev 	ndata->maxprot = data->maxprot;
132843e1988Sjohnlev 	ndata->domid = data->domid;
133843e1988Sjohnlev 
134843e1988Sjohnlev 	ndata->mfns = kmem_alloc(mfatob(npages), KM_SLEEP);
135843e1988Sjohnlev 	bcopy(data->mfns, ndata->mfns, mfatob(npages));
136843e1988Sjohnlev 
137843e1988Sjohnlev 	return (VOP_ADDMAP(VTOCVP(ndata->vp), 0, newseg->s_as,
138843e1988Sjohnlev 	    newseg->s_base, newseg->s_size, ndata->prot, ndata->maxprot,
139*da6c28aaSamw 	    MAP_SHARED, CRED(), NULL));
140843e1988Sjohnlev }
141843e1988Sjohnlev 
142843e1988Sjohnlev /*
143843e1988Sjohnlev  * We only support unmapping the whole segment, and we automatically unlock
144843e1988Sjohnlev  * what we previously soft-locked.
145843e1988Sjohnlev  */
146843e1988Sjohnlev static int
147843e1988Sjohnlev segmf_unmap(struct seg *seg, caddr_t addr, size_t len)
148843e1988Sjohnlev {
149843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
150843e1988Sjohnlev 	offset_t off;
151843e1988Sjohnlev 
152843e1988Sjohnlev 	if (addr < seg->s_base || addr + len > seg->s_base + seg->s_size ||
153843e1988Sjohnlev 	    (len & PAGEOFFSET) || ((uintptr_t)addr & PAGEOFFSET))
154843e1988Sjohnlev 		panic("segmf_unmap");
155843e1988Sjohnlev 
156843e1988Sjohnlev 	if (addr != seg->s_base || len != seg->s_size)
157843e1988Sjohnlev 		return (ENOTSUP);
158843e1988Sjohnlev 
159843e1988Sjohnlev 	hat_unload(seg->s_as->a_hat, addr, len,
160843e1988Sjohnlev 	    HAT_UNLOAD_UNMAP | HAT_UNLOAD_UNLOCK);
161843e1988Sjohnlev 
162843e1988Sjohnlev 	off = (offset_t)seg_page(seg, addr);
163843e1988Sjohnlev 
164843e1988Sjohnlev 	ASSERT(data->vp != NULL);
165843e1988Sjohnlev 
166843e1988Sjohnlev 	(void) VOP_DELMAP(VTOCVP(data->vp), off, seg->s_as, addr, len,
167*da6c28aaSamw 	    data->prot, data->maxprot, MAP_SHARED, CRED(), NULL);
168843e1988Sjohnlev 
169843e1988Sjohnlev 	seg_free(seg);
170843e1988Sjohnlev 	return (0);
171843e1988Sjohnlev }
172843e1988Sjohnlev 
173843e1988Sjohnlev static void
174843e1988Sjohnlev segmf_free(struct seg *seg)
175843e1988Sjohnlev {
176843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
177843e1988Sjohnlev 	pgcnt_t npages = seg_pages(seg);
178843e1988Sjohnlev 
179843e1988Sjohnlev 	kmem_free(data->mfns, mfatob(npages));
180843e1988Sjohnlev 	VN_RELE(data->vp);
181843e1988Sjohnlev 	mutex_destroy(&data->lock);
182843e1988Sjohnlev 	kmem_free(data, sizeof (*data));
183843e1988Sjohnlev }
184843e1988Sjohnlev 
185843e1988Sjohnlev static int segmf_faultpage_debug = 0;
186843e1988Sjohnlev 
187843e1988Sjohnlev /*ARGSUSED*/
188843e1988Sjohnlev static int
189843e1988Sjohnlev segmf_faultpage(struct hat *hat, struct seg *seg, caddr_t addr,
190843e1988Sjohnlev     enum fault_type type, uint_t prot)
191843e1988Sjohnlev {
192843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
193843e1988Sjohnlev 	uint_t hat_flags = HAT_LOAD_NOCONSIST;
194843e1988Sjohnlev 	mfn_t mfn;
195843e1988Sjohnlev 	x86pte_t pte;
196843e1988Sjohnlev 
197843e1988Sjohnlev 	mfn = data->mfns[seg_page(seg, addr)];
198843e1988Sjohnlev 
199843e1988Sjohnlev 	ASSERT(mfn != MFN_INVALID);
200843e1988Sjohnlev 
201843e1988Sjohnlev 	if (type == F_SOFTLOCK) {
202843e1988Sjohnlev 		mutex_enter(&freemem_lock);
203843e1988Sjohnlev 		data->softlockcnt++;
204843e1988Sjohnlev 		mutex_exit(&freemem_lock);
205843e1988Sjohnlev 		hat_flags |= HAT_LOAD_LOCK;
206843e1988Sjohnlev 	} else
207843e1988Sjohnlev 		hat_flags |= HAT_LOAD;
208843e1988Sjohnlev 
209843e1988Sjohnlev 	if (segmf_faultpage_debug > 0) {
210843e1988Sjohnlev 		uprintf("segmf_faultpage: addr %p domid %x mfn %lx prot %x\n",
211843e1988Sjohnlev 		    (void *)addr, data->domid, mfn, prot);
212843e1988Sjohnlev 		segmf_faultpage_debug--;
213843e1988Sjohnlev 	}
214843e1988Sjohnlev 
215843e1988Sjohnlev 	/*
216843e1988Sjohnlev 	 * Ask the HAT to load a throwaway mapping to page zero, then
217843e1988Sjohnlev 	 * overwrite it with our foreign domain mapping. It gets removed
218843e1988Sjohnlev 	 * later via hat_unload()
219843e1988Sjohnlev 	 */
220843e1988Sjohnlev 	hat_devload(hat, addr, MMU_PAGESIZE, (pfn_t)0,
221843e1988Sjohnlev 	    PROT_READ | HAT_UNORDERED_OK, hat_flags);
222843e1988Sjohnlev 
223843e1988Sjohnlev 	pte = mmu_ptob((x86pte_t)mfn) | PT_VALID | PT_USER | PT_FOREIGN;
224843e1988Sjohnlev 	if (prot & PROT_WRITE)
225843e1988Sjohnlev 		pte |= PT_WRITABLE;
226843e1988Sjohnlev 
227843e1988Sjohnlev 	if (HYPERVISOR_update_va_mapping_otherdomain((uintptr_t)addr, pte,
228843e1988Sjohnlev 	    UVMF_INVLPG | UVMF_ALL, data->domid) != 0) {
229843e1988Sjohnlev 		hat_flags = HAT_UNLOAD_UNMAP;
230843e1988Sjohnlev 
231843e1988Sjohnlev 		if (type == F_SOFTLOCK) {
232843e1988Sjohnlev 			hat_flags |= HAT_UNLOAD_UNLOCK;
233843e1988Sjohnlev 			mutex_enter(&freemem_lock);
234843e1988Sjohnlev 			data->softlockcnt--;
235843e1988Sjohnlev 			mutex_exit(&freemem_lock);
236843e1988Sjohnlev 		}
237843e1988Sjohnlev 
238843e1988Sjohnlev 		hat_unload(hat, addr, MMU_PAGESIZE, hat_flags);
239843e1988Sjohnlev 		return (FC_MAKE_ERR(EFAULT));
240843e1988Sjohnlev 	}
241843e1988Sjohnlev 
242843e1988Sjohnlev 	return (0);
243843e1988Sjohnlev }
244843e1988Sjohnlev 
245843e1988Sjohnlev static int
246843e1988Sjohnlev seg_rw_to_prot(enum seg_rw rw)
247843e1988Sjohnlev {
248843e1988Sjohnlev 	switch (rw) {
249843e1988Sjohnlev 	case S_READ:
250843e1988Sjohnlev 		return (PROT_READ);
251843e1988Sjohnlev 	case S_WRITE:
252843e1988Sjohnlev 		return (PROT_WRITE);
253843e1988Sjohnlev 	case S_EXEC:
254843e1988Sjohnlev 		return (PROT_EXEC);
255843e1988Sjohnlev 	case S_OTHER:
256843e1988Sjohnlev 	default:
257843e1988Sjohnlev 		break;
258843e1988Sjohnlev 	}
259843e1988Sjohnlev 	return (PROT_READ | PROT_WRITE | PROT_EXEC);
260843e1988Sjohnlev }
261843e1988Sjohnlev 
262843e1988Sjohnlev static void
263843e1988Sjohnlev segmf_softunlock(struct hat *hat, struct seg *seg, caddr_t addr, size_t len)
264843e1988Sjohnlev {
265843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
266843e1988Sjohnlev 
267843e1988Sjohnlev 	hat_unlock(hat, addr, len);
268843e1988Sjohnlev 
269843e1988Sjohnlev 	mutex_enter(&freemem_lock);
270843e1988Sjohnlev 	ASSERT(data->softlockcnt >= btopr(len));
271843e1988Sjohnlev 	data->softlockcnt -= btopr(len);
272843e1988Sjohnlev 	mutex_exit(&freemem_lock);
273843e1988Sjohnlev 
274843e1988Sjohnlev 	if (data->softlockcnt == 0) {
275843e1988Sjohnlev 		struct as *as = seg->s_as;
276843e1988Sjohnlev 
277843e1988Sjohnlev 		if (AS_ISUNMAPWAIT(as)) {
278843e1988Sjohnlev 			mutex_enter(&as->a_contents);
279843e1988Sjohnlev 			if (AS_ISUNMAPWAIT(as)) {
280843e1988Sjohnlev 				AS_CLRUNMAPWAIT(as);
281843e1988Sjohnlev 				cv_broadcast(&as->a_cv);
282843e1988Sjohnlev 			}
283843e1988Sjohnlev 			mutex_exit(&as->a_contents);
284843e1988Sjohnlev 		}
285843e1988Sjohnlev 	}
286843e1988Sjohnlev }
287843e1988Sjohnlev 
288843e1988Sjohnlev static int
289843e1988Sjohnlev segmf_fault_range(struct hat *hat, struct seg *seg, caddr_t addr, size_t len,
290843e1988Sjohnlev     enum fault_type type, enum seg_rw rw)
291843e1988Sjohnlev {
292843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
293843e1988Sjohnlev 	int error = 0;
294843e1988Sjohnlev 	caddr_t a;
295843e1988Sjohnlev 
296843e1988Sjohnlev 	if ((data->prot & seg_rw_to_prot(rw)) == 0)
297843e1988Sjohnlev 		return (FC_PROT);
298843e1988Sjohnlev 
299843e1988Sjohnlev 	/* loop over the address range handling each fault */
300843e1988Sjohnlev 
301843e1988Sjohnlev 	for (a = addr; a < addr + len; a += PAGESIZE) {
302843e1988Sjohnlev 		error = segmf_faultpage(hat, seg, a, type, data->prot);
303843e1988Sjohnlev 		if (error != 0)
304843e1988Sjohnlev 			break;
305843e1988Sjohnlev 	}
306843e1988Sjohnlev 
307843e1988Sjohnlev 	if (error != 0 && type == F_SOFTLOCK) {
308843e1988Sjohnlev 		size_t done = (size_t)(a - addr);
309843e1988Sjohnlev 
310843e1988Sjohnlev 		/*
311843e1988Sjohnlev 		 * Undo what's been done so far.
312843e1988Sjohnlev 		 */
313843e1988Sjohnlev 		if (done > 0)
314843e1988Sjohnlev 			segmf_softunlock(hat, seg, addr, done);
315843e1988Sjohnlev 	}
316843e1988Sjohnlev 
317843e1988Sjohnlev 	return (error);
318843e1988Sjohnlev }
319843e1988Sjohnlev 
320843e1988Sjohnlev /*
321843e1988Sjohnlev  * We never demand-fault for seg_mf.
322843e1988Sjohnlev  */
323843e1988Sjohnlev /*ARGSUSED*/
324843e1988Sjohnlev static int
325843e1988Sjohnlev segmf_fault(struct hat *hat, struct seg *seg, caddr_t addr, size_t len,
326843e1988Sjohnlev     enum fault_type type, enum seg_rw rw)
327843e1988Sjohnlev {
328843e1988Sjohnlev 	return (FC_MAKE_ERR(EFAULT));
329843e1988Sjohnlev }
330843e1988Sjohnlev 
331843e1988Sjohnlev /*ARGSUSED*/
332843e1988Sjohnlev static int
333843e1988Sjohnlev segmf_faulta(struct seg *seg, caddr_t addr)
334843e1988Sjohnlev {
335843e1988Sjohnlev 	return (0);
336843e1988Sjohnlev }
337843e1988Sjohnlev 
338843e1988Sjohnlev /*ARGSUSED*/
339843e1988Sjohnlev static int
340843e1988Sjohnlev segmf_setprot(struct seg *seg, caddr_t addr, size_t len, uint_t prot)
341843e1988Sjohnlev {
342843e1988Sjohnlev 	return (EINVAL);
343843e1988Sjohnlev }
344843e1988Sjohnlev 
345843e1988Sjohnlev /*ARGSUSED*/
346843e1988Sjohnlev static int
347843e1988Sjohnlev segmf_checkprot(struct seg *seg, caddr_t addr, size_t len, uint_t prot)
348843e1988Sjohnlev {
349843e1988Sjohnlev 	return (EINVAL);
350843e1988Sjohnlev }
351843e1988Sjohnlev 
352843e1988Sjohnlev /*ARGSUSED*/
353843e1988Sjohnlev static int
354843e1988Sjohnlev segmf_kluster(struct seg *seg, caddr_t addr, ssize_t delta)
355843e1988Sjohnlev {
356843e1988Sjohnlev 	return (-1);
357843e1988Sjohnlev }
358843e1988Sjohnlev 
359843e1988Sjohnlev /*ARGSUSED*/
360843e1988Sjohnlev static int
361843e1988Sjohnlev segmf_sync(struct seg *seg, caddr_t addr, size_t len, int attr, uint_t flags)
362843e1988Sjohnlev {
363843e1988Sjohnlev 	return (0);
364843e1988Sjohnlev }
365843e1988Sjohnlev 
366843e1988Sjohnlev /*
367843e1988Sjohnlev  * XXPV	Hmm.  Should we say that mf mapping are "in core?"
368843e1988Sjohnlev  */
369843e1988Sjohnlev 
370843e1988Sjohnlev /*ARGSUSED*/
371843e1988Sjohnlev static size_t
372843e1988Sjohnlev segmf_incore(struct seg *seg, caddr_t addr, size_t len, char *vec)
373843e1988Sjohnlev {
374843e1988Sjohnlev 	size_t v;
375843e1988Sjohnlev 
376843e1988Sjohnlev 	for (v = 0, len = (len + PAGEOFFSET) & PAGEMASK; len;
377843e1988Sjohnlev 	    len -= PAGESIZE, v += PAGESIZE)
378843e1988Sjohnlev 		*vec++ = 1;
379843e1988Sjohnlev 	return (v);
380843e1988Sjohnlev }
381843e1988Sjohnlev 
382843e1988Sjohnlev /*ARGSUSED*/
383843e1988Sjohnlev static int
384843e1988Sjohnlev segmf_lockop(struct seg *seg, caddr_t addr,
385843e1988Sjohnlev     size_t len, int attr, int op, ulong_t *lockmap, size_t pos)
386843e1988Sjohnlev {
387843e1988Sjohnlev 	return (0);
388843e1988Sjohnlev }
389843e1988Sjohnlev 
390843e1988Sjohnlev static int
391843e1988Sjohnlev segmf_getprot(struct seg *seg, caddr_t addr, size_t len, uint_t *protv)
392843e1988Sjohnlev {
393843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
394843e1988Sjohnlev 	pgcnt_t pgno = seg_page(seg, addr + len) - seg_page(seg, addr) + 1;
395843e1988Sjohnlev 
396843e1988Sjohnlev 	if (pgno != 0) {
397843e1988Sjohnlev 		do
398843e1988Sjohnlev 			protv[--pgno] = data->prot;
399843e1988Sjohnlev 		while (pgno != 0)
400843e1988Sjohnlev 			;
401843e1988Sjohnlev 	}
402843e1988Sjohnlev 	return (0);
403843e1988Sjohnlev }
404843e1988Sjohnlev 
405843e1988Sjohnlev static u_offset_t
406843e1988Sjohnlev segmf_getoffset(struct seg *seg, caddr_t addr)
407843e1988Sjohnlev {
408843e1988Sjohnlev 	return (addr - seg->s_base);
409843e1988Sjohnlev }
410843e1988Sjohnlev 
411843e1988Sjohnlev /*ARGSUSED*/
412843e1988Sjohnlev static int
413843e1988Sjohnlev segmf_gettype(struct seg *seg, caddr_t addr)
414843e1988Sjohnlev {
415843e1988Sjohnlev 	return (MAP_SHARED);
416843e1988Sjohnlev }
417843e1988Sjohnlev 
418843e1988Sjohnlev /*ARGSUSED1*/
419843e1988Sjohnlev static int
420843e1988Sjohnlev segmf_getvp(struct seg *seg, caddr_t addr, struct vnode **vpp)
421843e1988Sjohnlev {
422843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
423843e1988Sjohnlev 
424843e1988Sjohnlev 	*vpp = VTOCVP(data->vp);
425843e1988Sjohnlev 	return (0);
426843e1988Sjohnlev }
427843e1988Sjohnlev 
428843e1988Sjohnlev /*ARGSUSED*/
429843e1988Sjohnlev static int
430843e1988Sjohnlev segmf_advise(struct seg *seg, caddr_t addr, size_t len, uint_t behav)
431843e1988Sjohnlev {
432843e1988Sjohnlev 	return (0);
433843e1988Sjohnlev }
434843e1988Sjohnlev 
/*
 * Dump entry point; intentionally empty.
 */
/*ARGSUSED*/
static void
segmf_dump(struct seg *seg)
{
}
439843e1988Sjohnlev 
440843e1988Sjohnlev /*ARGSUSED*/
441843e1988Sjohnlev static int
442843e1988Sjohnlev segmf_pagelock(struct seg *seg, caddr_t addr, size_t len,
443843e1988Sjohnlev     struct page ***ppp, enum lock_type type, enum seg_rw rw)
444843e1988Sjohnlev {
445843e1988Sjohnlev 	return (ENOTSUP);
446843e1988Sjohnlev }
447843e1988Sjohnlev 
448843e1988Sjohnlev /*ARGSUSED*/
449843e1988Sjohnlev static int
450843e1988Sjohnlev segmf_setpagesize(struct seg *seg, caddr_t addr, size_t len, uint_t szc)
451843e1988Sjohnlev {
452843e1988Sjohnlev 	return (ENOTSUP);
453843e1988Sjohnlev }
454843e1988Sjohnlev 
455843e1988Sjohnlev static int
456843e1988Sjohnlev segmf_getmemid(struct seg *seg, caddr_t addr, memid_t *memid)
457843e1988Sjohnlev {
458843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
459843e1988Sjohnlev 
460843e1988Sjohnlev 	memid->val[0] = (uintptr_t)VTOCVP(data->vp);
461843e1988Sjohnlev 	memid->val[1] = (uintptr_t)seg_page(seg, addr);
462843e1988Sjohnlev 	return (0);
463843e1988Sjohnlev }
464843e1988Sjohnlev 
465843e1988Sjohnlev /*ARGSUSED*/
466843e1988Sjohnlev static lgrp_mem_policy_info_t *
467843e1988Sjohnlev segmf_getpolicy(struct seg *seg, caddr_t addr)
468843e1988Sjohnlev {
469843e1988Sjohnlev 	return (NULL);
470843e1988Sjohnlev }
471843e1988Sjohnlev 
472843e1988Sjohnlev /*ARGSUSED*/
473843e1988Sjohnlev static int
474843e1988Sjohnlev segmf_capable(struct seg *seg, segcapability_t capability)
475843e1988Sjohnlev {
476843e1988Sjohnlev 	return (0);
477843e1988Sjohnlev }
478843e1988Sjohnlev 
479843e1988Sjohnlev /*
480843e1988Sjohnlev  * Add a set of contiguous foreign MFNs to the segment. soft-locking them.  The
481843e1988Sjohnlev  * pre-faulting is necessary due to live migration; in particular we must
482843e1988Sjohnlev  * return an error in response to IOCTL_PRIVCMD_MMAPBATCH rather than faulting
483843e1988Sjohnlev  * later on a bad MFN.  Whilst this isn't necessary for the other MMAP
484843e1988Sjohnlev  * ioctl()s, we lock them too, as they should be transitory.
485843e1988Sjohnlev  */
486843e1988Sjohnlev int
487843e1988Sjohnlev segmf_add_mfns(struct seg *seg, caddr_t addr, mfn_t mfn,
488843e1988Sjohnlev     pgcnt_t pgcnt, domid_t domid)
489843e1988Sjohnlev {
490843e1988Sjohnlev 	struct segmf_data *data = seg->s_data;
491843e1988Sjohnlev 	pgcnt_t base = seg_page(seg, addr);
492843e1988Sjohnlev 	faultcode_t fc;
493843e1988Sjohnlev 	pgcnt_t i;
494843e1988Sjohnlev 	int error = 0;
495843e1988Sjohnlev 
496843e1988Sjohnlev 	if (seg->s_ops != &segmf_ops)
497843e1988Sjohnlev 		return (EINVAL);
498843e1988Sjohnlev 
499843e1988Sjohnlev 	/*
500843e1988Sjohnlev 	 * Don't mess with dom0.
501843e1988Sjohnlev 	 *
502843e1988Sjohnlev 	 * Only allow the domid to be set once for the segment.
503843e1988Sjohnlev 	 * After that attempts to add mappings to this segment for
504843e1988Sjohnlev 	 * other domains explicitly fails.
505843e1988Sjohnlev 	 */
506843e1988Sjohnlev 
507843e1988Sjohnlev 	if (domid == 0 || domid == DOMID_SELF)
508843e1988Sjohnlev 		return (EACCES);
509843e1988Sjohnlev 
510843e1988Sjohnlev 	mutex_enter(&data->lock);
511843e1988Sjohnlev 
512843e1988Sjohnlev 	if (data->domid == 0)
513843e1988Sjohnlev 		data->domid = domid;
514843e1988Sjohnlev 
515843e1988Sjohnlev 	if (data->domid != domid) {
516843e1988Sjohnlev 		error = EINVAL;
517843e1988Sjohnlev 		goto out;
518843e1988Sjohnlev 	}
519843e1988Sjohnlev 
520843e1988Sjohnlev 	base = seg_page(seg, addr);
521843e1988Sjohnlev 
522843e1988Sjohnlev 	for (i = 0; i < pgcnt; i++)
523843e1988Sjohnlev 		data->mfns[base + i] = mfn++;
524843e1988Sjohnlev 
525843e1988Sjohnlev 	fc = segmf_fault_range(seg->s_as->a_hat, seg, addr,
526843e1988Sjohnlev 	    pgcnt * MMU_PAGESIZE, F_SOFTLOCK, S_OTHER);
527843e1988Sjohnlev 
528843e1988Sjohnlev 	if (fc != 0) {
529843e1988Sjohnlev 		error = fc_decode(fc);
530843e1988Sjohnlev 		for (i = 0; i < pgcnt; i++)
531843e1988Sjohnlev 			data->mfns[base + i] = MFN_INVALID;
532843e1988Sjohnlev 	}
533843e1988Sjohnlev 
534843e1988Sjohnlev out:
535843e1988Sjohnlev 	mutex_exit(&data->lock);
536843e1988Sjohnlev 	return (error);
537843e1988Sjohnlev }
538843e1988Sjohnlev 
539843e1988Sjohnlev static struct seg_ops segmf_ops = {
540843e1988Sjohnlev 	segmf_dup,
541843e1988Sjohnlev 	segmf_unmap,
542843e1988Sjohnlev 	segmf_free,
543843e1988Sjohnlev 	segmf_fault,
544843e1988Sjohnlev 	segmf_faulta,
545843e1988Sjohnlev 	segmf_setprot,
546843e1988Sjohnlev 	segmf_checkprot,
547843e1988Sjohnlev 	(int (*)())segmf_kluster,
548843e1988Sjohnlev 	(size_t (*)(struct seg *))NULL,	/* swapout */
549843e1988Sjohnlev 	segmf_sync,
550843e1988Sjohnlev 	segmf_incore,
551843e1988Sjohnlev 	segmf_lockop,
552843e1988Sjohnlev 	segmf_getprot,
553843e1988Sjohnlev 	segmf_getoffset,
554843e1988Sjohnlev 	segmf_gettype,
555843e1988Sjohnlev 	segmf_getvp,
556843e1988Sjohnlev 	segmf_advise,
557843e1988Sjohnlev 	segmf_dump,
558843e1988Sjohnlev 	segmf_pagelock,
559843e1988Sjohnlev 	segmf_setpagesize,
560843e1988Sjohnlev 	segmf_getmemid,
561843e1988Sjohnlev 	segmf_getpolicy,
562843e1988Sjohnlev 	segmf_capable
563843e1988Sjohnlev };
564