15b81b6b3SRodney W. Grimes /*- 25b81b6b3SRodney W. Grimes * Copyright (c) 1990 The Regents of the University of California. 35b81b6b3SRodney W. Grimes * All rights reserved. 45b81b6b3SRodney W. Grimes * 55b81b6b3SRodney W. Grimes * Redistribution and use in source and binary forms, with or without 65b81b6b3SRodney W. Grimes * modification, are permitted provided that the following conditions 75b81b6b3SRodney W. Grimes * are met: 85b81b6b3SRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 95b81b6b3SRodney W. Grimes * notice, this list of conditions and the following disclaimer. 105b81b6b3SRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 115b81b6b3SRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 125b81b6b3SRodney W. Grimes * documentation and/or other materials provided with the distribution. 135b81b6b3SRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 145b81b6b3SRodney W. Grimes * may be used to endorse or promote products derived from this software 155b81b6b3SRodney W. Grimes * without specific prior written permission. 165b81b6b3SRodney W. Grimes * 175b81b6b3SRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 185b81b6b3SRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 195b81b6b3SRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 205b81b6b3SRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 215b81b6b3SRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 225b81b6b3SRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 235b81b6b3SRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 245b81b6b3SRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 255b81b6b3SRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 265b81b6b3SRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 275b81b6b3SRodney W. Grimes * SUCH DAMAGE. 285b81b6b3SRodney W. Grimes * 2947cacd38SRodney W. Grimes * from: @(#)sys_machdep.c 5.5 (Berkeley) 1/19/91 305b81b6b3SRodney W. Grimes */ 315b81b6b3SRodney W. Grimes 329676a785SDavid E. O'Brien #include <sys/cdefs.h> 339676a785SDavid E. O'Brien __FBSDID("$FreeBSD$"); 349676a785SDavid E. O'Brien 3524c1c3bfSJonathan Anderson #include "opt_capsicum.h" 36b40ce416SJulian Elischer #include "opt_kstack_pages.h" 37268bdb43SPeter Wemm 38f540b106SGarrett Wollman #include <sys/param.h> 3974b5505eSRobert Watson #include <sys/capability.h> 40f540b106SGarrett Wollman #include <sys/systm.h> 41fb919e4dSMark Murray #include <sys/lock.h> 4291c28bfdSLuoqi Chen #include <sys/malloc.h> 43fb919e4dSMark Murray #include <sys/mutex.h> 44acd3428bSRobert Watson #include <sys/priv.h> 45f540b106SGarrett Wollman #include <sys/proc.h> 466caa8a15SJohn Baldwin #include <sys/smp.h> 47fb919e4dSMark Murray #include <sys/sysproto.h> 48efeaf95aSDavid Greenman 49efeaf95aSDavid Greenman #include <vm/vm.h> 50efeaf95aSDavid Greenman #include <vm/pmap.h> 51efeaf95aSDavid Greenman #include <vm/vm_map.h> 52efeaf95aSDavid Greenman #include <vm/vm_extern.h> 53efeaf95aSDavid Greenman 54f540b106SGarrett Wollman #include <machine/cpu.h> 556004362eSDavid Schultz #include <machine/pcb.h> 566004362eSDavid Schultz #include <machine/pcb_ext.h> 5724db0459SJohn Baldwin #include <machine/proc.h> 58f540b106SGarrett Wollman #include <machine/sysarch.h> 59812a11a2SDavid Greenman 6098bf5a70SRobert Watson #include <security/audit/audit.h> 6198bf5a70SRobert Watson 6293ee134aSKip Macy #ifdef XEN 6393ee134aSKip Macy #include <machine/xen/xenfunc.h> 6493ee134aSKip Macy 6593ee134aSKip Macy void i386_reset_ldt(struct proc_ldt *pldt); 6693ee134aSKip Macy 6793ee134aSKip Macy void 6893ee134aSKip Macy i386_reset_ldt(struct proc_ldt *pldt) 6993ee134aSKip Macy { 7093ee134aSKip Macy xen_set_ldt((vm_offset_t)pldt->ldt_base, pldt->ldt_len); 7193ee134aSKip Macy } 7293ee134aSKip Macy #else 7393ee134aSKip Macy #define i386_reset_ldt(x) 7493ee134aSKip Macy #endif 7593ee134aSKip Macy 76f540b106SGarrett Wollman #include <vm/vm_kern.h> /* for kernel_map */ 77da59a31cSDavid Greenman 780dbf6d73SJordan K. Hubbard #define MAX_LD 8192 790dbf6d73SJordan K. Hubbard #define LD_PER_PAGE 512 800dbf6d73SJordan K. Hubbard #define NEW_MAX_LD(num) ((num + LD_PER_PAGE) & ~(LD_PER_PAGE-1)) 810dbf6d73SJordan K. Hubbard #define SIZE_FROM_LARGEST_LD(num) (NEW_MAX_LD(num) << 3) 8205dfa22fSAttilio Rao #define NULL_LDT_BASE ((caddr_t)NULL) 830dbf6d73SJordan K. Hubbard 84ea11c140SAttilio Rao #ifdef SMP 8505dfa22fSAttilio Rao static void set_user_ldt_rv(struct vmspace *vmsp); 8605dfa22fSAttilio Rao #endif 87dae8d52dSDavid Xu static int i386_set_ldt_data(struct thread *, int start, int num, 88dae8d52dSDavid Xu union descriptor *descs); 89dae8d52dSDavid Xu static int i386_ldt_grow(struct thread *td, int len); 905b81b6b3SRodney W. Grimes 912f1ba63bSBruce Evans #ifndef _SYS_SYSPROTO_H_ 92812a11a2SDavid Greenman struct sysarch_args { 93812a11a2SDavid Greenman int op; 94812a11a2SDavid Greenman char *parms; 9501ae5b20SDavid Greenman }; 962f1ba63bSBruce Evans #endif 9701ae5b20SDavid Greenman 98812a11a2SDavid Greenman int 99b40ce416SJulian Elischer sysarch(td, uap) 100b40ce416SJulian Elischer struct thread *td; 101812a11a2SDavid Greenman register struct sysarch_args *uap; 1025b81b6b3SRodney W. Grimes { 1037ff022c4SJohn Baldwin int error; 10484569dffSMaxim Sobolev union descriptor *lp; 10584569dffSMaxim Sobolev union { 10684569dffSMaxim Sobolev struct i386_ldt_args largs; 10784569dffSMaxim Sobolev struct i386_ioperm_args iargs; 10884569dffSMaxim Sobolev } kargs; 109e0ab2c6dSPeter Wemm uint32_t base; 110e0ab2c6dSPeter Wemm struct segment_descriptor sd, *sdp; 11184569dffSMaxim Sobolev 11214961ba7SRobert Watson AUDIT_ARG_CMD(uap->op); 11374b5505eSRobert Watson 11424c1c3bfSJonathan Anderson #ifdef CAPABILITY_MODE 11574b5505eSRobert Watson /* 11612bc222eSJonathan Anderson * When adding new operations, add a new case statement here to 11712bc222eSJonathan Anderson * explicitly indicate whether or not the operation is safe to 11812bc222eSJonathan Anderson * perform in capability mode. 11974b5505eSRobert Watson */ 12074b5505eSRobert Watson if (IN_CAPABILITY_MODE(td)) { 12174b5505eSRobert Watson switch (uap->op) { 12274b5505eSRobert Watson case I386_GET_LDT: 12374b5505eSRobert Watson case I386_SET_LDT: 12474b5505eSRobert Watson case I386_GET_IOPERM: 12574b5505eSRobert Watson case I386_GET_FSBASE: 12674b5505eSRobert Watson case I386_SET_FSBASE: 12774b5505eSRobert Watson case I386_GET_GSBASE: 12874b5505eSRobert Watson case I386_SET_GSBASE: 12974b5505eSRobert Watson break; 13074b5505eSRobert Watson 13174b5505eSRobert Watson case I386_SET_IOPERM: 13274b5505eSRobert Watson default: 133a417d4a4SDag-Erling Smørgrav #ifdef KTRACE 134a417d4a4SDag-Erling Smørgrav if (KTRPOINT(td, KTR_CAPFAIL)) 135a417d4a4SDag-Erling Smørgrav ktrcapfail(CAPFAIL_SYSCALL, 0, 0); 136a417d4a4SDag-Erling Smørgrav #endif 13774b5505eSRobert Watson return (ECAPMODE); 13874b5505eSRobert Watson } 13974b5505eSRobert Watson } 14074b5505eSRobert Watson #endif 14174b5505eSRobert Watson 14284569dffSMaxim Sobolev switch (uap->op) { 14384569dffSMaxim Sobolev case I386_GET_IOPERM: 14484569dffSMaxim Sobolev case I386_SET_IOPERM: 14584569dffSMaxim Sobolev if ((error = copyin(uap->parms, &kargs.iargs, 14684569dffSMaxim Sobolev sizeof(struct i386_ioperm_args))) != 0) 14784569dffSMaxim Sobolev return (error); 14884569dffSMaxim Sobolev break; 14984569dffSMaxim Sobolev case I386_GET_LDT: 15084569dffSMaxim Sobolev case I386_SET_LDT: 15184569dffSMaxim Sobolev if ((error = copyin(uap->parms, &kargs.largs, 15284569dffSMaxim Sobolev sizeof(struct i386_ldt_args))) != 0) 15384569dffSMaxim Sobolev return (error); 1548a4d2b06SDavid Schultz if (kargs.largs.num > MAX_LD || kargs.largs.num <= 0) 1558a4d2b06SDavid Schultz return (EINVAL); 15684569dffSMaxim Sobolev break; 15784569dffSMaxim Sobolev default: 15884569dffSMaxim Sobolev break; 15984569dffSMaxim Sobolev } 1605b81b6b3SRodney W. Grimes 161812a11a2SDavid Greenman switch(uap->op) { 162812a11a2SDavid Greenman case I386_GET_LDT: 16384569dffSMaxim Sobolev error = i386_get_ldt(td, &kargs.largs); 1645b81b6b3SRodney W. Grimes break; 165812a11a2SDavid Greenman case I386_SET_LDT: 16684569dffSMaxim Sobolev if (kargs.largs.descs != NULL) { 1675df87b21SJeff Roberson lp = (union descriptor *)kmem_malloc(kernel_arena, 1682f84c08eSJeff Roberson kargs.largs.num * sizeof(union descriptor), 1692f84c08eSJeff Roberson M_WAITOK); 17084569dffSMaxim Sobolev if (lp == NULL) { 17184569dffSMaxim Sobolev error = ENOMEM; 17284569dffSMaxim Sobolev break; 17384569dffSMaxim Sobolev } 17484569dffSMaxim Sobolev error = copyin(kargs.largs.descs, lp, 17584569dffSMaxim Sobolev kargs.largs.num * sizeof(union descriptor)); 17684569dffSMaxim Sobolev if (error == 0) 17784569dffSMaxim Sobolev error = i386_set_ldt(td, &kargs.largs, lp); 1785df87b21SJeff Roberson kmem_free(kernel_arena, (vm_offset_t)lp, 17984569dffSMaxim Sobolev kargs.largs.num * sizeof(union descriptor)); 18084569dffSMaxim Sobolev } else { 18184569dffSMaxim Sobolev error = i386_set_ldt(td, &kargs.largs, NULL); 18284569dffSMaxim Sobolev } 1835b81b6b3SRodney W. Grimes break; 18448a09cf2SJohn Dyson case I386_GET_IOPERM: 18584569dffSMaxim Sobolev error = i386_get_ioperm(td, &kargs.iargs); 18684569dffSMaxim Sobolev if (error == 0) 18784569dffSMaxim Sobolev error = copyout(&kargs.iargs, uap->parms, 18884569dffSMaxim Sobolev sizeof(struct i386_ioperm_args)); 18948a09cf2SJohn Dyson break; 19048a09cf2SJohn Dyson case I386_SET_IOPERM: 19184569dffSMaxim Sobolev error = i386_set_ioperm(td, &kargs.iargs); 19248a09cf2SJohn Dyson break; 19348a09cf2SJohn Dyson case I386_VM86: 194b40ce416SJulian Elischer error = vm86_sysarch(td, uap->parms); 19548a09cf2SJohn Dyson break; 196e0ab2c6dSPeter Wemm case I386_GET_FSBASE: 197e0ab2c6dSPeter Wemm sdp = &td->td_pcb->pcb_fsd; 198e0ab2c6dSPeter Wemm base = sdp->sd_hibase << 24 | sdp->sd_lobase; 199e0ab2c6dSPeter Wemm error = copyout(&base, uap->parms, sizeof(base)); 200e0ab2c6dSPeter Wemm break; 201e0ab2c6dSPeter Wemm case I386_SET_FSBASE: 202e0ab2c6dSPeter Wemm error = copyin(uap->parms, &base, sizeof(base)); 203e0ab2c6dSPeter Wemm if (!error) { 204e0ab2c6dSPeter Wemm /* 205e0ab2c6dSPeter Wemm * Construct a descriptor and store it in the pcb for 206e0ab2c6dSPeter Wemm * the next context switch. Also store it in the gdt 207e0ab2c6dSPeter Wemm * so that the load of tf_fs into %fs will activate it 208e0ab2c6dSPeter Wemm * at return to userland. 209e0ab2c6dSPeter Wemm */ 210e0ab2c6dSPeter Wemm sd.sd_lobase = base & 0xffffff; 211e0ab2c6dSPeter Wemm sd.sd_hibase = (base >> 24) & 0xff; 21293ee134aSKip Macy #ifdef XEN 21393ee134aSKip Macy /* need to do nosegneg like Linux */ 21493ee134aSKip Macy sd.sd_lolimit = (HYPERVISOR_VIRT_START >> 12) & 0xffff; 21593ee134aSKip Macy #else 216e0ab2c6dSPeter Wemm sd.sd_lolimit = 0xffff; /* 4GB limit, wraps around */ 21793ee134aSKip Macy #endif 218e0ab2c6dSPeter Wemm sd.sd_hilimit = 0xf; 219e0ab2c6dSPeter Wemm sd.sd_type = SDT_MEMRWA; 220e0ab2c6dSPeter Wemm sd.sd_dpl = SEL_UPL; 221e0ab2c6dSPeter Wemm sd.sd_p = 1; 222e0ab2c6dSPeter Wemm sd.sd_xx = 0; 223e0ab2c6dSPeter Wemm sd.sd_def32 = 1; 224e0ab2c6dSPeter Wemm sd.sd_gran = 1; 2254b1fa239SDavid Xu critical_enter(); 226e0ab2c6dSPeter Wemm td->td_pcb->pcb_fsd = sd; 22793ee134aSKip Macy #ifdef XEN 22893ee134aSKip Macy HYPERVISOR_update_descriptor(vtomach(&PCPU_GET(fsgs_gdt)[0]), 22993ee134aSKip Macy *(uint64_t *)&sd); 23093ee134aSKip Macy #else 231e0ab2c6dSPeter Wemm PCPU_GET(fsgs_gdt)[0] = sd; 23293ee134aSKip Macy #endif 2334b1fa239SDavid Xu critical_exit(); 2349a045ca1SDavid Xu td->td_frame->tf_fs = GSEL(GUFS_SEL, SEL_UPL); 235e0ab2c6dSPeter Wemm } 236e0ab2c6dSPeter Wemm break; 237e0ab2c6dSPeter Wemm case I386_GET_GSBASE: 238e0ab2c6dSPeter Wemm sdp = &td->td_pcb->pcb_gsd; 239e0ab2c6dSPeter Wemm base = sdp->sd_hibase << 24 | sdp->sd_lobase; 240e0ab2c6dSPeter Wemm error = copyout(&base, uap->parms, sizeof(base)); 241e0ab2c6dSPeter Wemm break; 242e0ab2c6dSPeter Wemm case I386_SET_GSBASE: 243e0ab2c6dSPeter Wemm error = copyin(uap->parms, &base, sizeof(base)); 244e0ab2c6dSPeter Wemm if (!error) { 245e0ab2c6dSPeter Wemm /* 246e0ab2c6dSPeter Wemm * Construct a descriptor and store it in the pcb for 247e0ab2c6dSPeter Wemm * the next context switch. Also store it in the gdt 248e0ab2c6dSPeter Wemm * because we have to do a load_gs() right now. 249e0ab2c6dSPeter Wemm */ 250e0ab2c6dSPeter Wemm sd.sd_lobase = base & 0xffffff; 251e0ab2c6dSPeter Wemm sd.sd_hibase = (base >> 24) & 0xff; 25293ee134aSKip Macy 25393ee134aSKip Macy #ifdef XEN 25493ee134aSKip Macy /* need to do nosegneg like Linux */ 25593ee134aSKip Macy sd.sd_lolimit = (HYPERVISOR_VIRT_START >> 12) & 0xffff; 25693ee134aSKip Macy #else 257e0ab2c6dSPeter Wemm sd.sd_lolimit = 0xffff; /* 4GB limit, wraps around */ 25893ee134aSKip Macy #endif 259e0ab2c6dSPeter Wemm sd.sd_hilimit = 0xf; 260e0ab2c6dSPeter Wemm sd.sd_type = SDT_MEMRWA; 261e0ab2c6dSPeter Wemm sd.sd_dpl = SEL_UPL; 262e0ab2c6dSPeter Wemm sd.sd_p = 1; 263e0ab2c6dSPeter Wemm sd.sd_xx = 0; 264e0ab2c6dSPeter Wemm sd.sd_def32 = 1; 265e0ab2c6dSPeter Wemm sd.sd_gran = 1; 2664b1fa239SDavid Xu critical_enter(); 267e0ab2c6dSPeter Wemm td->td_pcb->pcb_gsd = sd; 26893ee134aSKip Macy #ifdef XEN 26993ee134aSKip Macy HYPERVISOR_update_descriptor(vtomach(&PCPU_GET(fsgs_gdt)[1]), 27093ee134aSKip Macy *(uint64_t *)&sd); 27193ee134aSKip Macy #else 272e0ab2c6dSPeter Wemm PCPU_GET(fsgs_gdt)[1] = sd; 27393ee134aSKip Macy #endif 2744b1fa239SDavid Xu critical_exit(); 275e0ab2c6dSPeter Wemm load_gs(GSEL(GUGS_SEL, SEL_UPL)); 276e0ab2c6dSPeter Wemm } 277e0ab2c6dSPeter Wemm break; 278812a11a2SDavid Greenman default: 2797ff022c4SJohn Baldwin error = EINVAL; 280812a11a2SDavid Greenman break; 281812a11a2SDavid Greenman } 282812a11a2SDavid Greenman return (error); 283812a11a2SDavid Greenman } 284da59a31cSDavid Greenman 28548a09cf2SJohn Dyson int 286b40ce416SJulian Elischer i386_extend_pcb(struct thread *td) 28748a09cf2SJohn Dyson { 28848a09cf2SJohn Dyson int i, offset; 28948a09cf2SJohn Dyson u_long *addr; 29048a09cf2SJohn Dyson struct pcb_ext *ext; 29148a09cf2SJohn Dyson struct soft_segment_descriptor ssd = { 29248a09cf2SJohn Dyson 0, /* segment base address (overwritten) */ 29348a09cf2SJohn Dyson ctob(IOPAGES + 1) - 1, /* length */ 29448a09cf2SJohn Dyson SDT_SYS386TSS, /* segment type */ 29548a09cf2SJohn Dyson 0, /* priority level */ 29648a09cf2SJohn Dyson 1, /* descriptor present */ 29748a09cf2SJohn Dyson 0, 0, 29848a09cf2SJohn Dyson 0, /* default 32 size */ 29948a09cf2SJohn Dyson 0 /* granularity */ 30048a09cf2SJohn Dyson }; 30148a09cf2SJohn Dyson 3025df87b21SJeff Roberson ext = (struct pcb_ext *)kmem_malloc(kernel_arena, ctob(IOPAGES+1), 3032f84c08eSJeff Roberson M_WAITOK); 30448a09cf2SJohn Dyson if (ext == 0) 30548a09cf2SJohn Dyson return (ENOMEM); 306640c4313SJonathan Lemon bzero(ext, sizeof(struct pcb_ext)); 307b40ce416SJulian Elischer /* -16 is so we can convert a trapframe into vm86trapframe inplace */ 308b40ce416SJulian Elischer ext->ext_tss.tss_esp0 = td->td_kstack + ctob(KSTACK_PAGES) - 309b40ce416SJulian Elischer sizeof(struct pcb) - 16; 31048a09cf2SJohn Dyson ext->ext_tss.tss_ss0 = GSEL(GDATA_SEL, SEL_KPL); 31148a09cf2SJohn Dyson /* 31248a09cf2SJohn Dyson * The last byte of the i/o map must be followed by an 0xff byte. 31348a09cf2SJohn Dyson * We arbitrarily allocate 16 bytes here, to keep the starting 31448a09cf2SJohn Dyson * address on a doubleword boundary. 31548a09cf2SJohn Dyson */ 31648a09cf2SJohn Dyson offset = PAGE_SIZE - 16; 31748a09cf2SJohn Dyson ext->ext_tss.tss_ioopt = 31848a09cf2SJohn Dyson (offset - ((unsigned)&ext->ext_tss - (unsigned)ext)) << 16; 31948a09cf2SJohn Dyson ext->ext_iomap = (caddr_t)ext + offset; 32048a09cf2SJohn Dyson ext->ext_vm86.vm86_intmap = (caddr_t)ext + offset - 32; 32148a09cf2SJohn Dyson 32248a09cf2SJohn Dyson addr = (u_long *)ext->ext_vm86.vm86_intmap; 32348a09cf2SJohn Dyson for (i = 0; i < (ctob(IOPAGES) + 32 + 16) / sizeof(u_long); i++) 32448a09cf2SJohn Dyson *addr++ = ~0; 32548a09cf2SJohn Dyson 32648a09cf2SJohn Dyson ssd.ssd_base = (unsigned)&ext->ext_tss; 32748a09cf2SJohn Dyson ssd.ssd_limit -= ((unsigned)&ext->ext_tss - (unsigned)ext); 32848a09cf2SJohn Dyson ssdtosd(&ssd, &ext->ext_tssd); 32948a09cf2SJohn Dyson 330f726a873SJohn Baldwin KASSERT(td == curthread, ("giving TSS to !curthread")); 331b40ce416SJulian Elischer KASSERT(td->td_pcb->pcb_ext == 0, ("already have a TSS!")); 332f726a873SJohn Baldwin 333f726a873SJohn Baldwin /* Switch to the new TSS. */ 3341bfa9108SDavid Xu critical_enter(); 335b40ce416SJulian Elischer td->td_pcb->pcb_ext = ext; 3361bfa9108SDavid Xu PCPU_SET(private_tss, 1); 337f726a873SJohn Baldwin *PCPU_GET(tss_gdt) = ext->ext_tssd; 338f726a873SJohn Baldwin ltr(GSEL(GPROC0_SEL, SEL_KPL)); 3391bfa9108SDavid Xu critical_exit(); 34048a09cf2SJohn Dyson 34148a09cf2SJohn Dyson return 0; 34248a09cf2SJohn Dyson } 34348a09cf2SJohn Dyson 34484569dffSMaxim Sobolev int 34584569dffSMaxim Sobolev i386_set_ioperm(td, uap) 346b40ce416SJulian Elischer struct thread *td; 34784569dffSMaxim Sobolev struct i386_ioperm_args *uap; 34848a09cf2SJohn Dyson { 3499729f279SBruce Evans int i, error; 35048a09cf2SJohn Dyson char *iomap; 35148a09cf2SJohn Dyson 352acd3428bSRobert Watson if ((error = priv_check(td, PRIV_IO)) != 0) 35348a09cf2SJohn Dyson return (error); 354a854ed98SJohn Baldwin if ((error = securelevel_gt(td->td_ucred, 0)) != 0) 355330e7889SRobert Watson return (error); 35648a09cf2SJohn Dyson /* 35748a09cf2SJohn Dyson * XXX 35848a09cf2SJohn Dyson * While this is restricted to root, we should probably figure out 35948a09cf2SJohn Dyson * whether any other driver is using this i/o address, as so not to 36048a09cf2SJohn Dyson * cause confusion. This probably requires a global 'usage registry'. 36148a09cf2SJohn Dyson */ 36248a09cf2SJohn Dyson 363b40ce416SJulian Elischer if (td->td_pcb->pcb_ext == 0) 364b40ce416SJulian Elischer if ((error = i386_extend_pcb(td)) != 0) 36548a09cf2SJohn Dyson return (error); 366b40ce416SJulian Elischer iomap = (char *)td->td_pcb->pcb_ext->ext_iomap; 36748a09cf2SJohn Dyson 36884569dffSMaxim Sobolev if (uap->start + uap->length > IOPAGES * PAGE_SIZE * NBBY) 36948a09cf2SJohn Dyson return (EINVAL); 37048a09cf2SJohn Dyson 37184569dffSMaxim Sobolev for (i = uap->start; i < uap->start + uap->length; i++) { 37284569dffSMaxim Sobolev if (uap->enable) 37348a09cf2SJohn Dyson iomap[i >> 3] &= ~(1 << (i & 7)); 37448a09cf2SJohn Dyson else 37548a09cf2SJohn Dyson iomap[i >> 3] |= (1 << (i & 7)); 37648a09cf2SJohn Dyson } 37748a09cf2SJohn Dyson return (error); 37848a09cf2SJohn Dyson } 37948a09cf2SJohn Dyson 38084569dffSMaxim Sobolev int 38184569dffSMaxim Sobolev i386_get_ioperm(td, uap) 382b40ce416SJulian Elischer struct thread *td; 38384569dffSMaxim Sobolev struct i386_ioperm_args *uap; 38448a09cf2SJohn Dyson { 38584569dffSMaxim Sobolev int i, state; 38648a09cf2SJohn Dyson char *iomap; 38748a09cf2SJohn Dyson 38884569dffSMaxim Sobolev if (uap->start >= IOPAGES * PAGE_SIZE * NBBY) 3899729f279SBruce Evans return (EINVAL); 39048a09cf2SJohn Dyson 391b40ce416SJulian Elischer if (td->td_pcb->pcb_ext == 0) { 39284569dffSMaxim Sobolev uap->length = 0; 39348a09cf2SJohn Dyson goto done; 39448a09cf2SJohn Dyson } 39548a09cf2SJohn Dyson 396b40ce416SJulian Elischer iomap = (char *)td->td_pcb->pcb_ext->ext_iomap; 39748a09cf2SJohn Dyson 39884569dffSMaxim Sobolev i = uap->start; 39938861023SPeter Wemm state = (iomap[i >> 3] >> (i & 7)) & 1; 40084569dffSMaxim Sobolev uap->enable = !state; 40184569dffSMaxim Sobolev uap->length = 1; 40248a09cf2SJohn Dyson 40384569dffSMaxim Sobolev for (i = uap->start + 1; i < IOPAGES * PAGE_SIZE * NBBY; i++) { 40448a09cf2SJohn Dyson if (state != ((iomap[i >> 3] >> (i & 7)) & 1)) 40548a09cf2SJohn Dyson break; 40684569dffSMaxim Sobolev uap->length++; 40748a09cf2SJohn Dyson } 40848a09cf2SJohn Dyson 40948a09cf2SJohn Dyson done: 41084569dffSMaxim Sobolev return (0); 41148a09cf2SJohn Dyson } 41248a09cf2SJohn Dyson 4130dbf6d73SJordan K. Hubbard /* 4140dbf6d73SJordan K. Hubbard * Update the GDT entry pointing to the LDT to point to the LDT of the 4150ad5e7f3SJeff Roberson * current process. Manage dt_lock holding/unholding autonomously. 4160dbf6d73SJordan K. Hubbard */ 417da59a31cSDavid Greenman void 41824db0459SJohn Baldwin set_user_ldt(struct mdproc *mdp) 419da59a31cSDavid Greenman { 42024db0459SJohn Baldwin struct proc_ldt *pldt; 4210ad5e7f3SJeff Roberson int dtlocked; 4220ad5e7f3SJeff Roberson 4230ad5e7f3SJeff Roberson dtlocked = 0; 4240ad5e7f3SJeff Roberson if (!mtx_owned(&dt_lock)) { 4250ad5e7f3SJeff Roberson mtx_lock_spin(&dt_lock); 4260ad5e7f3SJeff Roberson dtlocked = 1; 4270ad5e7f3SJeff Roberson } 42891c28bfdSLuoqi Chen 42924db0459SJohn Baldwin pldt = mdp->md_ldt; 43093ee134aSKip Macy #ifdef XEN 43193ee134aSKip Macy i386_reset_ldt(pldt); 43293ee134aSKip Macy PCPU_SET(currentldt, (int)pldt); 43393ee134aSKip Macy #else 4345206bca1SLuoqi Chen #ifdef SMP 43524db0459SJohn Baldwin gdt[PCPU_GET(cpuid) * NGDT + GUSERLDT_SEL].sd = pldt->ldt_sd; 4365206bca1SLuoqi Chen #else 43724db0459SJohn Baldwin gdt[GUSERLDT_SEL].sd = pldt->ldt_sd; 4385206bca1SLuoqi Chen #endif 439da59a31cSDavid Greenman lldt(GSEL(GUSERLDT_SEL, SEL_KPL)); 4404ef34f39SJake Burkholder PCPU_SET(currentldt, GSEL(GUSERLDT_SEL, SEL_KPL)); 44193ee134aSKip Macy #endif /* XEN */ 4420ad5e7f3SJeff Roberson if (dtlocked) 4430ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 4441acf256dSJohn Baldwin } 4451acf256dSJohn Baldwin 4465eb6e279SJohn Baldwin #ifdef SMP 4475eb6e279SJohn Baldwin static void 44805dfa22fSAttilio Rao set_user_ldt_rv(struct vmspace *vmsp) 4491acf256dSJohn Baldwin { 45005dfa22fSAttilio Rao struct thread *td; 4511acf256dSJohn Baldwin 45205dfa22fSAttilio Rao td = curthread; 45305dfa22fSAttilio Rao if (vmsp != td->td_proc->p_vmspace) 4541acf256dSJohn Baldwin return; 4551acf256dSJohn Baldwin 45624db0459SJohn Baldwin set_user_ldt(&td->td_proc->p_md); 457da59a31cSDavid Greenman } 4585eb6e279SJohn Baldwin #endif 459da59a31cSDavid Greenman 46093ee134aSKip Macy #ifdef XEN 46193ee134aSKip Macy 46293ee134aSKip Macy /* 46393ee134aSKip Macy * dt_lock must be held. Returns with dt_lock held. 46493ee134aSKip Macy */ 46593ee134aSKip Macy struct proc_ldt * 46693ee134aSKip Macy user_ldt_alloc(struct mdproc *mdp, int len) 46793ee134aSKip Macy { 46893ee134aSKip Macy struct proc_ldt *pldt, *new_ldt; 46993ee134aSKip Macy 47093ee134aSKip Macy mtx_assert(&dt_lock, MA_OWNED); 47193ee134aSKip Macy mtx_unlock_spin(&dt_lock); 4721ede983cSDag-Erling Smørgrav new_ldt = malloc(sizeof(struct proc_ldt), 47393ee134aSKip Macy M_SUBPROC, M_WAITOK); 47493ee134aSKip Macy 47593ee134aSKip Macy new_ldt->ldt_len = len = NEW_MAX_LD(len); 4765df87b21SJeff Roberson new_ldt->ldt_base = (caddr_t)kmem_malloc(kernel_arena, 4772f84c08eSJeff Roberson round_page(len * sizeof(union descriptor)), M_WAITOK); 47893ee134aSKip Macy if (new_ldt->ldt_base == NULL) { 4791ede983cSDag-Erling Smørgrav free(new_ldt, M_SUBPROC); 480cb1d78d0SKonstantin Belousov mtx_lock_spin(&dt_lock); 481cb1d78d0SKonstantin Belousov return (NULL); 48293ee134aSKip Macy } 48393ee134aSKip Macy new_ldt->ldt_refcnt = 1; 48493ee134aSKip Macy new_ldt->ldt_active = 0; 48593ee134aSKip Macy 486de187b8dSColin Percival mtx_lock_spin(&dt_lock); 48793ee134aSKip Macy if ((pldt = mdp->md_ldt)) { 48893ee134aSKip Macy if (len > pldt->ldt_len) 48993ee134aSKip Macy len = pldt->ldt_len; 49093ee134aSKip Macy bcopy(pldt->ldt_base, new_ldt->ldt_base, 49193ee134aSKip Macy len * sizeof(union descriptor)); 49293ee134aSKip Macy } else { 49393ee134aSKip Macy bcopy(ldt, new_ldt->ldt_base, PAGE_SIZE); 49493ee134aSKip Macy } 495de187b8dSColin Percival mtx_unlock_spin(&dt_lock); /* XXX kill once pmap locking fixed. */ 49693ee134aSKip Macy pmap_map_readonly(kernel_pmap, (vm_offset_t)new_ldt->ldt_base, 49793ee134aSKip Macy new_ldt->ldt_len*sizeof(union descriptor)); 498de187b8dSColin Percival mtx_lock_spin(&dt_lock); /* XXX kill once pmap locking fixed. */ 499cb1d78d0SKonstantin Belousov return (new_ldt); 50093ee134aSKip Macy } 50193ee134aSKip Macy #else 502df4d012bSJohn Baldwin /* 5030ad5e7f3SJeff Roberson * dt_lock must be held. Returns with dt_lock held. 504df4d012bSJohn Baldwin */ 50524db0459SJohn Baldwin struct proc_ldt * 50624db0459SJohn Baldwin user_ldt_alloc(struct mdproc *mdp, int len) 50791c28bfdSLuoqi Chen { 50824db0459SJohn Baldwin struct proc_ldt *pldt, *new_ldt; 50991c28bfdSLuoqi Chen 5100ad5e7f3SJeff Roberson mtx_assert(&dt_lock, MA_OWNED); 5110ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 5121ede983cSDag-Erling Smørgrav new_ldt = malloc(sizeof(struct proc_ldt), 513a163d034SWarner Losh M_SUBPROC, M_WAITOK); 51491c28bfdSLuoqi Chen 51591c28bfdSLuoqi Chen new_ldt->ldt_len = len = NEW_MAX_LD(len); 5165df87b21SJeff Roberson new_ldt->ldt_base = (caddr_t)kmem_malloc(kernel_arena, 5172f84c08eSJeff Roberson len * sizeof(union descriptor), M_WAITOK); 51891c28bfdSLuoqi Chen if (new_ldt->ldt_base == NULL) { 5191ede983cSDag-Erling Smørgrav free(new_ldt, M_SUBPROC); 520cb1d78d0SKonstantin Belousov mtx_lock_spin(&dt_lock); 521cb1d78d0SKonstantin Belousov return (NULL); 52291c28bfdSLuoqi Chen } 52305dfa22fSAttilio Rao new_ldt->ldt_refcnt = 1; 52491c28bfdSLuoqi Chen new_ldt->ldt_active = 0; 52591c28bfdSLuoqi Chen 5260ad5e7f3SJeff Roberson mtx_lock_spin(&dt_lock); 52791c28bfdSLuoqi Chen gdt_segs[GUSERLDT_SEL].ssd_base = (unsigned)new_ldt->ldt_base; 52891c28bfdSLuoqi Chen gdt_segs[GUSERLDT_SEL].ssd_limit = len * sizeof(union descriptor) - 1; 52991c28bfdSLuoqi Chen ssdtosd(&gdt_segs[GUSERLDT_SEL], &new_ldt->ldt_sd); 53091c28bfdSLuoqi Chen 5310ad5e7f3SJeff Roberson if ((pldt = mdp->md_ldt) != NULL) { 53224db0459SJohn Baldwin if (len > pldt->ldt_len) 53324db0459SJohn Baldwin len = pldt->ldt_len; 53424db0459SJohn Baldwin bcopy(pldt->ldt_base, new_ldt->ldt_base, 53591c28bfdSLuoqi Chen len * sizeof(union descriptor)); 5360ad5e7f3SJeff Roberson } else 53791c28bfdSLuoqi Chen bcopy(ldt, new_ldt->ldt_base, sizeof(ldt)); 5380ad5e7f3SJeff Roberson 5390ad5e7f3SJeff Roberson return (new_ldt); 54091c28bfdSLuoqi Chen } 54193ee134aSKip Macy #endif /* !XEN */ 54291c28bfdSLuoqi Chen 543df4d012bSJohn Baldwin /* 54402b0a160SAttilio Rao * Must be called with dt_lock held. Returns with dt_lock unheld. 545df4d012bSJohn Baldwin */ 54691c28bfdSLuoqi Chen void 54724db0459SJohn Baldwin user_ldt_free(struct thread *td) 54891c28bfdSLuoqi Chen { 54924db0459SJohn Baldwin struct mdproc *mdp = &td->td_proc->p_md; 5500ad5e7f3SJeff Roberson struct proc_ldt *pldt; 55191c28bfdSLuoqi Chen 5520ad5e7f3SJeff Roberson mtx_assert(&dt_lock, MA_OWNED); 553cb1d78d0SKonstantin Belousov if ((pldt = mdp->md_ldt) == NULL) { 554cb1d78d0SKonstantin Belousov mtx_unlock_spin(&dt_lock); 55591c28bfdSLuoqi Chen return; 556cb1d78d0SKonstantin Belousov } 55791c28bfdSLuoqi Chen 558b494482fSJohn Baldwin if (td == curthread) { 559aaaf6071SColin Percival #ifdef XEN 560aaaf6071SColin Percival i386_reset_ldt(&default_proc_ldt); 561aaaf6071SColin Percival PCPU_SET(currentldt, (int)&default_proc_ldt); 562aaaf6071SColin Percival #else 56391c28bfdSLuoqi Chen lldt(_default_ldt); 5644ef34f39SJake Burkholder PCPU_SET(currentldt, _default_ldt); 565aaaf6071SColin Percival #endif 56691c28bfdSLuoqi Chen } 56791c28bfdSLuoqi Chen 56824db0459SJohn Baldwin mdp->md_ldt = NULL; 5699719da13SKonstantin Belousov user_ldt_deref(pldt); 5709719da13SKonstantin Belousov } 5719719da13SKonstantin Belousov 5729719da13SKonstantin Belousov void 5739719da13SKonstantin Belousov user_ldt_deref(struct proc_ldt *pldt) 5749719da13SKonstantin Belousov { 5759719da13SKonstantin Belousov 5769719da13SKonstantin Belousov mtx_assert(&dt_lock, MA_OWNED); 57705dfa22fSAttilio Rao if (--pldt->ldt_refcnt == 0) { 57802b0a160SAttilio Rao mtx_unlock_spin(&dt_lock); 5795df87b21SJeff Roberson kmem_free(kernel_arena, (vm_offset_t)pldt->ldt_base, 58024db0459SJohn Baldwin pldt->ldt_len * sizeof(union descriptor)); 5811ede983cSDag-Erling Smørgrav free(pldt, M_SUBPROC); 58205dfa22fSAttilio Rao } else 58305dfa22fSAttilio Rao mtx_unlock_spin(&dt_lock); 58491c28bfdSLuoqi Chen } 58591c28bfdSLuoqi Chen 58684569dffSMaxim Sobolev /* 58784569dffSMaxim Sobolev * Note for the authors of compat layers (linux, etc): copyout() in 58884569dffSMaxim Sobolev * the function below is not a problem since it presents data in 58984569dffSMaxim Sobolev * arch-specific format (i.e. i386-specific in this case), not in 59084569dffSMaxim Sobolev * the OS-specific one. 59184569dffSMaxim Sobolev */ 59284569dffSMaxim Sobolev int 59384569dffSMaxim Sobolev i386_get_ldt(td, uap) 594b40ce416SJulian Elischer struct thread *td; 59584569dffSMaxim Sobolev struct i386_ldt_args *uap; 596da59a31cSDavid Greenman { 597da59a31cSDavid Greenman int error = 0; 5980ad5e7f3SJeff Roberson struct proc_ldt *pldt; 599da59a31cSDavid Greenman int nldt, num; 600da59a31cSDavid Greenman union descriptor *lp; 601da59a31cSDavid Greenman 602da59a31cSDavid Greenman #ifdef DEBUG 60300671271SBruce Evans printf("i386_get_ldt: start=%d num=%d descs=%p\n", 6047a2bb3b8SLuoqi Chen uap->start, uap->num, (void *)uap->descs); 605da59a31cSDavid Greenman #endif 606da59a31cSDavid Greenman 6070ad5e7f3SJeff Roberson mtx_lock_spin(&dt_lock); 6080ad5e7f3SJeff Roberson if ((pldt = td->td_proc->p_md.md_ldt) != NULL) { 60924db0459SJohn Baldwin nldt = pldt->ldt_len; 61024db0459SJohn Baldwin lp = &((union descriptor *)(pldt->ldt_base))[uap->start]; 6110ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 6120ad5e7f3SJeff Roberson num = min(uap->num, nldt); 613da59a31cSDavid Greenman } else { 6140ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 615da59a31cSDavid Greenman nldt = sizeof(ldt)/sizeof(ldt[0]); 616da59a31cSDavid Greenman num = min(uap->num, nldt); 617da59a31cSDavid Greenman lp = &ldt[uap->start]; 618da59a31cSDavid Greenman } 6199b2dc15cSColin Percival 6209b2dc15cSColin Percival if ((uap->start > (unsigned int)nldt) || 6219b2dc15cSColin Percival ((unsigned int)num > (unsigned int)nldt) || 6229b2dc15cSColin Percival ((unsigned int)(uap->start + num) > (unsigned int)nldt)) 623da59a31cSDavid Greenman return(EINVAL); 624da59a31cSDavid Greenman 6257a2bb3b8SLuoqi Chen error = copyout(lp, uap->descs, num * sizeof(union descriptor)); 626da59a31cSDavid Greenman if (!error) 627b40ce416SJulian Elischer td->td_retval[0] = num; 628da59a31cSDavid Greenman 629da59a31cSDavid Greenman return(error); 630da59a31cSDavid Greenman } 631da59a31cSDavid Greenman 63284569dffSMaxim Sobolev int 63384569dffSMaxim Sobolev i386_set_ldt(td, uap, descs) 634b40ce416SJulian Elischer struct thread *td; 63584569dffSMaxim Sobolev struct i386_ldt_args *uap; 63684569dffSMaxim Sobolev union descriptor *descs; 637da59a31cSDavid Greenman { 638dae8d52dSDavid Xu int error = 0, i; 6390dbf6d73SJordan K. Hubbard int largest_ld; 64024db0459SJohn Baldwin struct mdproc *mdp = &td->td_proc->p_md; 641bc2e774aSJohn Baldwin struct proc_ldt *pldt; 64284569dffSMaxim Sobolev union descriptor *dp; 643da59a31cSDavid Greenman 6441716a1afSJulian Elischer #ifdef DEBUG 6451716a1afSJulian Elischer printf("i386_set_ldt: start=%d num=%d descs=%p\n", 6461716a1afSJulian Elischer uap->start, uap->num, (void *)uap->descs); 6471716a1afSJulian Elischer #endif 6481716a1afSJulian Elischer 64984569dffSMaxim Sobolev if (descs == NULL) { 650dae8d52dSDavid Xu /* Free descriptors */ 651dae8d52dSDavid Xu if (uap->start == 0 && uap->num == 0) { 652dae8d52dSDavid Xu /* 653dae8d52dSDavid Xu * Treat this as a special case, so userland needn't 654dae8d52dSDavid Xu * know magic number NLDT. 655dae8d52dSDavid Xu */ 656dae8d52dSDavid Xu uap->start = NLDT; 657dae8d52dSDavid Xu uap->num = MAX_LD - NLDT; 6580dbf6d73SJordan K. Hubbard } 6596bd823f3SJohn Baldwin if (uap->num == 0) 660da59a31cSDavid Greenman return (EINVAL); 6610ad5e7f3SJeff Roberson mtx_lock_spin(&dt_lock); 6620ad5e7f3SJeff Roberson if ((pldt = mdp->md_ldt) == NULL || 6630ad5e7f3SJeff Roberson uap->start >= pldt->ldt_len) { 6640ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 665dae8d52dSDavid Xu return (0); 666dae8d52dSDavid Xu } 667dae8d52dSDavid Xu largest_ld = uap->start + uap->num; 668dae8d52dSDavid Xu if (largest_ld > pldt->ldt_len) 669dae8d52dSDavid Xu largest_ld = pldt->ldt_len; 670dae8d52dSDavid Xu i = largest_ld - uap->start; 671dae8d52dSDavid Xu bzero(&((union descriptor *)(pldt->ldt_base))[uap->start], 672dae8d52dSDavid Xu sizeof(union descriptor) * i); 6730ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 674dae8d52dSDavid Xu return (0); 675dae8d52dSDavid Xu } 676dae8d52dSDavid Xu 6775774db75SJulian Elischer if (!(uap->start == LDT_AUTO_ALLOC && uap->num == 1)) { 678dae8d52dSDavid Xu /* verify range of descriptors to modify */ 679dae8d52dSDavid Xu largest_ld = uap->start + uap->num; 6806bd823f3SJohn Baldwin if (uap->start >= MAX_LD || largest_ld > MAX_LD) { 681dae8d52dSDavid Xu return (EINVAL); 682dae8d52dSDavid Xu } 683da59a31cSDavid Greenman } 684da59a31cSDavid Greenman 685da59a31cSDavid Greenman /* Check descriptors for access violations */ 686dae8d52dSDavid Xu for (i = 0; i < uap->num; i++) { 6878eb8107bSPeter Wemm dp = &descs[i]; 688da59a31cSDavid Greenman 6898eb8107bSPeter Wemm switch (dp->sd.sd_type) { 6900dbf6d73SJordan K. Hubbard case SDT_SYSNULL: /* system null */ 6918eb8107bSPeter Wemm dp->sd.sd_p = 0; 6920dbf6d73SJordan K. Hubbard break; 6930dbf6d73SJordan K. Hubbard case SDT_SYS286TSS: /* system 286 TSS available */ 6940dbf6d73SJordan K. Hubbard case SDT_SYSLDT: /* system local descriptor table */ 6950dbf6d73SJordan K. Hubbard case SDT_SYS286BSY: /* system 286 TSS busy */ 6960dbf6d73SJordan K. Hubbard case SDT_SYSTASKGT: /* system task gate */ 6970dbf6d73SJordan K. Hubbard case SDT_SYS286IGT: /* system 286 interrupt gate */ 6980dbf6d73SJordan K. Hubbard case SDT_SYS286TGT: /* system 286 trap gate */ 6990dbf6d73SJordan K. Hubbard case SDT_SYSNULL2: /* undefined by Intel */ 7000dbf6d73SJordan K. Hubbard case SDT_SYS386TSS: /* system 386 TSS available */ 7010dbf6d73SJordan K. Hubbard case SDT_SYSNULL3: /* undefined by Intel */ 7020dbf6d73SJordan K. Hubbard case SDT_SYS386BSY: /* system 386 TSS busy */ 7030dbf6d73SJordan K. Hubbard case SDT_SYSNULL4: /* undefined by Intel */ 7040dbf6d73SJordan K. Hubbard case SDT_SYS386IGT: /* system 386 interrupt gate */ 7050dbf6d73SJordan K. Hubbard case SDT_SYS386TGT: /* system 386 trap gate */ 7060dbf6d73SJordan K. Hubbard case SDT_SYS286CGT: /* system 286 call gate */ 7070dbf6d73SJordan K. Hubbard case SDT_SYS386CGT: /* system 386 call gate */ 7080dbf6d73SJordan K. Hubbard /* I can't think of any reason to allow a user proc 7090dbf6d73SJordan K. Hubbard * to create a segment of these types. They are 7100dbf6d73SJordan K. Hubbard * for OS use only. 7110dbf6d73SJordan K. Hubbard */ 712dae8d52dSDavid Xu return (EACCES); 713df4d012bSJohn Baldwin /*NOTREACHED*/ 714da59a31cSDavid Greenman 7150dbf6d73SJordan K. Hubbard /* memory segment types */ 7160dbf6d73SJordan K. Hubbard case SDT_MEMEC: /* memory execute only conforming */ 7170dbf6d73SJordan K. Hubbard case SDT_MEMEAC: /* memory execute only accessed conforming */ 7180dbf6d73SJordan K. Hubbard case SDT_MEMERC: /* memory execute read conforming */ 7190dbf6d73SJordan K. Hubbard case SDT_MEMERAC: /* memory execute read accessed conforming */ 7200dbf6d73SJordan K. Hubbard /* Must be "present" if executable and conforming. */ 72184569dffSMaxim Sobolev if (dp->sd.sd_p == 0) 722da59a31cSDavid Greenman return (EACCES); 723da59a31cSDavid Greenman break; 7240dbf6d73SJordan K. Hubbard case SDT_MEMRO: /* memory read only */ 7250dbf6d73SJordan K. Hubbard case SDT_MEMROA: /* memory read only accessed */ 7260dbf6d73SJordan K. Hubbard case SDT_MEMRW: /* memory read write */ 7270dbf6d73SJordan K. Hubbard case SDT_MEMRWA: /* memory read write accessed */ 7280dbf6d73SJordan K. Hubbard case SDT_MEMROD: /* memory read only expand dwn limit */ 7290dbf6d73SJordan K. Hubbard case SDT_MEMRODA: /* memory read only expand dwn lim accessed */ 7300dbf6d73SJordan K. Hubbard case SDT_MEMRWD: /* memory read write expand dwn limit */ 7310dbf6d73SJordan K. Hubbard case SDT_MEMRWDA: /* memory read write expand dwn lim acessed */ 7320dbf6d73SJordan K. Hubbard case SDT_MEME: /* memory execute only */ 7330dbf6d73SJordan K. Hubbard case SDT_MEMEA: /* memory execute only accessed */ 7340dbf6d73SJordan K. Hubbard case SDT_MEMER: /* memory execute read */ 7350dbf6d73SJordan K. Hubbard case SDT_MEMERA: /* memory execute read accessed */ 736da59a31cSDavid Greenman break; 737da59a31cSDavid Greenman default: 7380dbf6d73SJordan K. Hubbard return(EINVAL); 739da59a31cSDavid Greenman /*NOTREACHED*/ 740da59a31cSDavid Greenman } 7410dbf6d73SJordan K. Hubbard 7420dbf6d73SJordan K. Hubbard /* Only user (ring-3) descriptors may be present. */ 74384569dffSMaxim Sobolev if ((dp->sd.sd_p != 0) && (dp->sd.sd_dpl != SEL_UPL)) 7440dbf6d73SJordan K. Hubbard return (EACCES); 745da59a31cSDavid Greenman } 746da59a31cSDavid Greenman 7475774db75SJulian Elischer if (uap->start == LDT_AUTO_ALLOC && uap->num == 1) { 748dae8d52dSDavid Xu /* Allocate a free slot */ 7490ad5e7f3SJeff Roberson mtx_lock_spin(&dt_lock); 7500ad5e7f3SJeff Roberson if ((pldt = mdp->md_ldt) == NULL) { 7510ad5e7f3SJeff Roberson if ((error = i386_ldt_grow(td, NLDT + 1))) { 7520ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 753dae8d52dSDavid Xu return (error); 7540ad5e7f3SJeff Roberson } 755dae8d52dSDavid Xu pldt = mdp->md_ldt; 756dae8d52dSDavid Xu } 757dae8d52dSDavid Xu again: 758f09fc81cSJulian Elischer /* 759f09fc81cSJulian Elischer * start scanning a bit up to leave room for NVidia and 760f09fc81cSJulian Elischer * Wine, which still user the "Blat" method of allocation. 761f09fc81cSJulian Elischer */ 7625774db75SJulian Elischer dp = &((union descriptor *)(pldt->ldt_base))[NLDT]; 763e4e2c613SJulian Elischer for (i = NLDT; i < pldt->ldt_len; ++i) { 764dae8d52dSDavid Xu if (dp->sd.sd_type == SDT_SYSNULL) 765dae8d52dSDavid Xu break; 766dae8d52dSDavid Xu dp++; 767dae8d52dSDavid Xu } 768dae8d52dSDavid Xu if (i >= pldt->ldt_len) { 7690ad5e7f3SJeff Roberson if ((error = i386_ldt_grow(td, pldt->ldt_len+1))) { 7700ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 771dae8d52dSDavid Xu return (error); 7720ad5e7f3SJeff Roberson } 773dae8d52dSDavid Xu goto again; 774dae8d52dSDavid Xu } 775dae8d52dSDavid Xu uap->start = i; 776dae8d52dSDavid Xu error = i386_set_ldt_data(td, i, 1, descs); 7770ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 778dae8d52dSDavid Xu } else { 779dae8d52dSDavid Xu largest_ld = uap->start + uap->num; 7800ad5e7f3SJeff Roberson mtx_lock_spin(&dt_lock); 7810ad5e7f3SJeff Roberson if (!(error = i386_ldt_grow(td, largest_ld))) { 782dae8d52dSDavid Xu error = i386_set_ldt_data(td, uap->start, uap->num, 783dae8d52dSDavid Xu descs); 784dae8d52dSDavid Xu } 7850ad5e7f3SJeff Roberson mtx_unlock_spin(&dt_lock); 786dae8d52dSDavid Xu } 787dae8d52dSDavid Xu if (error == 0) 788dae8d52dSDavid Xu td->td_retval[0] = uap->start; 789dae8d52dSDavid Xu return (error); 790dae8d52dSDavid Xu } 79193ee134aSKip Macy #ifdef XEN 792dae8d52dSDavid Xu static int 793dae8d52dSDavid Xu i386_set_ldt_data(struct thread *td, int start, int num, 794dae8d52dSDavid Xu union descriptor *descs) 795dae8d52dSDavid Xu { 796dae8d52dSDavid Xu struct mdproc *mdp = &td->td_proc->p_md; 797dae8d52dSDavid Xu struct proc_ldt *pldt = mdp->md_ldt; 798dae8d52dSDavid Xu 7990ad5e7f3SJeff Roberson mtx_assert(&dt_lock, MA_OWNED); 800dae8d52dSDavid Xu 801698cc19dSColin Percival while (num) { 802698cc19dSColin Percival xen_update_descriptor( 803dae8d52dSDavid Xu &((union descriptor *)(pldt->ldt_base))[start], 804698cc19dSColin Percival descs); 805698cc19dSColin Percival num--; 806698cc19dSColin Percival start++; 807698cc19dSColin Percival descs++; 808698cc19dSColin Percival } 809dae8d52dSDavid Xu return (0); 810dae8d52dSDavid Xu } 81193ee134aSKip Macy #else 81293ee134aSKip Macy static int 81393ee134aSKip Macy i386_set_ldt_data(struct thread *td, int start, int num, 81493ee134aSKip Macy union descriptor *descs) 81593ee134aSKip Macy { 81693ee134aSKip Macy struct mdproc *mdp = &td->td_proc->p_md; 81793ee134aSKip Macy struct proc_ldt *pldt = mdp->md_ldt; 81893ee134aSKip Macy 81993ee134aSKip Macy mtx_assert(&dt_lock, MA_OWNED); 82093ee134aSKip Macy 82193ee134aSKip Macy /* Fill in range */ 82293ee134aSKip Macy bcopy(descs, 82393ee134aSKip Macy &((union descriptor *)(pldt->ldt_base))[start], 82493ee134aSKip Macy num * sizeof(union descriptor)); 82593ee134aSKip Macy return (0); 82693ee134aSKip Macy } 82793ee134aSKip Macy #endif /* !XEN */ 828dae8d52dSDavid Xu 829dae8d52dSDavid Xu static int 830dae8d52dSDavid Xu i386_ldt_grow(struct thread *td, int len) 831dae8d52dSDavid Xu { 832dae8d52dSDavid Xu struct mdproc *mdp = &td->td_proc->p_md; 83305dfa22fSAttilio Rao struct proc_ldt *new_ldt, *pldt; 83405dfa22fSAttilio Rao caddr_t old_ldt_base = NULL_LDT_BASE; 83505dfa22fSAttilio Rao int old_ldt_len = 0; 836dae8d52dSDavid Xu 8370ad5e7f3SJeff Roberson mtx_assert(&dt_lock, MA_OWNED); 8380ad5e7f3SJeff Roberson 839dae8d52dSDavid Xu if (len > MAX_LD) 840dae8d52dSDavid Xu return (ENOMEM); 841dae8d52dSDavid Xu if (len < NLDT + 1) 842dae8d52dSDavid Xu len = NLDT + 1; 843bc2e774aSJohn Baldwin 844bc2e774aSJohn Baldwin /* Allocate a user ldt. */ 84502b0a160SAttilio Rao if ((pldt = mdp->md_ldt) == NULL || len > pldt->ldt_len) { 846bc2e774aSJohn Baldwin new_ldt = user_ldt_alloc(mdp, len); 847dae8d52dSDavid Xu if (new_ldt == NULL) 848dae8d52dSDavid Xu return (ENOMEM); 849dae8d52dSDavid Xu pldt = mdp->md_ldt; 850bc2e774aSJohn Baldwin 8510ad5e7f3SJeff Roberson if (pldt != NULL) { 85205dfa22fSAttilio Rao if (new_ldt->ldt_len <= pldt->ldt_len) { 853dae8d52dSDavid Xu /* 85405dfa22fSAttilio Rao * We just lost the race for allocation, so 85505dfa22fSAttilio Rao * free the new object and return. 856dae8d52dSDavid Xu */ 85702b0a160SAttilio Rao mtx_unlock_spin(&dt_lock); 8585df87b21SJeff Roberson kmem_free(kernel_arena, 859dae8d52dSDavid Xu (vm_offset_t)new_ldt->ldt_base, 860dae8d52dSDavid Xu new_ldt->ldt_len * sizeof(union descriptor)); 8611ede983cSDag-Erling Smørgrav free(new_ldt, M_SUBPROC); 86202b0a160SAttilio Rao mtx_lock_spin(&dt_lock); 863dae8d52dSDavid Xu return (0); 864dae8d52dSDavid Xu } 86505dfa22fSAttilio Rao 86605dfa22fSAttilio Rao /* 86705dfa22fSAttilio Rao * We have to substitute the current LDT entry for 86805dfa22fSAttilio Rao * curproc with the new one since its size grew. 86905dfa22fSAttilio Rao */ 87005dfa22fSAttilio Rao old_ldt_base = pldt->ldt_base; 87105dfa22fSAttilio Rao old_ldt_len = pldt->ldt_len; 87205dfa22fSAttilio Rao pldt->ldt_sd = new_ldt->ldt_sd; 87305dfa22fSAttilio Rao pldt->ldt_base = new_ldt->ldt_base; 87405dfa22fSAttilio Rao pldt->ldt_len = new_ldt->ldt_len; 8750ad5e7f3SJeff Roberson } else 876dae8d52dSDavid Xu mdp->md_ldt = pldt = new_ldt; 877dae8d52dSDavid Xu #ifdef SMP 87802b0a160SAttilio Rao /* 87902b0a160SAttilio Rao * Signal other cpus to reload ldt. We need to unlock dt_lock 88002b0a160SAttilio Rao * here because other CPU will contest on it since their 88102b0a160SAttilio Rao * curthreads won't hold the lock and will block when trying 88202b0a160SAttilio Rao * to acquire it. 88302b0a160SAttilio Rao */ 88402b0a160SAttilio Rao mtx_unlock_spin(&dt_lock); 885dae8d52dSDavid Xu smp_rendezvous(NULL, (void (*)(void *))set_user_ldt_rv, 88605dfa22fSAttilio Rao NULL, td->td_proc->p_vmspace); 887dae8d52dSDavid Xu #else 888ea11c140SAttilio Rao set_user_ldt(&td->td_proc->p_md); 88905dfa22fSAttilio Rao mtx_unlock_spin(&dt_lock); 890dae8d52dSDavid Xu #endif 89105dfa22fSAttilio Rao if (old_ldt_base != NULL_LDT_BASE) { 8925df87b21SJeff Roberson kmem_free(kernel_arena, (vm_offset_t)old_ldt_base, 89305dfa22fSAttilio Rao old_ldt_len * sizeof(union descriptor)); 8941ede983cSDag-Erling Smørgrav free(new_ldt, M_SUBPROC); 89505dfa22fSAttilio Rao } 89605dfa22fSAttilio Rao mtx_lock_spin(&dt_lock); 897dae8d52dSDavid Xu } 8988eb8107bSPeter Wemm return (0); 899da59a31cSDavid Greenman } 900