1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 2011 NetApp, Inc.
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY NETAPP, INC ``AS IS'' AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19  * ARE DISCLAIMED.  IN NO EVENT SHALL NETAPP, INC OR CONTRIBUTORS BE LIABLE
20  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26  * SUCH DAMAGE.
27  *
28  * $FreeBSD$
29  */
30 /*
31  * This file and its contents are supplied under the terms of the
32  * Common Development and Distribution License ("CDDL"), version 1.0.
33  * You may only use this file in accordance with the terms of version
34  * 1.0 of the CDDL.
35  *
36  * A full copy of the text of the CDDL should have accompanied this
37  * source.  A copy of the CDDL is also available via the Internet at
38  * http://www.illumos.org/license/CDDL.
39  *
40  * Copyright 2015 Pluribus Networks Inc.
41  * Copyright 2019 Joyent, Inc.
42  * Copyright 2021 Oxide Computer Company
43  */
44 
45 #ifndef _VMMAPI_H_
46 #define	_VMMAPI_H_
47 
48 #include <sys/param.h>
49 #include <sys/cpuset.h>
50 #include <x86/segments.h>
51 
52 #include <stdbool.h>
53 
/*
 * API version, provided so that out-of-tree consumers (grub-bhyve, for
 * example) can make compile time decisions.
 *
 * The literal is laid out as a 2 digit major followed by a 2 digit minor.
 * NOTE: because of the leading zero, C parses 0103 as an octal constant, so
 * the macro evaluates to 67 decimal.  Respelling it in decimal would change
 * the value that existing consumers compare against.
 */
#define	VMMAPI_VERSION	0103
59 
/*
 * Types that the prototypes below refer to by name only; this header does
 * not define them.
 */
struct vmctx;
struct iovec;
enum x2apic_state;
63 
/*
 * How the memory assigned to a VM is mapped into the address space of the
 * controlling process.
 */
enum vm_mmap_style {
	VM_MMAP_NONE = 0,	/* not mapped */
	VM_MMAP_ALL = 1,	/* mapped fully and statically */
	VM_MMAP_SPARSE = 2,	/* mapped on demand */
};
73 
/*
 * Bits for the 'flags' argument of vm_set_memflags().
 */
/* Include guest memory in core file. */
#define	VM_MEM_F_INCORE	0x01
/* Guest memory is wired. */
#define	VM_MEM_F_WIRED	0x02
79 
/*
 * Memory segment identifiers.
 *
 * System memory comes first: on FreeBSD builds that is the single VM_SYSMEM
 * identifier (the one vm_setup_memory() uses for the system memory segment);
 * other builds define VM_LOWMEM and VM_HIGHMEM in its place (presumably the
 * system memory segments there -- confirm against the implementation).
 *
 * Every identifier after those can be used to create devmem segments.
 * Note that the numeric value of the devmem identifiers differs between the
 * two build flavours because of the extra leading entry.
 */
enum {
#ifdef __FreeBSD__
	VM_SYSMEM,
#else
	VM_LOWMEM,
	VM_HIGHMEM,
#endif
	VM_BOOTROM,
	VM_FRAMEBUFFER,
	VM_PCIROM,
};
96 
/*
 * Get the length and name of the memory segment identified by 'ident'.
 * Note that system memory segments are identified with a nul name.
 *
 * 'lenp' and 'name'/'namesiz' are the output locations for the length and
 * the name respectively (as suggested by the parameter names; the
 * implementation is not part of this header).
 *
 * Returns 0 on success and non-zero otherwise.
 */
int	vm_get_memseg(struct vmctx *ctx, int ident, size_t *lenp, char *name,
	    size_t namesiz);
105 
106 /*
107  * Iterate over the guest address space. This function finds an address range
108  * that starts at an address >= *gpa.
109  *
110  * Returns 0 if the next address range was found and non-zero otherwise.
111  */
112 int	vm_mmap_getnext(struct vmctx *ctx, vm_paddr_t *gpa, int *segid,
113 	    vm_ooffset_t *segoff, size_t *len, int *prot, int *flags);
/*
 * Create the device memory segment identified by 'segid'.
 *
 * On success the return value points to the memory segment; on failure it
 * is MAP_FAILED.
 */
void	*vm_create_devmem(struct vmctx *ctx, int segid,
	    const char *name, size_t len);
121 
#ifndef __FreeBSD__
/*
 * Look up the map offset of the device memory segment 'segid'.  The offset
 * is presumably stored through 'mapoff' (TODO confirm); only available on
 * non-FreeBSD builds.
 */
int	vm_get_devmem_offset(struct vmctx *ctx, int segid,
	    off_t *mapoff);
#endif
128 
129 /*
130  * Map the memory segment identified by 'segid' into the guest address space
131  * at [gpa,gpa+len) with protection 'prot'.
132  */
133 int	vm_mmap_memseg(struct vmctx *ctx, vm_paddr_t gpa, int segid,
134 	    vm_ooffset_t segoff, size_t len, int prot);
135 
136 int	vm_munmap_memseg(struct vmctx *ctx, vm_paddr_t gpa, size_t len);
137 
/*
 * vm_create() takes an additional 'flags' argument on non-FreeBSD builds.
 */
#ifdef __FreeBSD__
int	vm_create(const char *name);
#else /* !__FreeBSD__ */
int	vm_create(const char *name, uint64_t flags);
#endif /* __FreeBSD__ */
/*
 * Handle management.  vm_open() yields the 'struct vmctx' handle that the
 * rest of this API takes as its first argument.  vm_close() is declared on
 * non-FreeBSD builds only.
 */
struct vmctx *vm_open(const char *name);
int	vm_get_device_fd(struct vmctx *ctx);
#ifndef __FreeBSD__
void	vm_close(struct vmctx *ctx);
#endif
void	vm_destroy(struct vmctx *ctx);
149 int	vm_parse_memsize(const char *optarg, size_t *memsize);
150 int	vm_setup_memory(struct vmctx *ctx, size_t len, enum vm_mmap_style s);
151 void	*vm_map_gpa(struct vmctx *ctx, vm_paddr_t gaddr, size_t len);
/*
 * Guest address translation helpers.  Going by the names, 'gla' is a guest
 * linear address and 'gpa' a guest physical address; the exact meaning of
 * 'fault' and of the "_nofault" variant is defined by the implementation,
 * which is not part of this header.
 *
 * The context parameter is named 'ctx' here to match every other prototype
 * in this file.
 */
int	vm_get_gpa_pmap(struct vmctx *ctx, uint64_t gpa, uint64_t *pte,
	    int *num);
int	vm_gla2gpa(struct vmctx *ctx, int vcpuid,
	    struct vm_guest_paging *paging, uint64_t gla, int prot,
	    uint64_t *gpa, int *fault);
int	vm_gla2gpa_nofault(struct vmctx *ctx, int vcpuid,
	    struct vm_guest_paging *paging, uint64_t gla, int prot,
	    uint64_t *gpa, int *fault);
/*
 * Accessors for the low memory limit, the memory flags (VM_MEM_F_* bits,
 * per the comment on those macros) and the low/high memory sizes.
 */
void	vm_set_lowmem_limit(struct vmctx *ctx, uint32_t limit);
uint32_t vm_get_lowmem_limit(struct vmctx *ctx);
void	vm_set_memflags(struct vmctx *ctx, int flags);
int	vm_get_memflags(struct vmctx *ctx);
size_t	vm_get_lowmem_size(struct vmctx *ctx);
size_t	vm_get_highmem_size(struct vmctx *ctx);
/*
 * Descriptor access for register 'reg' of 'vcpu': either as separate
 * base/limit/access values or as a whole 'struct seg_desc'.
 */
int	vm_set_desc(struct vmctx *ctx, int vcpu, int reg,
	    uint64_t base, uint32_t limit, uint32_t access);
int	vm_get_desc(struct vmctx *ctx, int vcpu, int reg,
	    uint64_t *base, uint32_t *limit, uint32_t *access);
int	vm_get_seg_desc(struct vmctx *ctx, int vcpu, int reg,
	    struct seg_desc *seg_desc);
/*
 * Register access for 'vcpu', one register at a time or as a set.  For the
 * "_set" variants 'regnums' and 'regvals' are presumably parallel arrays of
 * 'count' entries (TODO confirm against the implementation).
 */
int	vm_set_register(struct vmctx *ctx, int vcpu, int reg,
	    uint64_t val);
int	vm_get_register(struct vmctx *ctx, int vcpu, int reg,
	    uint64_t *retval);
int	vm_set_register_set(struct vmctx *ctx, int vcpu,
	    unsigned int count, const int *regnums, uint64_t *regvals);
int	vm_get_register_set(struct vmctx *ctx, int vcpu,
	    unsigned int count, const int *regnums, uint64_t *regvals);
/*
 * Run, suspend and reinitialize.  vm_reinit() takes an extra (unnamed)
 * uint64_t argument on non-FreeBSD builds.
 */
int	vm_run(struct vmctx *ctx, int vcpu,
	    const struct vm_entry *vm_entry, struct vm_exit *vm_exit);
int	vm_suspend(struct vmctx *ctx, enum vm_suspend_how how);
#ifdef __FreeBSD__
int	vm_reinit(struct vmctx *ctx);
#else
int	vm_reinit(struct vmctx *ctx, uint64_t);
#endif
/* APIC id lookup and exception injection for a vcpu. */
int	vm_apicid2vcpu(struct vmctx *ctx, int apicid);
int	vm_inject_exception(struct vmctx *ctx, int vcpu,
	    int vector, int errcode_valid, uint32_t errcode,
	    int restart_instruction);
187 #ifndef __FreeBSD__
/*
 * Inject the fault 'vector' into 'vcpu'.  'errcode_valid' and 'errcode' are
 * passed through by the inline wrappers below; unlike vm_inject_exception()
 * this function reports no status to the caller.
 */
void	vm_inject_fault(struct vmctx *ctx, int vcpu, int vector,
	    int errcode_valid, int errcode);
190 
191 static __inline void
192 vm_inject_gp(struct vmctx *ctx, int vcpuid)
193 {
194 	vm_inject_fault(ctx, vcpuid, IDT_GP, 1, 0);
195 }
196 
197 static __inline void
198 vm_inject_ac(struct vmctx *ctx, int vcpuid, int errcode)
199 {
200 	vm_inject_fault(ctx, vcpuid, IDT_AC, 1, errcode);
201 }
202 static __inline void
203 vm_inject_ss(struct vmctx *ctx, int vcpuid, int errcode)
204 {
205 	vm_inject_fault(ctx, vcpuid, IDT_SS, 1, errcode);
206 }
207 #endif
/* Local APIC interrupt delivery. */
int	vm_lapic_irq(struct vmctx *ctx, int vcpu, int vector);
int	vm_lapic_local_irq(struct vmctx *ctx, int vcpu, int vector);
int	vm_lapic_msi(struct vmctx *ctx, uint64_t addr, uint64_t msg);

/* I/O APIC pin control; the pin count is stored through 'pincount'. */
int	vm_ioapic_assert_irq(struct vmctx *ctx, int irq);
int	vm_ioapic_deassert_irq(struct vmctx *ctx, int irq);
int	vm_ioapic_pulse_irq(struct vmctx *ctx, int irq);
int	vm_ioapic_pincount(struct vmctx *ctx, int *pincount);
215 int	vm_readwrite_kernemu_device(struct vmctx *ctx, int vcpu,
216 	    vm_paddr_t gpa, bool write, int size, uint64_t *value);
/*
 * ISA interrupt control.  The assert/deassert/pulse calls take both an
 * atpic and an ioapic irq number.
 */
int	vm_isa_assert_irq(struct vmctx *ctx, int atpic_irq,
	    int ioapic_irq);
int	vm_isa_deassert_irq(struct vmctx *ctx, int atpic_irq,
	    int ioapic_irq);
int	vm_isa_pulse_irq(struct vmctx *ctx, int atpic_irq,
	    int ioapic_irq);
int	vm_isa_set_irq_trigger(struct vmctx *ctx, int atpic_irq,
	    enum vm_intr_trigger trigger);
/* NMI injection. */
int	vm_inject_nmi(struct vmctx *ctx, int vcpu);

/*
 * Capabilities: conversion between capability names and types, and per-vcpu
 * get/set of a capability value.
 */
int	vm_capability_name2type(const char *capname);
const char *vm_capability_type2name(int type);
int	vm_get_capability(struct vmctx *ctx, int vcpu,
	    enum vm_cap_type cap, int *retval);
int	vm_set_capability(struct vmctx *ctx, int vcpu,
	    enum vm_cap_type cap, int val);
229 #ifdef __FreeBSD__
230 int	vm_assign_pptdev(struct vmctx *ctx, int bus, int slot, int func);
231 int	vm_unassign_pptdev(struct vmctx *ctx, int bus, int slot, int func);
232 int	vm_map_pptdev_mmio(struct vmctx *ctx, int bus, int slot, int func,
233 			   vm_paddr_t gpa, size_t len, vm_paddr_t hpa);
234 int	vm_unmap_pptdev_mmio(struct vmctx *ctx, int bus, int slot, int func,
235 			     vm_paddr_t gpa, size_t len);
236 int	vm_setup_pptdev_msi(struct vmctx *ctx, int vcpu, int bus, int slot,
237 	    int func, uint64_t addr, uint64_t msg, int numvec);
238 int	vm_setup_pptdev_msix(struct vmctx *ctx, int vcpu, int bus, int slot,
239 	    int func, int idx, uint64_t addr, uint64_t msg,
240 	    uint32_t vector_control);
241 int	vm_disable_pptdev_msix(struct vmctx *ctx, int bus, int slot, int func);
242 int	vm_get_pptdev_limits(struct vmctx *ctx, int bus, int slot, int func,
243     int *msi_limit, int *msix_limit);
244 #else /* __FreeBSD__ */
245 int	vm_assign_pptdev(struct vmctx *ctx, int pptfd);
246 int	vm_unassign_pptdev(struct vmctx *ctx, int pptfd);
247 int	vm_map_pptdev_mmio(struct vmctx *ctx, int pptfd, vm_paddr_t gpa,
248     size_t len, vm_paddr_t hpa);
249 int	vm_unmap_pptdev_mmio(struct vmctx *ctx, int pptfd, vm_paddr_t gpa,
250     size_t len);
251 int	vm_setup_pptdev_msi(struct vmctx *ctx, int vcpu, int pptfd,
252     uint64_t addr, uint64_t msg, int numvec);
253 int	vm_setup_pptdev_msix(struct vmctx *ctx, int vcpu, int pptfd,
254     int idx, uint64_t addr, uint64_t msg, uint32_t vector_control);
255 int	vm_disable_pptdev_msix(struct vmctx *ctx, int pptfd);
256 int	vm_get_pptdev_limits(struct vmctx *ctx, int pptfd, int *msi_limit,
257     int *msix_limit);
258 #endif /* __FreeBSD__ */
259 
/*
 * Interrupt info for 'vcpu': the getter stores two values through 'i1' and
 * 'i2', the setter takes a single exit_intinfo value.
 */
int	vm_get_intinfo(struct vmctx *ctx, int vcpu,
	    uint64_t *i1, uint64_t *i2);
int	vm_set_intinfo(struct vmctx *ctx, int vcpu,
	    uint64_t exit_intinfo);
262 
#ifdef __FreeBSD__
/*
 * FreeBSD only.  Returns a pointer to const cap_ioctl_t; 'len' presumably
 * receives the number of entries (TODO confirm).
 */
const cap_ioctl_t *vm_get_ioctls(size_t *len);
#endif
266 
/*
 * vm_get_stats() returns a pointer to the statistics buffer.
 * Note that this is not MT-safe.
 *
 * vm_get_stat_desc() returns a string for the statistic at 'index'.
 */
uint64_t *vm_get_stats(struct vmctx *ctx, int vcpu,
	    struct timeval *ret_tv, int *ret_entries);
const char *vm_get_stat_desc(struct vmctx *ctx, int index);
273 
/* Per-vcpu x2apic state. */
int	vm_get_x2apic_state(struct vmctx *ctx, int vcpu,
	    enum x2apic_state *s);
int	vm_set_x2apic_state(struct vmctx *ctx, int vcpu,
	    enum x2apic_state s);

/* HPET capabilities, stored through 'capabilities'. */
int	vm_get_hpet_capabilities(struct vmctx *ctx,
	    uint32_t *capabilities);
278 
/*
 * vm_copy_setup() translates the GLA range [gla,gla+len) into GPA segments,
 * which are placed in 'iov'.  'iovcnt' should be big enough to accommodate
 * all GPA segments.
 *
 * Interpreting the result of vm_copy_setup():
 *
 *   return value   *fault   meaning
 *   ------------   ------   ---------------------------------------
 *   0              0        Success
 *   0              1        An exception was injected into the guest
 *   EFAULT         N/A      Error
 *
 * vm_copyin() and vm_copyout() move 'len' bytes between a host buffer and
 * a guest iovec; vm_copy_teardown() takes the same iov/iovcnt pair as
 * vm_copy_setup().
 */
int	vm_copy_setup(struct vmctx *ctx, int vcpu,
	    struct vm_guest_paging *pg, uint64_t gla, size_t len, int prot,
	    struct iovec *iov, int iovcnt, int *fault);
void	vm_copyin(struct vmctx *ctx, int vcpu,
	    struct iovec *guest_iov, void *host_dst, size_t len);
void	vm_copyout(struct vmctx *ctx, int vcpu,
	    const void *host_src, struct iovec *guest_iov, size_t len);
void	vm_copy_teardown(struct vmctx *ctx, int vcpu,
	    struct iovec *iov, int iovcnt);
297 
/*
 * RTC: byte access at 'offset', and get/set of the time as a time_t.
 */
int	vm_rtc_read(struct vmctx *ctx, int offset, uint8_t *retval);
int	vm_rtc_write(struct vmctx *ctx, int offset, uint8_t value);
int	vm_rtc_gettime(struct vmctx *ctx, time_t *secs);
int	vm_rtc_settime(struct vmctx *ctx, time_t secs);
303 
/*
 * Reset the register state of 'vcpu'.
 */
int	vcpu_reset(struct vmctx *ctx, int vcpu);
306 
307 int	vm_active_cpus(struct vmctx *ctx, cpuset_t *cpus);
308 int	vm_suspended_cpus(struct vmctx *ctx, cpuset_t *cpus);
309 int	vm_debug_cpus(struct vmctx *ctx, cpuset_t *cpus);
310 int	vm_activate_cpu(struct vmctx *ctx, int vcpu);
311 int	vm_suspend_cpu(struct vmctx *ctx, int vcpu);
312 int	vm_resume_cpu(struct vmctx *ctx, int vcpu);
313 
/*
 * CPU topology, expressed as sockets / cores / threads / maxcpus.
 */
int	vm_set_topology(struct vmctx *ctx,
	    uint16_t sockets, uint16_t cores, uint16_t threads,
	    uint16_t maxcpus);
int	vm_get_topology(struct vmctx *ctx,
	    uint16_t *sockets, uint16_t *cores, uint16_t *threads,
	    uint16_t *maxcpus);
319 
#ifndef	__FreeBSD__
/*
 * illumos-specific APIs
 */
int	vm_pmtmr_set_location(struct vmctx *ctx, uint16_t ioport);
int	vm_wrlock_cycle(struct vmctx *ctx);
int	vm_get_run_state(struct vmctx *ctx, int vcpu,
	    enum vcpu_run_state *state, uint8_t *sipi_vector);
int	vm_set_run_state(struct vmctx *ctx, int vcpu,
	    enum vcpu_run_state state, uint8_t sipi_vector);
#endif	/* !__FreeBSD__ */
329 
#ifdef	__FreeBSD__
/*
 * APIs declared on FreeBSD builds only: register setup from
 * rip/cr3/gdtbase/rsp (or eip/gdtbase/esp for the i386 variant), and GDT
 * setup through 'gdtr'.
 */
int	vm_setup_freebsd_registers(struct vmctx *ctx, int vcpu,
	    uint64_t rip, uint64_t cr3, uint64_t gdtbase, uint64_t rsp);
int	vm_setup_freebsd_registers_i386(struct vmctx *vmctx, int vcpu,
	    uint32_t eip, uint32_t gdtbase, uint32_t esp);
void	vm_setup_freebsd_gdt(uint64_t *gdtr);
#endif	/* __FreeBSD__ */
342 #endif	/* _VMMAPI_H_ */
343