1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 
22 /*
23  * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
24  * Use is subject to license terms.
25  */
26 
27 /*
28  * Copyright (c) 2013, Joyent, Inc. All rights reserved.
29  * Copyright (c) 2013 by Delphix. All rights reserved.
30  */
31 
32 #ifndef _SYS_DTRACE_H
33 #define	_SYS_DTRACE_H
34 
35 /* #pragma ident	"%Z%%M%	%I%	%E% SMI" */
36 
37 #ifdef	__cplusplus
38 extern "C" {
39 #endif
40 
41 /*
42  * DTrace Dynamic Tracing Software: Kernel Interfaces
43  *
44  * Note: The contents of this file are private to the implementation of the
45  * Solaris system and DTrace subsystem and are subject to change at any time
46  * without notice.  Applications and drivers using these interfaces will fail
47  * to run on future releases.  These interfaces should not be used for any
48  * purpose except those expressly outlined in dtrace(7D) and libdtrace(3LIB).
49  * Please refer to the "Solaris Dynamic Tracing Guide" for more information.
50  */
51 
52 #ifndef _ASM
53 
54 #include <sys/types.h>
55 #include <sys/modctl.h>
56 #include <sys/processor.h>
57 #ifdef illumos
58 #include <sys/systm.h>
59 #else
60 #include <sys/proc.h>
61 #include <sys/param.h>
62 #include <sys/linker.h>
63 #include <sys/ioccom.h>
64 #include <sys/ucred.h>
65 #include <sys/pset.h>
66 typedef int model_t;
67 #endif
68 #include <sys/ctf_api.h>
69 #ifdef illumos
70 #include <sys/cyclic.h>
71 #include <sys/int_limits.h>
72 #else
73 #include <sys/stdint.h>
74 #endif
75 
76 /*
77  * DTrace Universal Constants and Typedefs
78  */
/*
 * Sentinel values used throughout the DTrace kernel interfaces.
 *
 * The two negative sentinels are parenthesized so that each one expands to a
 * single primary expression no matter which operators surround the macro.
 */
#define	DTRACE_CPUALL		(-1)	/* all CPUs */
#define	DTRACE_ARGNONE		(-1)	/* invalid argument index */

/* Zero is the "invalid" value for every identifier kind below. */
#define	DTRACE_IDNONE		0	/* invalid probe identifier */
#define	DTRACE_EPIDNONE		0	/* invalid enabled probe identifier */
#define	DTRACE_AGGIDNONE	0	/* invalid aggregation identifier */
#define	DTRACE_AGGVARIDNONE	0	/* invalid aggregation variable ID */
#define	DTRACE_CACHEIDNONE	0	/* invalid predicate cache */
#define	DTRACE_PROVNONE		0	/* invalid provider identifier */
#define	DTRACE_METAPROVNONE	0	/* invalid meta-provider identifier */
88 
/*
 * Length limits for the pieces of a probe description, and for an argument
 * type string.
 */
#define	DTRACE_PROVNAMELEN	64	/* provider name */
#define	DTRACE_MODNAMELEN	64	/* module name */
#define	DTRACE_FUNCNAMELEN	128	/* function name */
#define	DTRACE_NAMELEN		64	/* probe name */
#define	DTRACE_ARGTYPELEN	128	/* argument type string */

/*
 * Room for all four name components plus four extra bytes (presumably the
 * separators and terminator of a fully-qualified name -- confirm with users).
 */
#define	DTRACE_FULLNAMELEN	(4 + DTRACE_NAMELEN + DTRACE_FUNCNAMELEN + \
				DTRACE_MODNAMELEN + DTRACE_PROVNAMELEN)
96 
/* 32-bit unsigned identifiers. */
typedef uint32_t dtrace_id_t;		/* identifies a probe */
typedef uint32_t dtrace_epid_t;		/* identifies an enabled probe */
typedef uint32_t dtrace_aggid_t;	/* identifies an aggregation */
typedef uint32_t dtrace_cacheid_t;	/* identifies a predicate cache */

/* 64-bit signed quantities. */
typedef int64_t dtrace_aggvarid_t;	/* identifies an aggregation variable */
typedef int64_t dtrace_optval_t;	/* value of an option */

/* 16-bit action kind. */
typedef uint16_t dtrace_actkind_t;
104 
/*
 * Selects one component of a probe specification.  The real components are
 * numbered from zero in provider, module, function, name order; -1 means
 * "none".
 */
enum dtrace_probespec {
	DTRACE_PROBESPEC_NONE = -1,
	DTRACE_PROBESPEC_PROVIDER = 0,
	DTRACE_PROBESPEC_MOD = 1,
	DTRACE_PROBESPEC_FUNC = 2,
	DTRACE_PROBESPEC_NAME = 3
};

typedef enum dtrace_probespec dtrace_probespec_t;
112 
113 /*
114  * DTrace Intermediate Format (DIF)
115  *
116  * The following definitions describe the DTrace Intermediate Format (DIF),
117  * a RISC-like instruction set and program encoding used to represent
118  * predicates and actions that can be bound to DTrace probes.  The constants
119  * below defining the number of available registers are suggested minimums; the
120  * compiler should use DTRACEIOC_CONF to dynamically obtain the number of
121  * registers provided by the current DTrace implementation.
122  */
/* DIF instruction set versions; DIF_VERSION always names the latest one. */
#define	DIF_VERSION_1	1		/* Solaris 10 Beta */
#define	DIF_VERSION_2	2		/* Solaris 10 FCS */
#define	DIF_VERSION	DIF_VERSION_2

/* Register file sizes. */
#define	DIF_DIR_NREGS	8		/* integer registers */
#define	DIF_DTR_NREGS	8		/* tuple registers */
128 
/*
 * DIF opcodes.  Values are assigned sequentially starting at 1; the comment
 * on each line gives the assembler syntax of the instruction.
 */

/* Logic, shifts and arithmetic (see also DIF_OP_SRA below). */
#define	DIF_OP_OR	1		/* or	r1, r2, rd */
#define	DIF_OP_XOR	2		/* xor	r1, r2, rd */
#define	DIF_OP_AND	3		/* and	r1, r2, rd */
#define	DIF_OP_SLL	4		/* sll	r1, r2, rd */
#define	DIF_OP_SRL	5		/* srl	r1, r2, rd */
#define	DIF_OP_SUB	6		/* sub	r1, r2, rd */
#define	DIF_OP_ADD	7		/* add	r1, r2, rd */
#define	DIF_OP_MUL	8		/* mul	r1, r2, rd */
#define	DIF_OP_SDIV	9		/* sdiv	r1, r2, rd */
#define	DIF_OP_UDIV	10		/* udiv r1, r2, rd */
#define	DIF_OP_SREM	11		/* srem r1, r2, rd */
#define	DIF_OP_UREM	12		/* urem r1, r2, rd */
#define	DIF_OP_NOT	13		/* not	r1, rd */
#define	DIF_OP_MOV	14		/* mov	r1, rd */

/* Compare and test. */
#define	DIF_OP_CMP	15		/* cmp	r1, r2 */
#define	DIF_OP_TST	16		/* tst  r1 */

/* Branches. */
#define	DIF_OP_BA	17		/* ba	label */
#define	DIF_OP_BE	18		/* be	label */
#define	DIF_OP_BNE	19		/* bne	label */
#define	DIF_OP_BG	20		/* bg	label */
#define	DIF_OP_BGU	21		/* bgu	label */
#define	DIF_OP_BGE	22		/* bge	label */
#define	DIF_OP_BGEU	23		/* bgeu	label */
#define	DIF_OP_BL	24		/* bl	label */
#define	DIF_OP_BLU	25		/* blu	label */
#define	DIF_OP_BLE	26		/* ble	label */
#define	DIF_OP_BLEU	27		/* bleu	label */

/* ld* load family. */
#define	DIF_OP_LDSB	28		/* ldsb	[r1], rd */
#define	DIF_OP_LDSH	29		/* ldsh	[r1], rd */
#define	DIF_OP_LDSW	30		/* ldsw [r1], rd */
#define	DIF_OP_LDUB	31		/* ldub	[r1], rd */
#define	DIF_OP_LDUH	32		/* lduh	[r1], rd */
#define	DIF_OP_LDUW	33		/* lduw	[r1], rd */
#define	DIF_OP_LDX	34		/* ldx	[r1], rd */

/* Return, no-op, table constants and string compare. */
#define	DIF_OP_RET	35		/* ret	rd */
#define	DIF_OP_NOP	36		/* nop */
#define	DIF_OP_SETX	37		/* setx	intindex, rd */
#define	DIF_OP_SETS	38		/* sets strindex, rd */
#define	DIF_OP_SCMP	39		/* scmp	r1, r2 */

/* Variable access: ldg* and stg* forms, then ldt* and stt* forms. */
#define	DIF_OP_LDGA	40		/* ldga	var, ri, rd */
#define	DIF_OP_LDGS	41		/* ldgs var, rd */
#define	DIF_OP_STGS	42		/* stgs var, rs */
#define	DIF_OP_LDTA	43		/* ldta var, ri, rd */
#define	DIF_OP_LDTS	44		/* ldts var, rd */
#define	DIF_OP_STTS	45		/* stts var, rs */

/* Late additions to the arithmetic and control groups. */
#define	DIF_OP_SRA	46		/* sra	r1, r2, rd */
#define	DIF_OP_CALL	47		/* call	subr, rd */

/* Tuple stack. */
#define	DIF_OP_PUSHTR	48		/* pushtr type, rs, rr */
#define	DIF_OP_PUSHTV	49		/* pushtv type, rs, rv */
#define	DIF_OP_POPTS	50		/* popts */
#define	DIF_OP_FLUSHTS	51		/* flushts */

/* Variable access: *aa forms, then ldls/stls. */
#define	DIF_OP_LDGAA	52		/* ldgaa var, rd */
#define	DIF_OP_LDTAA	53		/* ldtaa var, rd */
#define	DIF_OP_STGAA	54		/* stgaa var, rs */
#define	DIF_OP_STTAA	55		/* sttaa var, rs */
#define	DIF_OP_LDLS	56		/* ldls	var, rd */
#define	DIF_OP_STLS	57		/* stls	var, rs */

/* allocs/copys and the st* store family. */
#define	DIF_OP_ALLOCS	58		/* allocs r1, rd */
#define	DIF_OP_COPYS	59		/* copys  r1, r2, rd */
#define	DIF_OP_STB	60		/* stb	r1, [rd] */
#define	DIF_OP_STH	61		/* sth	r1, [rd] */
#define	DIF_OP_STW	62		/* stw	r1, [rd] */
#define	DIF_OP_STX	63		/* stx	r1, [rd] */

/* uld* load family. */
#define	DIF_OP_ULDSB	64		/* uldsb [r1], rd */
#define	DIF_OP_ULDSH	65		/* uldsh [r1], rd */
#define	DIF_OP_ULDSW	66		/* uldsw [r1], rd */
#define	DIF_OP_ULDUB	67		/* uldub [r1], rd */
#define	DIF_OP_ULDUH	68		/* ulduh [r1], rd */
#define	DIF_OP_ULDUW	69		/* ulduw [r1], rd */
#define	DIF_OP_ULDX	70		/* uldx  [r1], rd */

/* rld* load family. */
#define	DIF_OP_RLDSB	71		/* rldsb [r1], rd */
#define	DIF_OP_RLDSH	72		/* rldsh [r1], rd */
#define	DIF_OP_RLDSW	73		/* rldsw [r1], rd */
#define	DIF_OP_RLDUB	74		/* rldub [r1], rd */
#define	DIF_OP_RLDUH	75		/* rlduh [r1], rd */
#define	DIF_OP_RLDUW	76		/* rlduw [r1], rd */
#define	DIF_OP_RLDX	77		/* rldx  [r1], rd */

/* Translator references. */
#define	DIF_OP_XLATE	78		/* xlate xlrindex, rd */
#define	DIF_OP_XLARG	79		/* xlarg xlrindex, rd */
208 
/* Largest values that fit in the corresponding instruction fields. */
#define	DIF_REGISTER_MAX	0xff	/* highest register number */
#define	DIF_INTOFF_MAX		0xffff	/* highest integer table offset */
#define	DIF_STROFF_MAX		0xffff	/* highest string table offset */
#define	DIF_VARIABLE_MAX	0xffff	/* highest variable identifier */
#define	DIF_SUBROUTINE_MAX	0xffff	/* highest subroutine code */

/*
 * Variable identifier ranges.  Array variables occupy 0x0000-0x00ff and
 * scalars/associative arrays occupy 0x0100-0xffff; within each range the
 * identifiers from *_UBASE upward are the user-defined ones.
 */
#define	DIF_VAR_ARRAY_MIN	0x0000	/* lowest numbered array variable */
#define	DIF_VAR_ARRAY_UBASE	0x0080	/* lowest user-defined array */
#define	DIF_VAR_ARRAY_MAX	0x00ff	/* highest numbered array variable */

#define	DIF_VAR_OTHER_MIN	0x0100	/* lowest numbered scalar or assc */
#define	DIF_VAR_OTHER_UBASE	0x0500	/* lowest user-defined scalar or assc */
#define	DIF_VAR_OTHER_MAX	0xffff	/* highest numbered scalar or assc */
222 
/* Built-in array variables. */
#define	DIF_VAR_ARGS		0x0000	/* arguments array */
#define	DIF_VAR_REGS		0x0001	/* registers array */
#define	DIF_VAR_UREGS		0x0002	/* user registers array */

/* Built-in scalar variables: thread, time and probe identity. */
#define	DIF_VAR_CURTHREAD	0x0100	/* thread pointer */
#define	DIF_VAR_TIMESTAMP	0x0101	/* timestamp */
#define	DIF_VAR_VTIMESTAMP	0x0102	/* virtual timestamp */
#define	DIF_VAR_IPL		0x0103	/* interrupt priority level */
#define	DIF_VAR_EPID		0x0104	/* enabled probe ID */
#define	DIF_VAR_ID		0x0105	/* probe ID */

/* Built-in scalar variables: arg0 through arg9. */
#define	DIF_VAR_ARG0		0x0106	/* first argument */
#define	DIF_VAR_ARG1		0x0107	/* second argument */
#define	DIF_VAR_ARG2		0x0108	/* third argument */
#define	DIF_VAR_ARG3		0x0109	/* fourth argument */
#define	DIF_VAR_ARG4		0x010a	/* fifth argument */
#define	DIF_VAR_ARG5		0x010b	/* sixth argument */
#define	DIF_VAR_ARG6		0x010c	/* seventh argument */
#define	DIF_VAR_ARG7		0x010d	/* eighth argument */
#define	DIF_VAR_ARG8		0x010e	/* ninth argument */
#define	DIF_VAR_ARG9		0x010f	/* tenth argument */

/* Built-in scalar variables: stack and probe description. */
#define	DIF_VAR_STACKDEPTH	0x0110	/* stack depth */
#define	DIF_VAR_CALLER		0x0111	/* caller */
#define	DIF_VAR_PROBEPROV	0x0112	/* probe provider */
#define	DIF_VAR_PROBEMOD	0x0113	/* probe module */
#define	DIF_VAR_PROBEFUNC	0x0114	/* probe function */
#define	DIF_VAR_PROBENAME	0x0115	/* probe name */

/* Built-in scalar variables: process and thread state. */
#define	DIF_VAR_PID		0x0116	/* process ID */
#define	DIF_VAR_TID		0x0117	/* (per-process) thread ID */
#define	DIF_VAR_EXECNAME	0x0118	/* name of executable */
#define	DIF_VAR_ZONENAME	0x0119	/* zone name associated with process */
#define	DIF_VAR_WALLTIMESTAMP	0x011a	/* wall-clock timestamp */
#define	DIF_VAR_USTACKDEPTH	0x011b	/* user-land stack depth */
#define	DIF_VAR_UCALLER		0x011c	/* user-level caller */
#define	DIF_VAR_PPID		0x011d	/* parent process ID */
#define	DIF_VAR_UID		0x011e	/* process user ID */
#define	DIF_VAR_GID		0x011f	/* process group ID */
#define	DIF_VAR_ERRNO		0x0120	/* thread errno */
#define	DIF_VAR_EXECARGS	0x0121	/* process arguments */

/* Defined only when not building for illumos. */
#ifndef illumos
#define	DIF_VAR_CPU		0x0200
#endif
264 
/*
 * DIF subroutine codes.  Codes are dense, starting at zero; DIF_SUBR_MAX
 * must always equal the highest code defined here.
 */

/* 0-7: rand and lock state queries. */
#define	DIF_SUBR_RAND			0
#define	DIF_SUBR_MUTEX_OWNED		1
#define	DIF_SUBR_MUTEX_OWNER		2
#define	DIF_SUBR_MUTEX_TYPE_ADAPTIVE	3
#define	DIF_SUBR_MUTEX_TYPE_SPIN	4
#define	DIF_SUBR_RW_READ_HELD		5
#define	DIF_SUBR_RW_WRITE_HELD		6
#define	DIF_SUBR_RW_ISWRITER		7

/* 8-17: copy routines and related helpers. */
#define	DIF_SUBR_COPYIN			8
#define	DIF_SUBR_COPYINSTR		9
#define	DIF_SUBR_SPECULATION		10
#define	DIF_SUBR_PROGENYOF		11
#define	DIF_SUBR_STRLEN			12
#define	DIF_SUBR_COPYOUT		13
#define	DIF_SUBR_COPYOUTSTR		14
#define	DIF_SUBR_ALLOCA			15
#define	DIF_SUBR_BCOPY			16
#define	DIF_SUBR_COPYINTO		17

/* 18-22: message size and device helpers. */
#define	DIF_SUBR_MSGDSIZE		18
#define	DIF_SUBR_MSGSIZE		19
#define	DIF_SUBR_GETMAJOR		20
#define	DIF_SUBR_GETMINOR		21
#define	DIF_SUBR_DDI_PATHNAME		22

/* 23-34: string and path routines. */
#define	DIF_SUBR_STRJOIN		23
#define	DIF_SUBR_LLTOSTR		24
#define	DIF_SUBR_BASENAME		25
#define	DIF_SUBR_DIRNAME		26
#define	DIF_SUBR_CLEANPATH		27
#define	DIF_SUBR_STRCHR			28
#define	DIF_SUBR_STRRCHR		29
#define	DIF_SUBR_STRSTR			30
#define	DIF_SUBR_STRTOK			31
#define	DIF_SUBR_SUBSTR			32
#define	DIF_SUBR_INDEX			33
#define	DIF_SUBR_RINDEX			34

/* 35-43: byte order and address formatting routines. */
#define	DIF_SUBR_HTONS			35
#define	DIF_SUBR_HTONL			36
#define	DIF_SUBR_HTONLL			37
#define	DIF_SUBR_NTOHS			38
#define	DIF_SUBR_NTOHL			39
#define	DIF_SUBR_NTOHLL			40
#define	DIF_SUBR_INET_NTOP		41
#define	DIF_SUBR_INET_NTOA		42
#define	DIF_SUBR_INET_NTOA6		43

/* 44-54: later additions. */
#define	DIF_SUBR_TOUPPER		44
#define	DIF_SUBR_TOLOWER		45
#define	DIF_SUBR_MEMREF			46
#define	DIF_SUBR_TYPEREF		47
#define	DIF_SUBR_SX_SHARED_HELD		48
#define	DIF_SUBR_SX_EXCLUSIVE_HELD	49
#define	DIF_SUBR_SX_ISEXCLUSIVE		50
#define	DIF_SUBR_MEMSTR			51
#define	DIF_SUBR_GETF			52
#define	DIF_SUBR_JSON			53
#define	DIF_SUBR_STRTOLL		54

#define	DIF_SUBR_MAX			54	/* max subroutine value */
321 
/* A DIF instruction is a single 32-bit word. */
typedef uint32_t dif_instr_t;

/*
 * Field extractors.  The opcode is taken from bits 31..24.  The remaining 24
 * bits are read, depending on the instruction, as three 8-bit fields
 * (r1, r2, rd/rs), as a 16-bit operand in bits 23..8 followed by an 8-bit
 * register, or as a single 24-bit branch label.
 */
#define	DIF_INSTR_OP(i)			(0xff & ((i) >> 24))
#define	DIF_INSTR_R1(i)			(0xff & ((i) >> 16))
#define	DIF_INSTR_R2(i)			(0xff & ((i) >>  8))
#define	DIF_INSTR_RD(i)			(0xff & (i))
#define	DIF_INSTR_RS(i)			(0xff & (i))
#define	DIF_INSTR_TYPE(i)		(0xff & ((i) >> 16))
#define	DIF_INSTR_LABEL(i)		(0xffffff & (i))
#define	DIF_INSTR_VAR(i)		(0xffff & ((i) >>  8))
#define	DIF_INSTR_INTEGER(i)		(0xffff & ((i) >>  8))
#define	DIF_INSTR_STRING(i)		(0xffff & ((i) >>  8))
#define	DIF_INSTR_SUBR(i)		(0xffff & ((i) >>  8))
#define	DIF_INSTR_XLREF(i)		(0xffff & ((i) >>  8))

/*
 * Basic encoders.  DIF_INSTR_FMT packs an opcode and three 8-bit fields;
 * DIF_INSTR_LDV packs an opcode, a wider operand placed at bit 8, and an
 * 8-bit register; DIF_INSTR_BRANCH packs an opcode and a label.  None of them
 * masks its arguments, so callers must pass values that fit their fields.
 */
#define	DIF_INSTR_FMT(op, r1, r2, d) \
	(((op) << 24) | ((r1) << 16) | ((r2) << 8) | (d))
#define	DIF_INSTR_LDV(op, v, d)		(((op) << 24) | ((v) << 8) | (d))
#define	DIF_INSTR_BRANCH(op, label)	(((op) << 24) | (label))

/* Encoders built on the three-field format. */
#define	DIF_INSTR_NOT(r1, d)		DIF_INSTR_FMT(DIF_OP_NOT, r1, 0, d)
#define	DIF_INSTR_MOV(r1, d)		DIF_INSTR_FMT(DIF_OP_MOV, r1, 0, d)
#define	DIF_INSTR_CMP(op, r1, r2)	DIF_INSTR_FMT(op, r1, r2, 0)
#define	DIF_INSTR_TST(r1)		DIF_INSTR_FMT(DIF_OP_TST, r1, 0, 0)
#define	DIF_INSTR_LOAD(op, r1, d)	DIF_INSTR_FMT(op, r1, 0, d)
#define	DIF_INSTR_STORE(op, r1, d)	DIF_INSTR_FMT(op, r1, 0, d)
#define	DIF_INSTR_RET(d)		DIF_INSTR_FMT(DIF_OP_RET, 0, 0, d)
#define	DIF_INSTR_LDA(op, v, r, d)	DIF_INSTR_FMT(op, v, r, d)
#define	DIF_INSTR_PUSHTS(op, t, r2, rs)	DIF_INSTR_FMT(op, t, r2, rs)
#define	DIF_INSTR_ALLOCS(r1, d)		DIF_INSTR_FMT(DIF_OP_ALLOCS, r1, 0, d)
#define	DIF_INSTR_COPYS(r1, r2, d)	DIF_INSTR_FMT(DIF_OP_COPYS, r1, r2, d)

/* Encoders built on the operand-plus-register format. */
#define	DIF_INSTR_STV(op, v, rs)	DIF_INSTR_LDV(op, v, rs)
#define	DIF_INSTR_XLATE(op, r, d)	DIF_INSTR_LDV(op, r, d)
#define	DIF_INSTR_SETX(i, d)		DIF_INSTR_LDV(DIF_OP_SETX, i, d)
#define	DIF_INSTR_SETS(s, d)		DIF_INSTR_LDV(DIF_OP_SETS, s, d)
#define	DIF_INSTR_CALL(s, d)		DIF_INSTR_LDV(DIF_OP_CALL, s, d)

/* Instructions that carry nothing but an opcode. */
#define	DIF_INSTR_NOP			(DIF_OP_NOP << 24)
#define	DIF_INSTR_POPTS			(DIF_OP_POPTS << 24)
#define	DIF_INSTR_FLUSHTS		(DIF_OP_FLUSHTS << 24)

#define	DIF_REG_R0	0		/* %r0 is always set to zero */
363 
364 /*
365  * A DTrace Intermediate Format Type (DIF Type) is used to represent the types
366  * of variables, function and associative array arguments, and the return type
367  * for each DIF object (shown below).  It contains a description of the type,
368  * its size in bytes, and a module identifier.
369  */
/*
 * DIF type descriptor: three one-byte fields and a pad byte, followed by a
 * 32-bit size.
 */
struct dtrace_diftype {
	uint8_t dtdt_kind;		/* one of the DIF_TYPE_* kinds */
	uint8_t dtdt_ckind;		/* kind of the type in CTF */
	uint8_t dtdt_flags;		/* DIF_TF_* flag bits */
	uint8_t dtdt_pad;		/* reserved for future use */
	uint32_t dtdt_size;		/* size in bytes (unless string) */
};

typedef struct dtrace_diftype dtrace_diftype_t;
377 
/* Values for the type kind field. */
#define	DIF_TYPE_CTF		0	/* a CTF type */
#define	DIF_TYPE_STRING		1	/* a D string */

/* Bits for the type flags field. */
#define	DIF_TF_BYREF		0x1	/* passed by reference */
#define	DIF_TF_BYUREF		0x2	/* user type passed by reference */
383 
384 /*
385  * A DTrace Intermediate Format variable record is used to describe each of the
386  * variables referenced by a given DIF object.  It contains an integer variable
387  * identifier along with variable scope and properties, as shown below.  The
388  * size of this structure must be sizeof (int) aligned.
389  */
390 typedef struct dtrace_difv {
391 	uint32_t dtdv_name;		/* variable name index in dtdo_strtab */
392 	uint32_t dtdv_id;		/* variable reference identifier */
393 	uint8_t dtdv_kind;		/* variable kind (see below) */
394 	uint8_t dtdv_scope;		/* variable scope (see below) */
395 	uint16_t dtdv_flags;		/* variable flags (see below) */
396 	dtrace_diftype_t dtdv_type;	/* variable type (see above) */
397 } dtrace_difv_t;
398 
/* Variable kinds. */
#define	DIFV_KIND_ARRAY		0	/* an array of quantities */
#define	DIFV_KIND_SCALAR	1	/* a scalar quantity */

/* Variable scopes. */
#define	DIFV_SCOPE_GLOBAL	0	/* global scope */
#define	DIFV_SCOPE_THREAD	1	/* thread scope */
#define	DIFV_SCOPE_LOCAL	2	/* local scope */

/* Variable flag bits. */
#define	DIFV_F_REF		0x1	/* DIFO references the variable */
#define	DIFV_F_MOD		0x2	/* DIFO writes the variable */
408 
409 /*
410  * DTrace Actions
411  *
412  * The upper byte determines the class of the action; the low byte determines
413  * the specific action within that class.  The classes of actions are as
414  * follows:
415  *
416  *   [ no class ]                  <= May record process- or kernel-related data
417  *   DTRACEACT_PROC                <= Only records process-related data
418  *   DTRACEACT_PROC_DESTRUCTIVE    <= Potentially destructive to processes
419  *   DTRACEACT_KERNEL              <= Only records kernel-related data
420  *   DTRACEACT_KERNEL_DESTRUCTIVE  <= Potentially destructive to the kernel
421  *   DTRACEACT_SPECULATIVE         <= Speculation-related action
422  *   DTRACEACT_AGGREGATION         <= Aggregating action
423  */
/* Actions with no class: may record process- or kernel-related data. */
#define	DTRACEACT_NONE			0	/* no action */
#define	DTRACEACT_DIFEXPR		1	/* action is DIF expression */
#define	DTRACEACT_EXIT			2	/* exit() action */
#define	DTRACEACT_PRINTF		3	/* printf() action */
#define	DTRACEACT_PRINTA		4	/* printa() action */
#define	DTRACEACT_LIBACT		5	/* library-controlled action */
#define	DTRACEACT_TRACEMEM		6	/* tracemem() action */
#define	DTRACEACT_TRACEMEM_DYNSIZE	7	/* dynamic tracemem() size */
#define	DTRACEACT_PRINTM		8	/* printm() action (BSD) */
#define	DTRACEACT_PRINTT		9	/* printt() action (BSD) */

/* Class 0x01: only records process-related data. */
#define	DTRACEACT_PROC			0x0100
#define	DTRACEACT_USTACK		(DTRACEACT_PROC + 1)
#define	DTRACEACT_JSTACK		(DTRACEACT_PROC + 2)
#define	DTRACEACT_USYM			(DTRACEACT_PROC + 3)
#define	DTRACEACT_UMOD			(DTRACEACT_PROC + 4)
#define	DTRACEACT_UADDR			(DTRACEACT_PROC + 5)

/* Class 0x02: potentially destructive to processes. */
#define	DTRACEACT_PROC_DESTRUCTIVE	0x0200
#define	DTRACEACT_STOP			(DTRACEACT_PROC_DESTRUCTIVE + 1)
#define	DTRACEACT_RAISE			(DTRACEACT_PROC_DESTRUCTIVE + 2)
#define	DTRACEACT_SYSTEM		(DTRACEACT_PROC_DESTRUCTIVE + 3)
#define	DTRACEACT_FREOPEN		(DTRACEACT_PROC_DESTRUCTIVE + 4)

/* Class 0x03: no individual actions are defined for it here. */
#define	DTRACEACT_PROC_CONTROL		0x0300

/* Class 0x04: only records kernel-related data. */
#define	DTRACEACT_KERNEL		0x0400
#define	DTRACEACT_STACK			(DTRACEACT_KERNEL + 1)
#define	DTRACEACT_SYM			(DTRACEACT_KERNEL + 2)
#define	DTRACEACT_MOD			(DTRACEACT_KERNEL + 3)

/* Class 0x05: potentially destructive to the kernel. */
#define	DTRACEACT_KERNEL_DESTRUCTIVE	0x0500
#define	DTRACEACT_BREAKPOINT		(DTRACEACT_KERNEL_DESTRUCTIVE + 1)
#define	DTRACEACT_PANIC			(DTRACEACT_KERNEL_DESTRUCTIVE + 2)
#define	DTRACEACT_CHILL			(DTRACEACT_KERNEL_DESTRUCTIVE + 3)

/* Class 0x06: speculation-related actions. */
#define	DTRACEACT_SPECULATIVE		0x0600
#define	DTRACEACT_SPECULATE		(DTRACEACT_SPECULATIVE + 1)
#define	DTRACEACT_COMMIT		(DTRACEACT_SPECULATIVE + 2)
#define	DTRACEACT_DISCARD		(DTRACEACT_SPECULATIVE + 3)

/* Extract the class (upper byte) of an action kind. */
#define	DTRACEACT_CLASS(x)		(0xff00 & (x))

/* True when the action belongs to either of the destructive classes. */
#define	DTRACEACT_ISDESTRUCTIVE(x)	\
	(DTRACEACT_CLASS(x) == DTRACEACT_KERNEL_DESTRUCTIVE || \
	DTRACEACT_CLASS(x) == DTRACEACT_PROC_DESTRUCTIVE)

/* True when the action belongs to the speculative class. */
#define	DTRACEACT_ISSPECULATIVE(x)	\
	(DTRACEACT_SPECULATIVE == DTRACEACT_CLASS(x))

/* True for printf(), printa(), system() and freopen(). */
#define	DTRACEACT_ISPRINTFLIKE(x)	\
	((x) == DTRACEACT_FREOPEN || (x) == DTRACEACT_SYSTEM || \
	(x) == DTRACEACT_PRINTA || (x) == DTRACEACT_PRINTF)
477 
478 /*
479  * DTrace Aggregating Actions
480  *
481  * These are functions f(x) for which the following is true:
482  *
483  *    f(f(x_0) U f(x_1) U ... U f(x_n)) = f(x_0 U x_1 U ... U x_n)
484  *
485  * where x_n is a set of arbitrary data.  Aggregating actions are in their own
486  * DTrace action class, DTRACEACT_AGGREGATION.  The macros provided here allow
487  * for easier processing of the aggregation argument and data payload for a few
488  * aggregating actions (notably:  quantize(), lquantize(), and ustack()).
489  */
/* Class 0x07: aggregating actions, numbered from 1 within the class. */
#define	DTRACEACT_AGGREGATION		0x0700

#define	DTRACEAGG_COUNT			(DTRACEACT_AGGREGATION + 1)
#define	DTRACEAGG_MIN			(DTRACEACT_AGGREGATION + 2)
#define	DTRACEAGG_MAX			(DTRACEACT_AGGREGATION + 3)
#define	DTRACEAGG_AVG			(DTRACEACT_AGGREGATION + 4)
#define	DTRACEAGG_SUM			(DTRACEACT_AGGREGATION + 5)
#define	DTRACEAGG_STDDEV		(DTRACEACT_AGGREGATION + 6)
#define	DTRACEAGG_QUANTIZE		(DTRACEACT_AGGREGATION + 7)
#define	DTRACEAGG_LQUANTIZE		(DTRACEACT_AGGREGATION + 8)
#define	DTRACEAGG_LLQUANTIZE		(DTRACEACT_AGGREGATION + 9)

/* True when the action kind belongs to the aggregation class. */
#define	DTRACEACT_ISAGG(x)		\
	(DTRACEACT_AGGREGATION == DTRACEACT_CLASS(x))
503 
/*
 * quantize() bucket layout.
 *
 * With B = sizeof (uint64_t) * NBBY, there are B - 1 buckets on each side of
 * the zero bucket, for 2 * (B - 1) + 1 buckets in total.  The zero bucket
 * sits at index B - 1.
 */
#define	DTRACE_QUANTIZE_NBUCKETS	\
	(((sizeof (uint64_t) * NBBY) - 1) * 2 + 1)

#define	DTRACE_QUANTIZE_ZEROBUCKET	((sizeof (uint64_t) * NBBY) - 1)

/*
 * Value associated with bucket index `buck`:
 *   - below the zero bucket: -(2 ^ (ZEROBUCKET - 1 - buck))
 *   - at the zero bucket:    0
 *   - above the zero bucket: 2 ^ (buck - ZEROBUCKET - 1)
 *
 * `buck` is evaluated more than once, so it must not have side effects.  The
 * whole expansion is parenthesized so the leading cast cannot be split from
 * its operand by an adjacent operator such as sizeof.
 */
#define	DTRACE_QUANTIZE_BUCKETVAL(buck)					\
	((int64_t)((buck) < DTRACE_QUANTIZE_ZEROBUCKET ?		\
	-(1LL << (DTRACE_QUANTIZE_ZEROBUCKET - 1 - (buck))) :		\
	(buck) == DTRACE_QUANTIZE_ZEROBUCKET ? 0 :			\
	1LL << ((buck) - DTRACE_QUANTIZE_ZEROBUCKET - 1)))
514 
/*
 * lquantize() argument layout within a 64-bit word:
 *
 *   bits 63..48  step
 *   bits 47..32  levels
 *   bits 31..0   base
 */
#define	DTRACE_LQUANTIZE_STEPSHIFT		48
#define	DTRACE_LQUANTIZE_STEPMASK		((uint64_t)UINT16_MAX << 48)
#define	DTRACE_LQUANTIZE_LEVELSHIFT		32
#define	DTRACE_LQUANTIZE_LEVELMASK		((uint64_t)UINT16_MAX << 32)
#define	DTRACE_LQUANTIZE_BASESHIFT		0
#define	DTRACE_LQUANTIZE_BASEMASK		UINT32_MAX

/*
 * Field accessors.  Step and levels are returned as uint16_t; base is
 * returned as int32_t, so a base with bit 31 set reads back negative.  Each
 * expansion is fully parenthesized so the leading cast cannot be split from
 * its operand by an adjacent operator such as sizeof.
 */
#define	DTRACE_LQUANTIZE_STEP(x)		\
	((uint16_t)(((x) & DTRACE_LQUANTIZE_STEPMASK) >> \
	DTRACE_LQUANTIZE_STEPSHIFT))

#define	DTRACE_LQUANTIZE_LEVELS(x)		\
	((uint16_t)(((x) & DTRACE_LQUANTIZE_LEVELMASK) >> \
	DTRACE_LQUANTIZE_LEVELSHIFT))

#define	DTRACE_LQUANTIZE_BASE(x)		\
	((int32_t)(((x) & DTRACE_LQUANTIZE_BASEMASK) >> \
	DTRACE_LQUANTIZE_BASESHIFT))
533 
/*
 * llquantize() argument layout within a 64-bit word:
 *
 *   bits 63..48  factor
 *   bits 47..32  low
 *   bits 31..16  high
 *   bits 15..0   nstep
 */
#define	DTRACE_LLQUANTIZE_FACTORSHIFT		48
#define	DTRACE_LLQUANTIZE_FACTORMASK		((uint64_t)UINT16_MAX << 48)
#define	DTRACE_LLQUANTIZE_LOWSHIFT		32
#define	DTRACE_LLQUANTIZE_LOWMASK		((uint64_t)UINT16_MAX << 32)
#define	DTRACE_LLQUANTIZE_HIGHSHIFT		16
#define	DTRACE_LLQUANTIZE_HIGHMASK		((uint64_t)UINT16_MAX << 16)
#define	DTRACE_LLQUANTIZE_NSTEPSHIFT		0
#define	DTRACE_LLQUANTIZE_NSTEPMASK		UINT16_MAX

/*
 * Field accessors, each returning a uint16_t.  Each expansion is fully
 * parenthesized so the leading cast cannot be split from its operand by an
 * adjacent operator such as sizeof.
 */
#define	DTRACE_LLQUANTIZE_FACTOR(x)		\
	((uint16_t)(((x) & DTRACE_LLQUANTIZE_FACTORMASK) >> \
	DTRACE_LLQUANTIZE_FACTORSHIFT))

#define	DTRACE_LLQUANTIZE_LOW(x)		\
	((uint16_t)(((x) & DTRACE_LLQUANTIZE_LOWMASK) >> \
	DTRACE_LLQUANTIZE_LOWSHIFT))

#define	DTRACE_LLQUANTIZE_HIGH(x)		\
	((uint16_t)(((x) & DTRACE_LLQUANTIZE_HIGHMASK) >> \
	DTRACE_LLQUANTIZE_HIGHSHIFT))

#define	DTRACE_LLQUANTIZE_NSTEP(x)		\
	((uint16_t)(((x) & DTRACE_LLQUANTIZE_NSTEPMASK) >> \
	DTRACE_LLQUANTIZE_NSTEPSHIFT))
558 
/*
 * ustack() argument packing: the frame count occupies the low 32 bits and the
 * string size the high 32 bits of a 64-bit word.  DTRACE_USTACK_STRSIZE
 * shifts its argument right by 32, so that argument must be a 64-bit value.
 * The accessor expansions are fully parenthesized so the leading cast cannot
 * be split from its operand by an adjacent operator such as sizeof.
 */
#define	DTRACE_USTACK_NFRAMES(x)	((uint32_t)((x) & UINT32_MAX))
#define	DTRACE_USTACK_STRSIZE(x)	((uint32_t)((x) >> 32))
#define	DTRACE_USTACK_ARG(x, y)		\
	((((uint64_t)(y)) << 32) | ((x) & UINT32_MAX))
563 
/*
 * DTRACE_PTR(type, name) declares a member `type *name`.  When _LP64 is not
 * defined it also declares a uint32_t member called <name>pad, placed before
 * the pointer if BYTE_ORDER equals _BIG_ENDIAN and after it otherwise
 * (presumably so the slot is 64 bits wide in either data model).
 */
#ifdef _LP64
#define	DTRACE_PTR(type, name)	type *name
#elif BYTE_ORDER == _BIG_ENDIAN
#define	DTRACE_PTR(type, name)	uint32_t name##pad; type *name
#else
#define	DTRACE_PTR(type, name)	type *name; uint32_t name##pad
#endif
573 
574 /*
575  * DTrace Object Format (DOF)
576  *
577  * DTrace programs can be persistently encoded in the DOF format so that they
578  * may be embedded in other programs (for example, in an ELF file) or in the
579  * dtrace driver configuration file for use in anonymous tracing.  The DOF
580  * format is versioned and extensible so that it can be revised and so that
581  * internal data structures can be modified or extended compatibly.  All DOF
582  * structures use fixed-size types, so the 32-bit and 64-bit representations
583  * are identical and consumers can use either data model transparently.
584  *
585  * The file layout is structured as follows:
586  *
587  * +---------------+-------------------+----- ... ----+---- ... ------+
588  * |   dof_hdr_t   |  dof_sec_t[ ... ] |   loadable   | non-loadable  |
589  * | (file header) | (section headers) | section data | section data  |
590  * +---------------+-------------------+----- ... ----+---- ... ------+
591  * |<------------ dof_hdr.dofh_loadsz --------------->|               |
592  * |<------------ dof_hdr.dofh_filesz ------------------------------->|
593  *
594  * The file header stores meta-data including a magic number, data model for
595  * the instrumentation, data encoding, and properties of the DIF code within.
596  * The header describes its own size and the size of the section headers.  By
597  * convention, an array of section headers follows the file header, and then
598  * the data for all loadable sections and unloadable sections.  This permits
599  * consumer code to easily download the headers and all loadable data into the
600  * DTrace driver in one contiguous chunk, omitting other extraneous sections.
601  *
602  * The section headers describe the size, offset, alignment, and section type
603  * for each section.  Sections are described using a set of #defines that tell
604  * the consumer what kind of data is expected.  Sections can contain links to
605  * other sections by storing a dof_secidx_t, an index into the section header
606  * array, inside of the section data structures.  The section header includes
607  * an entry size so that sections with data arrays can grow their structures.
608  *
609  * The DOF data itself can contain many snippets of DIF (i.e. >1 DIFOs), which
610  * are represented themselves as a collection of related DOF sections.  This
611  * permits us to change the set of sections associated with a DIFO over time,
612  * and also permits us to encode DIFOs that contain different sets of sections.
613  * When a DOF section wants to refer to a DIFO, it stores the dof_secidx_t of a
614  * section of type DOF_SECT_DIFOHDR.  This section's data is then an array of
615  * dof_secidx_t's which in turn denote the sections associated with this DIFO.
616  *
617  * This loose coupling of the file structure (header and sections) to the
618  * structure of the DTrace program itself (ECB descriptions, action
619  * descriptions, and DIFOs) permits activities such as relocation processing
620  * to occur in a single pass without having to understand D program structure.
621  *
622  * Finally, strings are always stored in ELF-style string tables along with a
623  * string table section index and string table offset.  Therefore strings in
624  * DOF are always arbitrary-length and not bound to the current implementation.
625  */
626 
#define	DOF_ID_SIZE	16	/* number of bytes in dofh_ident[] */

/*
 * DOF file header: the identification bytes, four 32-bit fields, then four
 * 64-bit fields.
 */
struct dof_hdr {
	uint8_t dofh_ident[DOF_ID_SIZE]; /* identification bytes (DOF_ID_*) */
	uint32_t dofh_flags;		/* file attribute flags (if any) */
	uint32_t dofh_hdrsize;		/* size of this header in bytes */
	uint32_t dofh_secsize;		/* size of one section header in bytes */
	uint32_t dofh_secnum;		/* how many section headers there are */
	uint64_t dofh_secoff;		/* file offset of the section headers */
	uint64_t dofh_loadsz;		/* file size of the loadable portion */
	uint64_t dofh_filesz;		/* file size of the entire DOF file */
	uint64_t dofh_pad;		/* reserved for future use */
};

typedef struct dof_hdr dof_hdr_t;
640 
/* Byte indices into dofh_ident[]. */
#define	DOF_ID_MAG0	0	/* magic number, first byte */
#define	DOF_ID_MAG1	1	/* magic number, second byte */
#define	DOF_ID_MAG2	2	/* magic number, third byte */
#define	DOF_ID_MAG3	3	/* magic number, fourth byte */
#define	DOF_ID_MODEL	4	/* DOF data model (DOF_MODEL_*) */
#define	DOF_ID_ENCODING	5	/* DOF data encoding (DOF_ENCODE_*) */
#define	DOF_ID_VERSION	6	/* DOF file format major version */
#define	DOF_ID_DIFVERS	7	/* DIF instruction set version */
#define	DOF_ID_DIFIREG	8	/* DIF integer registers used by compiler */
#define	DOF_ID_DIFTREG	9	/* DIF tuple registers used by compiler */
#define	DOF_ID_PAD	10	/* first padding byte (padding is all zeroes) */

/* The four magic bytes stored at DOF_ID_MAG0 through DOF_ID_MAG3. */
#define	DOF_MAG_MAG0	0x7F
#define	DOF_MAG_MAG1	'D'
#define	DOF_MAG_MAG2	'O'
#define	DOF_MAG_MAG3	'F'

/* The same magic as a string literal, and its length without the NUL. */
#define	DOF_MAG_STRING	"\177DOF"
#define	DOF_MAG_STRLEN	4
660 
/* Values stored at dofh_ident[DOF_ID_MODEL]. */
#define	DOF_MODEL_NONE	0
#define	DOF_MODEL_ILP32	1
#define	DOF_MODEL_LP64	2

/* Data model of the current build: LP64 exactly when _LP64 is defined. */
#ifndef _LP64
#define	DOF_MODEL_NATIVE	DOF_MODEL_ILP32
#else
#define	DOF_MODEL_NATIVE	DOF_MODEL_LP64
#endif

/* Values stored at dofh_ident[DOF_ID_ENCODING]. */
#define	DOF_ENCODE_NONE	0
#define	DOF_ENCODE_LSB	1
#define	DOF_ENCODE_MSB	2

/* Encoding of the current build: MSB exactly when BYTE_ORDER is _BIG_ENDIAN. */
#if BYTE_ORDER != _BIG_ENDIAN
#define	DOF_ENCODE_NATIVE	DOF_ENCODE_LSB
#else
#define	DOF_ENCODE_NATIVE	DOF_ENCODE_MSB
#endif

/* DOF format versions; DOF_VERSION always names the latest one. */
#define	DOF_VERSION_1	1	/* Solaris 10 FCS */
#define	DOF_VERSION_2	2	/* Solaris Express 6/06 */
#define	DOF_VERSION	DOF_VERSION_2

#define	DOF_FL_VALID	0	/* mask of all valid dofh_flags bits */
686 
/* 32-bit index types used to link DOF structures to one another. */
typedef uint32_t dof_secidx_t;	/* index into the section header table */
typedef uint32_t dof_stridx_t;	/* index into a string table */

/* All-ones null values for the two index types. */
#define	DOF_SECIDX_NONE	(-1U)	/* no section */
#define	DOF_STRIDX_NONE	(-1U)	/* no string */
692 
/* DOF section header: four 32-bit fields followed by two 64-bit fields. */
struct dof_sec {
	uint32_t dofs_type;	/* section type (DOF_SECT_*) */
	uint32_t dofs_align;	/* memory alignment of the section data */
	uint32_t dofs_flags;	/* section flags (if any) */
	uint32_t dofs_entsize;	/* size of one entry (if a table) */
	uint64_t dofs_offset;	/* where the section data starts in the file */
	uint64_t dofs_size;	/* length of the section data in bytes */
};

typedef struct dof_sec dof_sec_t;
701 
/* Section types (values of dofs_type). */
#define	DOF_SECT_NONE		0	/* null section */
#define	DOF_SECT_COMMENTS	1	/* compiler comments */
#define	DOF_SECT_SOURCE		2	/* D program source code */
#define	DOF_SECT_ECBDESC	3	/* dof_ecbdesc_t */
#define	DOF_SECT_PROBEDESC	4	/* dof_probedesc_t */
#define	DOF_SECT_ACTDESC	5	/* dof_actdesc_t array */
#define	DOF_SECT_DIFOHDR	6	/* dof_difohdr_t (variable length) */
#define	DOF_SECT_DIF		7	/* uint32_t array of byte code */
#define	DOF_SECT_STRTAB		8	/* string table */
#define	DOF_SECT_VARTAB		9	/* dtrace_difv_t array */
#define	DOF_SECT_RELTAB		10	/* dof_relodesc_t array */
#define	DOF_SECT_TYPTAB		11	/* dtrace_diftype_t array */
#define	DOF_SECT_URELHDR	12	/* dof_relohdr_t (user relocations) */
#define	DOF_SECT_KRELHDR	13	/* dof_relohdr_t (kernel relocations) */
#define	DOF_SECT_OPTDESC	14	/* dof_optdesc_t array */
#define	DOF_SECT_PROVIDER	15	/* dof_provider_t */
#define	DOF_SECT_PROBES		16	/* dof_probe_t array */
#define	DOF_SECT_PRARGS		17	/* uint8_t array (probe arg mappings) */
#define	DOF_SECT_PROFFS		18	/* uint32_t array (probe arg offsets) */
#define	DOF_SECT_INTTAB		19	/* uint64_t array */
#define	DOF_SECT_UTSNAME	20	/* struct utsname */
#define	DOF_SECT_XLTAB		21	/* dof_xlref_t array */
#define	DOF_SECT_XLMEMBERS	22	/* dof_xlmember_t array */
#define	DOF_SECT_XLIMPORT	23	/* dof_xlator_t */
#define	DOF_SECT_XLEXPORT	24	/* dof_xlator_t */
#define	DOF_SECT_PREXPORT	25	/* dof_secidx_t array (exported objs) */
#define	DOF_SECT_PRENOFFS	26	/* uint32_t array (enabled offsets) */

/* Section flags (bits of dofs_flags). */
#define	DOF_SECF_LOAD		1	/* section should be loaded */

/*
 * Evaluates to non-zero when section type `x` is one of the loadable types.
 * Every type defined above is loadable except DOF_SECT_NONE,
 * DOF_SECT_COMMENTS, DOF_SECT_SOURCE and DOF_SECT_UTSNAME; any other value
 * is not loadable.  `x` is evaluated multiple times, so it must not have side
 * effects.  Each type is listed exactly once.
 */
#define	DOF_SEC_ISLOADABLE(x)						\
	(((x) == DOF_SECT_ECBDESC) || ((x) == DOF_SECT_PROBEDESC) ||	\
	((x) == DOF_SECT_ACTDESC) || ((x) == DOF_SECT_DIFOHDR) ||	\
	((x) == DOF_SECT_DIF) || ((x) == DOF_SECT_STRTAB) ||		\
	((x) == DOF_SECT_VARTAB) || ((x) == DOF_SECT_RELTAB) ||		\
	((x) == DOF_SECT_TYPTAB) || ((x) == DOF_SECT_URELHDR) ||	\
	((x) == DOF_SECT_KRELHDR) || ((x) == DOF_SECT_OPTDESC) ||	\
	((x) == DOF_SECT_PROVIDER) || ((x) == DOF_SECT_PROBES) ||	\
	((x) == DOF_SECT_PRARGS) || ((x) == DOF_SECT_PROFFS) ||		\
	((x) == DOF_SECT_INTTAB) || ((x) == DOF_SECT_XLTAB) ||		\
	((x) == DOF_SECT_XLMEMBERS) || ((x) == DOF_SECT_XLIMPORT) ||	\
	((x) == DOF_SECT_XLEXPORT) || ((x) == DOF_SECT_PREXPORT) ||	\
	((x) == DOF_SECT_PRENOFFS))
745 
/*
 * Contents of a DOF_SECT_ECBDESC section: ties together, by section index,
 * the probe description, predicate and actions of one ECB, plus a
 * user-supplied library argument.
 */
typedef struct dof_ecbdesc {
	dof_secidx_t dofe_probes;	/* link to DOF_SECT_PROBEDESC */
	dof_secidx_t dofe_pred;		/* link to DOF_SECT_DIFOHDR */
	dof_secidx_t dofe_actions;	/* link to DOF_SECT_ACTDESC */
	uint32_t dofe_pad;		/* reserved for future use */
	uint64_t dofe_uarg;		/* user-supplied library argument */
} dof_ecbdesc_t;
753 
/*
 * Contents of a DOF_SECT_PROBEDESC section: a probe description whose four
 * name components are string indices into the string table section named
 * by dofp_strtab.
 */
typedef struct dof_probedesc {
	dof_secidx_t dofp_strtab;	/* link to DOF_SECT_STRTAB section */
	dof_stridx_t dofp_provider;	/* provider string */
	dof_stridx_t dofp_mod;		/* module string */
	dof_stridx_t dofp_func;		/* function string */
	dof_stridx_t dofp_name;		/* name string */
	uint32_t dofp_id;		/* probe identifier (or zero) */
} dof_probedesc_t;
762 
/*
 * Element of a DOF_SECT_ACTDESC array: one action, identified by its kind,
 * with links to its DIFO header and string table and with kind-specific and
 * user-supplied arguments.
 */
typedef struct dof_actdesc {
	dof_secidx_t dofa_difo;		/* link to DOF_SECT_DIFOHDR */
	dof_secidx_t dofa_strtab;	/* link to DOF_SECT_STRTAB section */
	uint32_t dofa_kind;		/* action kind (DTRACEACT_* constant) */
	uint32_t dofa_ntuple;		/* number of subsequent tuple actions */
	uint64_t dofa_arg;		/* kind-specific argument */
	uint64_t dofa_uarg;		/* user-supplied argument */
} dof_actdesc_t;
771 
/*
 * Contents of a DOF_SECT_DIFOHDR section: the return type of a DIF fragment
 * followed by a list of section indices.  dofd_links is declared with a
 * single element but is treated as variable length, so the section may be
 * larger than sizeof (dof_difohdr_t).
 */
typedef struct dof_difohdr {
	dtrace_diftype_t dofd_rtype;	/* return type for this fragment */
	dof_secidx_t dofd_links[1];	/* variable length array of indices */
} dof_difohdr_t;
776 
/*
 * Relocation header (used by DOF_SECT_URELHDR and DOF_SECT_KRELHDR
 * sections): names the relocation table, the string table holding symbol
 * names, and the section to which the relocations apply.
 */
typedef struct dof_relohdr {
	dof_secidx_t dofr_strtab;	/* link to DOF_SECT_STRTAB for names */
	dof_secidx_t dofr_relsec;	/* link to DOF_SECT_RELTAB for relos */
	dof_secidx_t dofr_tgtsec;	/* link to section we are relocating */
} dof_relohdr_t;
782 
/*
 * Element of a DOF_SECT_RELTAB array: a single relocation, giving the
 * symbol name, the relocation type (one of the DOF_RELO_* constants below),
 * the byte offset to relocate, and type-specific data.
 */
typedef struct dof_relodesc {
	dof_stridx_t dofr_name;		/* string name of relocation symbol */
	uint32_t dofr_type;		/* relo type (DOF_RELO_* constant) */
	uint64_t dofr_offset;		/* byte offset for relocation */
	uint64_t dofr_data;		/* additional type-specific data */
} dof_relodesc_t;

/* Relocation types stored in dofr_type. */
#define	DOF_RELO_NONE	0		/* empty relocation entry */
#define	DOF_RELO_SETX	1		/* relocate setx value */
792 
/*
 * Element of a DOF_SECT_OPTDESC array: one option setting.  dofo_value holds
 * either the option value itself or, for string options, an index into the
 * string table named by dofo_strtab.
 */
typedef struct dof_optdesc {
	uint32_t dofo_option;		/* option identifier */
	dof_secidx_t dofo_strtab;	/* string table, if string option */
	uint64_t dofo_value;		/* option value or string index */
} dof_optdesc_t;
798 
/*
 * Stability attributes are packed into a single 32-bit dof_attr_t:
 *
 *	bits 31-24	name stability
 *	bits 23-16	data stability
 *	bits 15-8	dependency class
 *	bits  7-0	unused (zero)
 *
 * DOF_ATTR() packs the three components; the DOF_ATTR_*() accessors extract
 * them again.  Each component is cast to dof_attr_t before it is shifted so
 * that the arithmetic is performed in an unsigned 32-bit type: shifting a
 * promoted (signed) int left by 24 is undefined once bit 7 of the name
 * component is set.
 */
typedef uint32_t dof_attr_t;		/* encoded stability attributes */

#define	DOF_ATTR(n, d, c)						\
	(((dof_attr_t)(n) << 24) | ((dof_attr_t)(d) << 16) |		\
	((dof_attr_t)(c) << 8))
#define	DOF_ATTR_NAME(a)	(((a) >> 24) & 0xff)
#define	DOF_ATTR_DATA(a)	(((a) >> 16) & 0xff)
#define	DOF_ATTR_CLASS(a)	(((a) >>  8) & 0xff)
805 
/*
 * Contents of a DOF_SECT_PROVIDER section: a provider definition.  It links
 * to the sections holding the provider's strings, probes, argument mappings
 * and offsets, and carries the encoded stability attributes for each
 * component of the probe description and for the arguments.
 */
typedef struct dof_provider {
	dof_secidx_t dofpv_strtab;	/* link to DOF_SECT_STRTAB section */
	dof_secidx_t dofpv_probes;	/* link to DOF_SECT_PROBES section */
	dof_secidx_t dofpv_prargs;	/* link to DOF_SECT_PRARGS section */
	dof_secidx_t dofpv_proffs;	/* link to DOF_SECT_PROFFS section */
	dof_stridx_t dofpv_name;	/* provider name string */
	dof_attr_t dofpv_provattr;	/* provider attributes */
	dof_attr_t dofpv_modattr;	/* module attributes */
	dof_attr_t dofpv_funcattr;	/* function attributes */
	dof_attr_t dofpv_nameattr;	/* name attributes */
	dof_attr_t dofpv_argsattr;	/* args attributes */
	dof_secidx_t dofpv_prenoffs;	/* link to DOF_SECT_PRENOFFS section */
} dof_provider_t;
819 
/*
 * Element of a DOF_SECT_PROBES array: one probe of a provider.  The *idx
 * members give the index of the probe's first entry in an associated array
 * and the matching count members give the number of entries.
 * NOTE(review): presumably the strings and index targets live in the
 * sections linked from the owning dof_provider_t -- confirm against the DOF
 * consumer.
 */
typedef struct dof_probe {
	uint64_t dofpr_addr;		/* probe base address or offset */
	dof_stridx_t dofpr_func;	/* probe function string */
	dof_stridx_t dofpr_name;	/* probe name string */
	dof_stridx_t dofpr_nargv;	/* native argument type strings */
	dof_stridx_t dofpr_xargv;	/* translated argument type strings */
	uint32_t dofpr_argidx;		/* index of first argument mapping */
	uint32_t dofpr_offidx;		/* index of first offset entry */
	uint8_t dofpr_nargc;		/* native argument count */
	uint8_t dofpr_xargc;		/* translated argument count */
	uint16_t dofpr_noffs;		/* number of offset entries for probe */
	uint32_t dofpr_enoffidx;	/* index of first is-enabled offset */
	uint16_t dofpr_nenoffs;		/* number of is-enabled offsets */
	uint16_t dofpr_pad1;		/* reserved for future use */
	uint32_t dofpr_pad2;		/* reserved for future use */
} dof_probe_t;
836 
/*
 * Translator definition (the payload of DOF_SECT_XLIMPORT and
 * DOF_SECT_XLEXPORT sections): links to the translator's members and string
 * table, and describes its input parameter types, output type and output
 * stability attributes.
 */
typedef struct dof_xlator {
	dof_secidx_t dofxl_members;	/* link to DOF_SECT_XLMEMBERS section */
	dof_secidx_t dofxl_strtab;	/* link to DOF_SECT_STRTAB section */
	dof_stridx_t dofxl_argv;	/* input parameter type strings */
	uint32_t dofxl_argc;		/* input parameter list length */
	dof_stridx_t dofxl_type;	/* output type string name */
	dof_attr_t dofxl_attr;		/* output stability attributes */
} dof_xlator_t;
845 
/*
 * Element of a DOF_SECT_XLMEMBERS array: one translator member, giving its
 * name, its type, and a link to the DIFO header for the member.
 */
typedef struct dof_xlmember {
	dof_secidx_t dofxm_difo;	/* member link to DOF_SECT_DIFOHDR */
	dof_stridx_t dofxm_name;	/* member name */
	dtrace_diftype_t dofxm_type;	/* member type */
} dof_xlmember_t;
851 
/*
 * Element of a DOF_SECT_XLTAB array: a reference to one member of a
 * translator, together with the argument index used by DIF_OP_XLARG.
 * NOTE(review): the dofxr_xlator comment names "DOF_SECT_XLATORS", but no
 * such section type is defined in the DOF_SECT_* list in this header;
 * presumably the link targets a DOF_SECT_XLIMPORT or DOF_SECT_XLEXPORT
 * section (both hold dof_xlator_t) -- confirm.
 */
typedef struct dof_xlref {
	dof_secidx_t dofxr_xlator;	/* link to DOF_SECT_XLATORS section */
	uint32_t dofxr_member;		/* index of referenced dof_xlmember */
	uint32_t dofxr_argn;		/* index of argument for DIF_OP_XLARG */
} dof_xlref_t;
857 
858 /*
859  * DTrace Intermediate Format Object (DIFO)
860  *
861  * A DIFO is used to store the compiled DIF for a D expression, its return
862  * type, and its string and variable tables.  The string table is a single
863  * buffer of character data into which sets instructions and variable
864  * references can reference strings using a byte offset.  The variable table
865  * is an array of dtrace_difv_t structures that describe the name and type of
866  * each variable and the id used in the DIF code.  This structure is described
867  * above in the DIF section of this header file.  The DIFO is used at both
868  * user-level (in the library) and in the kernel, but the structure is never
869  * passed between the two: the DOF structures form the only interface.  As a
870  * result, the definition can change depending on the presence of _KERNEL.
871  */
typedef struct dtrace_difo {
	/* Tables: each pointer below is paired with a length further down. */
	dif_instr_t *dtdo_buf;		/* instruction buffer */
	uint64_t *dtdo_inttab;		/* integer table (optional) */
	char *dtdo_strtab;		/* string table (optional) */
	dtrace_difv_t *dtdo_vartab;	/* variable table (optional) */
	uint_t dtdo_len;		/* length of instruction buffer */
	uint_t dtdo_intlen;		/* length of integer table */
	uint_t dtdo_strlen;		/* length of string table */
	uint_t dtdo_varlen;		/* length of variable table */
	dtrace_diftype_t dtdo_rtype;	/* return type */
	uint_t dtdo_refcnt;		/* owner reference count */
	uint_t dtdo_destructive;	/* invokes destructive subroutines */
	/*
	 * The remaining members exist only when _KERNEL is not defined, so
	 * the structure is larger in user-level builds than in kernel builds.
	 */
#ifndef _KERNEL
	dof_relodesc_t *dtdo_kreltab;	/* kernel relocations */
	dof_relodesc_t *dtdo_ureltab;	/* user relocations */
	struct dt_node **dtdo_xlmtab;	/* translator references */
	uint_t dtdo_krelen;		/* length of krelo table */
	uint_t dtdo_urelen;		/* length of urelo table */
	uint_t dtdo_xlmlen;		/* length of translator table */
#endif
} dtrace_difo_t;
893 
894 /*
895  * DTrace Enabling Description Structures
896  *
897  * When DTrace is tracking the description of a DTrace enabling entity (probe,
898  * predicate, action, ECB, record, etc.), it does so in a description
899  * structure.  These structures all end in "desc", and are used at both
900  * user-level and in the kernel -- but (with the exception of
901  * dtrace_probedesc_t) they are never passed between them.  Typically,
902  * user-level will use the description structures when assembling an enabling.
903  * It will then distill those description structures into a DOF object (see
904  * above), and send it into the kernel.  The kernel will again use the
905  * description structures to create a description of the enabling as it reads
906  * the DOF.  When the description is complete, the enabling will be actually
907  * created -- turning it into the structures that represent the enabling
908  * instead of merely describing it.  Not surprisingly, the description
909  * structures bear a strong resemblance to the DOF structures that act as their
910  * conduit.
911  */
/* Forward declaration; only pointers to it are used in this section. */
struct dtrace_predicate;

/*
 * Probe description: a probe identifier plus the four name components
 * (provider, module, function, name), each held in a fixed-size character
 * array.
 */
typedef struct dtrace_probedesc {
	dtrace_id_t dtpd_id;			/* probe identifier */
	char dtpd_provider[DTRACE_PROVNAMELEN]; /* probe provider name */
	char dtpd_mod[DTRACE_MODNAMELEN];	/* probe module name */
	char dtpd_func[DTRACE_FUNCNAMELEN];	/* probe function name */
	char dtpd_name[DTRACE_NAMELEN];		/* probe name */
} dtrace_probedesc_t;
921 
/*
 * Replication description: a pair of probe descriptions, one to match and
 * one to create.
 */
typedef struct dtrace_repldesc {
	dtrace_probedesc_t dtrpd_match;		/* probe descr. to match */
	dtrace_probedesc_t dtrpd_create;	/* probe descr. to create */
} dtrace_repldesc_t;
926 
/*
 * Predicate description: a pointer to the predicate's DIF object and a
 * pointer to the predicate structure itself.
 */
typedef struct dtrace_preddesc {
	dtrace_difo_t *dtpdd_difo;		/* pointer to DIF object */
	struct dtrace_predicate *dtpdd_predicate; /* pointer to predicate */
} dtrace_preddesc_t;
931 
/*
 * Action description.  Descriptions are chained through dtad_next into a
 * singly linked list and carry a reference count.
 */
typedef struct dtrace_actdesc {
	dtrace_difo_t *dtad_difo;		/* pointer to DIF object */
	struct dtrace_actdesc *dtad_next;	/* next action */
	dtrace_actkind_t dtad_kind;		/* kind of action */
	uint32_t dtad_ntuple;			/* number in tuple */
	uint64_t dtad_arg;			/* action argument */
	uint64_t dtad_uarg;			/* user argument */
	int dtad_refcnt;			/* reference count */
} dtrace_actdesc_t;
941 
/*
 * ECB description: combines a list of action descriptions with an embedded
 * predicate description and probe description, a library argument and a
 * reference count.
 */
typedef struct dtrace_ecbdesc {
	dtrace_actdesc_t *dted_action;		/* action description(s) */
	dtrace_preddesc_t dted_pred;		/* predicate description */
	dtrace_probedesc_t dted_probe;		/* probe description */
	uint64_t dted_uarg;			/* library argument */
	int dted_refcnt;			/* reference count */
} dtrace_ecbdesc_t;
949 
950 /*
951  * DTrace Metadata Description Structures
952  *
953  * DTrace separates the trace data stream from the metadata stream.  The only
954  * metadata tokens placed in the data stream are the dtrace_rechdr_t (EPID +
955  * timestamp) or (in the case of aggregations) aggregation identifiers.  To
956  * determine the structure of the data, DTrace consumers pass the token to the
957  * kernel, and receive in return a corresponding description of the enabled
958  * probe (via the dtrace_eprobedesc structure) or the aggregation (via the
959  * dtrace_aggdesc structure).  Both of these structures are expressed in terms
960  * of record descriptions (via the dtrace_recdesc structure) that describe the
961  * exact structure of the data.  Some record descriptions may also contain a
962  * format identifier; this additional bit of metadata can be retrieved from the
963  * kernel, for which a format description is returned via the dtrace_fmtdesc
964  * structure.  Note that all four of these structures must be bitness-neutral
965  * to allow for a 32-bit DTrace consumer on a 64-bit kernel.
966  */
/*
 * Record description: describes one record within an ECB's data -- the
 * action that produced it, its size, offset and alignment, an optional
 * format identifier, and the action and user arguments.
 */
typedef struct dtrace_recdesc {
	dtrace_actkind_t dtrd_action;		/* kind of action */
	uint32_t dtrd_size;			/* size of record */
	uint32_t dtrd_offset;			/* offset in ECB's data */
	uint16_t dtrd_alignment;		/* required alignment */
	uint16_t dtrd_format;			/* format, if any */
	uint64_t dtrd_arg;			/* action argument */
	uint64_t dtrd_uarg;			/* user argument */
} dtrace_recdesc_t;
976 
/*
 * Enabled probe description.  dtepd_rec is declared with one element but
 * holds dtepd_nrecs record descriptions; DTRACE_SIZEOF_EPROBEDESC() below
 * computes the full size of such a description.
 */
typedef struct dtrace_eprobedesc {
	dtrace_epid_t dtepd_epid;		/* enabled probe ID */
	dtrace_id_t dtepd_probeid;		/* probe ID */
	uint64_t dtepd_uarg;			/* library argument */
	uint32_t dtepd_size;			/* total size */
	int dtepd_nrecs;			/* number of records */
	dtrace_recdesc_t dtepd_rec[1];		/* records themselves */
} dtrace_eprobedesc_t;
985 
/*
 * Aggregation description.  The first three members are not filled in by
 * the kernel.  dtagd_rec is declared with one element but holds dtagd_nrecs
 * record descriptions; DTRACE_SIZEOF_AGGDESC() below computes the full size
 * of such a description.
 * NOTE(review): DTRACE_PTR() is defined elsewhere in this header; presumably
 * it keeps the pointer member the same size for 32-bit and 64-bit consumers
 * -- confirm against its definition.
 */
typedef struct dtrace_aggdesc {
	DTRACE_PTR(char, dtagd_name);		/* not filled in by kernel */
	dtrace_aggvarid_t dtagd_varid;		/* not filled in by kernel */
	int dtagd_flags;			/* not filled in by kernel */
	dtrace_aggid_t dtagd_id;		/* aggregation ID */
	dtrace_epid_t dtagd_epid;		/* enabled probe ID */
	uint32_t dtagd_size;			/* size in bytes */
	int dtagd_nrecs;			/* number of records */
	uint32_t dtagd_pad;			/* explicit padding */
	dtrace_recdesc_t dtagd_rec[1];		/* record descriptions */
} dtrace_aggdesc_t;
997 
/*
 * Format description: a format string, its length, and the format
 * identifier (the same 16-bit identifier type that appears as dtrd_format
 * in dtrace_recdesc_t).
 */
typedef struct dtrace_fmtdesc {
	DTRACE_PTR(char, dtfd_string);		/* format string */
	int dtfd_length;			/* length of format string */
	uint16_t dtfd_format;			/* format identifier */
} dtrace_fmtdesc_t;
1003 
/*
 * Size in bytes of an enabled probe description holding dtepd_nrecs record
 * descriptions.  The structure itself already contains room for one record,
 * so only the records beyond the first add to the size; a description with
 * no records is still sizeof (dtrace_eprobedesc_t).  Note that desc is
 * evaluated twice.
 */
#define	DTRACE_SIZEOF_EPROBEDESC(desc)					\
	((((desc)->dtepd_nrecs != 0) ?					\
	    (((desc)->dtepd_nrecs - 1) * sizeof (dtrace_recdesc_t)) :	\
	    0) + sizeof (dtrace_eprobedesc_t))

/*
 * Size in bytes of an aggregation description holding dtagd_nrecs record
 * descriptions, computed in the same way as DTRACE_SIZEOF_EPROBEDESC().
 */
#define	DTRACE_SIZEOF_AGGDESC(desc)					\
	((((desc)->dtagd_nrecs != 0) ?					\
	    (((desc)->dtagd_nrecs - 1) * sizeof (dtrace_recdesc_t)) :	\
	    0) + sizeof (dtrace_aggdesc_t))
1011 
1012 /*
1013  * DTrace Option Interface
1014  *
1015  * Run-time DTrace options are set and retrieved via DOF_SECT_OPTDESC sections
1016  * in a DOF image.  The dof_optdesc structure contains an option identifier and
1017  * an option value.  The valid option identifiers are found below; the mapping
1018  * between option identifiers and option identifying strings is maintained at
1019  * user-level.  Note that the value of DTRACEOPT_UNSET is such that all of the
1020  * following are potentially valid option values:  all positive integers, zero
1021  * and negative one.  Some options (notably "bufpolicy" and "bufresize") take
1022  * predefined tokens as their values; these are defined with
1023  * DTRACEOPT_{option}_{token}.
1024  */
/*
 * Option identifiers.  These are dense, zero-based values; DTRACEOPT_MAX is
 * the number of options and therefore one greater than the largest
 * identifier.
 */
#define	DTRACEOPT_BUFSIZE	0	/* buffer size */
#define	DTRACEOPT_BUFPOLICY	1	/* buffer policy */
#define	DTRACEOPT_DYNVARSIZE	2	/* dynamic variable size */
#define	DTRACEOPT_AGGSIZE	3	/* aggregation size */
#define	DTRACEOPT_SPECSIZE	4	/* speculation size */
#define	DTRACEOPT_NSPEC		5	/* number of speculations */
#define	DTRACEOPT_STRSIZE	6	/* string size */
#define	DTRACEOPT_CLEANRATE	7	/* dynvar cleaning rate */
#define	DTRACEOPT_CPU		8	/* CPU to trace */
#define	DTRACEOPT_BUFRESIZE	9	/* buffer resizing policy */
#define	DTRACEOPT_GRABANON	10	/* grab anonymous state, if any */
#define	DTRACEOPT_FLOWINDENT	11	/* indent function entry/return */
#define	DTRACEOPT_QUIET		12	/* only output explicitly traced data */
#define	DTRACEOPT_STACKFRAMES	13	/* number of stack frames */
#define	DTRACEOPT_USTACKFRAMES	14	/* number of user stack frames */
#define	DTRACEOPT_AGGRATE	15	/* aggregation snapshot rate */
#define	DTRACEOPT_SWITCHRATE	16	/* buffer switching rate */
#define	DTRACEOPT_STATUSRATE	17	/* status rate */
#define	DTRACEOPT_DESTRUCTIVE	18	/* destructive actions allowed */
#define	DTRACEOPT_STACKINDENT	19	/* output indent for stack traces */
#define	DTRACEOPT_RAWBYTES	20	/* always print bytes in raw form */
#define	DTRACEOPT_JSTACKFRAMES	21	/* number of jstack() frames */
#define	DTRACEOPT_JSTACKSTRSIZE	22	/* size of jstack() string table */
#define	DTRACEOPT_AGGSORTKEY	23	/* sort aggregations by key */
#define	DTRACEOPT_AGGSORTREV	24	/* reverse-sort aggregations */
#define	DTRACEOPT_AGGSORTPOS	25	/* agg. position to sort on */
#define	DTRACEOPT_AGGSORTKEYPOS	26	/* agg. key position to sort on */
#define	DTRACEOPT_TEMPORAL	27	/* temporally ordered output */
#define	DTRACEOPT_AGGHIST	28	/* histogram aggregation output */
#define	DTRACEOPT_AGGPACK	29	/* packed aggregation output */
#define	DTRACEOPT_AGGZOOM	30	/* zoomed aggregation scaling */
#define	DTRACEOPT_ZONE		31	/* zone in which to enable probes */
#define	DTRACEOPT_MAX		32	/* number of options */

/*
 * Value denoting an option that has not been set.  The replacement list is
 * fully parenthesized so that the cast expression stays a single operand
 * wherever the macro is expanded (for example as the operand of sizeof).
 */
#define	DTRACEOPT_UNSET		((dtrace_optval_t)-2)	/* unset option */

/* Predefined token values for the "bufpolicy" option. */
#define	DTRACEOPT_BUFPOLICY_RING	0	/* ring buffer */
#define	DTRACEOPT_BUFPOLICY_FILL	1	/* fill buffer, then stop */
#define	DTRACEOPT_BUFPOLICY_SWITCH	2	/* switch buffers */

/* Predefined token values for the "bufresize" option. */
#define	DTRACEOPT_BUFRESIZE_AUTO	0	/* automatic resizing */
#define	DTRACEOPT_BUFRESIZE_MANUAL	1	/* manual resizing */
1067 
1068 /*
1069  * DTrace Buffer Interface
1070  *
1071  * In order to get a snapshot of the principal or aggregation buffer,
1072  * user-level passes a buffer description to the kernel with the dtrace_bufdesc
1073  * structure.  This describes which CPU user-level is interested in, and
1074  * where user-level wishes the kernel to snapshot the buffer to (the
1075  * dtbd_data field).  The kernel uses the same structure to pass back some
1076  * information regarding the buffer:  the size of data actually copied out, the
1077  * number of drops, the number of errors, the offset of the oldest record,
1078  * and the time of the snapshot.
1079  *
1080  * If the buffer policy is a "switch" policy, taking a snapshot of the
1081  * principal buffer has the additional effect of switching the active and
1082  * inactive buffers.  Taking a snapshot of the aggregation buffer _always_ has
1083  * the additional effect of switching the active and inactive buffers.
1084  */
/*
 * Buffer description exchanged between user-level and the kernel when a
 * buffer snapshot is taken.  User-level names the CPU and the destination
 * (dtbd_data); the kernel reports back the size copied, drop and error
 * counts, the offset of the oldest record and the snapshot time.
 */
typedef struct dtrace_bufdesc {
	uint64_t dtbd_size;			/* size of buffer */
	uint32_t dtbd_cpu;			/* CPU or DTRACE_CPUALL */
	uint32_t dtbd_errors;			/* number of errors */
	uint64_t dtbd_drops;			/* number of drops */
	DTRACE_PTR(char, dtbd_data);		/* data */
	uint64_t dtbd_oldest;			/* offset of oldest record */
	uint64_t dtbd_timestamp;		/* hrtime of snapshot */
} dtrace_bufdesc_t;
1094 
1095 /*
1096  * Each record in the buffer (dtbd_data) begins with a header that includes
1097  * the epid and a timestamp.  The timestamp is split into two 4-byte parts
1098  * so that we do not require 8-byte alignment.
1099  */
/*
 * Record header.  The timestamp is stored as two 32-bit halves; use
 * DTRACE_RECORD_LOAD_TIMESTAMP() and DTRACE_RECORD_STORE_TIMESTAMP() below
 * to read and write it rather than touching the halves directly.
 */
typedef struct dtrace_rechdr {
	dtrace_epid_t dtrh_epid;		/* enabled probe id */
	uint32_t dtrh_timestamp_hi;		/* high bits of hrtime_t */
	uint32_t dtrh_timestamp_lo;		/* low bits of hrtime_t */
} dtrace_rechdr_t;
1105 
/*
 * Reassemble the 64-bit timestamp from the two 32-bit halves of the record
 * header pointed to by dtrh.  Evaluates to a uint64_t; dtrh is evaluated
 * twice.
 */
#define	DTRACE_RECORD_LOAD_TIMESTAMP(dtrh)			\
	((dtrh)->dtrh_timestamp_lo +				\
	((uint64_t)(dtrh)->dtrh_timestamp_hi << 32))

/*
 * Split hrtime into its low and high 32-bit halves and store them in the
 * record header pointed to by dtrh.
 *
 * The hrtime argument is parenthesized so that an expression argument (for
 * example "a | b") is split as a whole, and it is widened to uint64_t
 * before the shift so that the shift is well defined even when the argument
 * has a type narrower than 64 bits.  Both dtrh and hrtime are evaluated
 * twice.
 *
 * The macro expands to a brace-enclosed block, as it always has, so
 * existing call sites with or without a trailing semicolon keep working.
 */
#define	DTRACE_RECORD_STORE_TIMESTAMP(dtrh, hrtime) {		\
	(dtrh)->dtrh_timestamp_lo = (uint32_t)(hrtime);		\
	(dtrh)->dtrh_timestamp_hi =				\
	    (uint32_t)((uint64_t)(hrtime) >> 32);		\
}
1114 
1115 /*
1116  * DTrace Status
1117  *
1118  * The status of DTrace is relayed via the dtrace_status structure.  This
1119  * structure contains members to count drops other than the capacity drops
1120  * available via the buffer interface (see above).  This consists of dynamic
1121  * drops (including capacity dynamic drops, rinsing drops and dirty drops), and
1122  * speculative drops (including capacity speculative drops, drops due to busy
1123  * speculative buffers and drops due to unavailable speculative buffers).
 * Additionally, the status structure contains a field to indicate the number
 * of "fill"-policy buffers that have been filled and a boolean field to
 * indicate that exit() has been called.  If the dtst_exiting field is
 * non-zero, no further data will be generated until tracing is stopped (at
 * which time any enablings of the END action will be processed); if
 * user-level sees that this field is non-zero, tracing should be stopped as
 * soon as possible.
1130  */
/*
 * Status counters and flags.  The two single-byte flags are followed by six
 * bytes of explicit padding so that they together occupy eight bytes after
 * the 64-bit counters.
 */
typedef struct dtrace_status {
	uint64_t dtst_dyndrops;			/* dynamic drops */
	uint64_t dtst_dyndrops_rinsing;		/* dyn drops due to rinsing */
	uint64_t dtst_dyndrops_dirty;		/* dyn drops due to dirty */
	uint64_t dtst_specdrops;		/* speculative drops */
	uint64_t dtst_specdrops_busy;		/* spec drops due to busy */
	uint64_t dtst_specdrops_unavail;	/* spec drops due to unavail */
	uint64_t dtst_errors;			/* total errors */
	uint64_t dtst_filled;			/* number of filled bufs */
	uint64_t dtst_stkstroverflows;		/* stack string tab overflows */
	uint64_t dtst_dblerrors;		/* errors in ERROR probes */
	char dtst_killed;			/* non-zero if killed */
	char dtst_exiting;			/* non-zero if exit() called */
	char dtst_pad[6];			/* pad out to 64-bit align */
} dtrace_status_t;
1146 
1147 /*
1148  * DTrace Configuration
1149  *
1150  * User-level may need to understand some elements of the kernel DTrace
1151  * configuration in order to generate correct DIF.  This information is
1152  * conveyed via the dtrace_conf structure.
1153  */
/*
 * Kernel DTrace configuration as reported to user-level: the supported DIF
 * version, the register counts and the CTF data model, followed by eight
 * reserved words.
 */
typedef struct dtrace_conf {
	uint_t dtc_difversion;			/* supported DIF version */
	uint_t dtc_difintregs;			/* # of DIF integer registers */
	uint_t dtc_diftupregs;			/* # of DIF tuple registers */
	uint_t dtc_ctfmodel;			/* CTF data model */
	uint_t dtc_pad[8];			/* reserved for future use */
} dtrace_conf_t;
1161 
1162 /*
1163  * DTrace Faults
1164  *
1165  * The constants below DTRACEFLT_LIBRARY indicate probe processing faults;
1166  * constants at or above DTRACEFLT_LIBRARY indicate faults in probe
1167  * postprocessing at user-level.  Probe processing faults induce an ERROR
1168  * probe and are replicated in unistd.d to allow users' ERROR probes to decode
 * the error condition using these symbolic labels.
1170  */
/* Probe processing faults (values below DTRACEFLT_LIBRARY). */
#define	DTRACEFLT_UNKNOWN		0	/* Unknown fault */
#define	DTRACEFLT_BADADDR		1	/* Bad address */
#define	DTRACEFLT_BADALIGN		2	/* Bad alignment */
#define	DTRACEFLT_ILLOP			3	/* Illegal operation */
#define	DTRACEFLT_DIVZERO		4	/* Divide-by-zero */
#define	DTRACEFLT_NOSCRATCH		5	/* Out of scratch space */
#define	DTRACEFLT_KPRIV			6	/* Illegal kernel access */
#define	DTRACEFLT_UPRIV			7	/* Illegal user access */
#define	DTRACEFLT_TUPOFLOW		8	/* Tuple stack overflow */
#define	DTRACEFLT_BADSTACK		9	/* Bad stack */

/* First value of the range used for user-level postprocessing faults. */
#define	DTRACEFLT_LIBRARY		1000	/* Library-level fault */
1183 
1184 /*
1185  * DTrace Argument Types
1186  *
1187  * Because it would waste both space and time, argument types do not reside
1188  * with the probe.  In order to determine argument types for args[X]
1189  * variables, the D compiler queries for argument types on a probe-by-probe
1190  * basis.  (This optimizes for the common case that arguments are either not
1191  * used or used in an untyped fashion.)  Typed arguments are specified with a
 * string of the type name in the dtargd_native member of the argument
1193  * description structure.  Typed arguments may be further translated to types
1194  * of greater stability; the provider indicates such a translated argument by
1195  * filling in the dtargd_xlate member with the string of the translated type.
1196  * Finally, the provider may indicate which argument value a given argument
1197  * maps to by setting the dtargd_mapping member -- allowing a single argument
1198  * to map to multiple args[X] variables.
1199  */
/*
 * Argument description for one argument of one probe: which probe and
 * argument number it describes, the argument value it maps to, and the
 * native and translated type names as fixed-size strings.
 */
typedef struct dtrace_argdesc {
	dtrace_id_t dtargd_id;			/* probe identifier */
	int dtargd_ndx;				/* arg number (-1 iff none) */
	int dtargd_mapping;			/* value mapping */
	char dtargd_native[DTRACE_ARGTYPELEN];	/* native type name */
	char dtargd_xlate[DTRACE_ARGTYPELEN];	/* translated type name */
} dtrace_argdesc_t;
1207 
1208 /*
1209  * DTrace Stability Attributes
1210  *
1211  * Each DTrace provider advertises the name and data stability of each of its
1212  * probe description components, as well as its architectural dependencies.
1213  * The D compiler can query the provider attributes (dtrace_pattr_t below) in
1214  * order to compute the properties of an input program and report them.
1215  */
/* Both codes are single bytes. */
typedef uint8_t dtrace_stability_t;	/* stability code (see attributes(5)) */
typedef uint8_t dtrace_class_t;		/* architectural dependency class */

/*
 * Stability codes, in increasing numeric order from INTERNAL to STANDARD.
 * DTRACE_STABILITY_MAX equals the largest defined code.
 */
#define	DTRACE_STABILITY_INTERNAL	0	/* private to DTrace itself */
#define	DTRACE_STABILITY_PRIVATE	1	/* private to Sun (see docs) */
#define	DTRACE_STABILITY_OBSOLETE	2	/* scheduled for removal */
#define	DTRACE_STABILITY_EXTERNAL	3	/* not controlled by Sun */
#define	DTRACE_STABILITY_UNSTABLE	4	/* new or rapidly changing */
#define	DTRACE_STABILITY_EVOLVING	5	/* less rapidly changing */
#define	DTRACE_STABILITY_STABLE		6	/* mature interface from Sun */
#define	DTRACE_STABILITY_STANDARD	7	/* industry standard */
#define	DTRACE_STABILITY_MAX		7	/* maximum valid stability */

/*
 * Architectural dependency classes.  DTRACE_CLASS_MAX equals the largest
 * defined class.
 */
#define	DTRACE_CLASS_UNKNOWN	0	/* unknown architectural dependency */
#define	DTRACE_CLASS_CPU	1	/* CPU-module-specific */
#define	DTRACE_CLASS_PLATFORM	2	/* platform-specific (uname -i) */
#define	DTRACE_CLASS_GROUP	3	/* hardware-group-specific (uname -m) */
#define	DTRACE_CLASS_ISA	4	/* ISA-specific (uname -p) */
#define	DTRACE_CLASS_COMMON	5	/* common to all systems */
#define	DTRACE_CLASS_MAX	5	/* maximum valid class */
1236 
/*
 * Privilege flags.  Each non-zero flag is a distinct bit, so flags may be
 * OR'd together; DTRACE_PRIV_ALL is the union of every flag defined here.
 */
#define	DTRACE_PRIV_NONE	0x0000
#define	DTRACE_PRIV_KERNEL	0x0001
#define	DTRACE_PRIV_USER	0x0002
#define	DTRACE_PRIV_PROC	0x0004
#define	DTRACE_PRIV_OWNER	0x0008
#define	DTRACE_PRIV_ZONEOWNER	0x0010

#define	DTRACE_PRIV_ALL	\
	(DTRACE_PRIV_KERNEL | DTRACE_PRIV_USER | \
	DTRACE_PRIV_PROC | DTRACE_PRIV_OWNER | DTRACE_PRIV_ZONEOWNER)
1247 
/*
 * Provider privilege description: privilege flags together with a user ID
 * and a zone ID.
 * NOTE(review): dtpp_flags presumably holds DTRACE_PRIV_* bits -- confirm.
 */
typedef struct dtrace_ppriv {
	uint32_t dtpp_flags;			/* privilege flags */
	uid_t dtpp_uid;				/* user ID */
	zoneid_t dtpp_zoneid;			/* zone ID */
} dtrace_ppriv_t;
1253 
/*
 * Stability attribute triple for one entity: name stability, data stability
 * and dependency class, one byte each.
 */
typedef struct dtrace_attribute {
	dtrace_stability_t dtat_name;		/* entity name stability */
	dtrace_stability_t dtat_data;		/* entity data stability */
	dtrace_class_t dtat_class;		/* entity data dependency */
} dtrace_attribute_t;
1259 
/*
 * Provider attributes: one dtrace_attribute_t for each component of the
 * probe description (provider, module, function, name) and one for the
 * args[] array.
 */
typedef struct dtrace_pattr {
	dtrace_attribute_t dtpa_provider;	/* provider attributes */
	dtrace_attribute_t dtpa_mod;		/* module attributes */
	dtrace_attribute_t dtpa_func;		/* function attributes */
	dtrace_attribute_t dtpa_name;		/* name attributes */
	dtrace_attribute_t dtpa_args;		/* args[] attributes */
} dtrace_pattr_t;
1267 
/*
 * Provider description: the provider's name, its stability attributes and
 * the privileges it requires.  This is the argument type of the
 * DTRACEIOC_PROVIDER ioctl in the non-illumos definitions below.
 */
typedef struct dtrace_providerdesc {
	char dtvd_name[DTRACE_PROVNAMELEN];	/* provider name */
	dtrace_pattr_t dtvd_attr;		/* stability attributes */
	dtrace_ppriv_t dtvd_priv;		/* privileges required */
} dtrace_providerdesc_t;
1273 
1274 /*
1275  * DTrace Pseudodevice Interface
1276  *
1277  * DTrace is controlled through ioctl(2)'s to the in-kernel dtrace:dtrace
1278  * pseudodevice driver.  These ioctls comprise the user-kernel interface to
1279  * DTrace.
1280  */
/*
 * Two encodings of the ioctl commands are provided.  When illumos is
 * defined, each command is the DTRACEIOC base ('d', 't' and 'r' packed into
 * the upper three bytes) OR'd with a small command number.  Otherwise each
 * command is built with the _IOR/_IOW/_IOWR macros using group 'x', the
 * same command number, and the argument type shown.  Command numbers 3 and
 * 14 are not assigned in either branch.
 */
#ifdef illumos
#define	DTRACEIOC		(('d' << 24) | ('t' << 16) | ('r' << 8))
#define	DTRACEIOC_PROVIDER	(DTRACEIOC | 1)		/* provider query */
#define	DTRACEIOC_PROBES	(DTRACEIOC | 2)		/* probe query */
#define	DTRACEIOC_BUFSNAP	(DTRACEIOC | 4)		/* snapshot buffer */
#define	DTRACEIOC_PROBEMATCH	(DTRACEIOC | 5)		/* match probes */
#define	DTRACEIOC_ENABLE	(DTRACEIOC | 6)		/* enable probes */
#define	DTRACEIOC_AGGSNAP	(DTRACEIOC | 7)		/* snapshot agg. */
#define	DTRACEIOC_EPROBE	(DTRACEIOC | 8)		/* get eprobe desc. */
#define	DTRACEIOC_PROBEARG	(DTRACEIOC | 9)		/* get probe arg */
#define	DTRACEIOC_CONF		(DTRACEIOC | 10)	/* get config. */
#define	DTRACEIOC_STATUS	(DTRACEIOC | 11)	/* get status */
#define	DTRACEIOC_GO		(DTRACEIOC | 12)	/* start tracing */
#define	DTRACEIOC_STOP		(DTRACEIOC | 13)	/* stop tracing */
#define	DTRACEIOC_AGGDESC	(DTRACEIOC | 15)	/* get agg. desc. */
#define	DTRACEIOC_FORMAT	(DTRACEIOC | 16)	/* get format str */
#define	DTRACEIOC_DOFGET	(DTRACEIOC | 17)	/* get DOF */
#define	DTRACEIOC_REPLICATE	(DTRACEIOC | 18)	/* replicate enab */
#else
#define	DTRACEIOC_PROVIDER	_IOWR('x',1,dtrace_providerdesc_t)
							/* provider query */
#define	DTRACEIOC_PROBES	_IOWR('x',2,dtrace_probedesc_t)
							/* probe query */
#define	DTRACEIOC_BUFSNAP	_IOW('x',4,dtrace_bufdesc_t *)
							/* snapshot buffer */
#define	DTRACEIOC_PROBEMATCH	_IOWR('x',5,dtrace_probedesc_t)
							/* match probes */
/*
 * Argument of DTRACEIOC_ENABLE in this branch: carries the user-level
 * address of the DOF in, and the number of matches back out.
 */
typedef struct {
	void	*dof;		/* DOF userland address written to driver. */
	int	n_matched;	/* # matches returned by driver. */
} dtrace_enable_io_t;
#define	DTRACEIOC_ENABLE	_IOWR('x',6,dtrace_enable_io_t)
							/* enable probes */
#define	DTRACEIOC_AGGSNAP	_IOW('x',7,dtrace_bufdesc_t *)
							/* snapshot agg. */
#define	DTRACEIOC_EPROBE	_IOW('x',8,dtrace_eprobedesc_t)
							/* get eprobe desc. */
#define	DTRACEIOC_PROBEARG	_IOWR('x',9,dtrace_argdesc_t)
							/* get probe arg */
#define	DTRACEIOC_CONF		_IOR('x',10,dtrace_conf_t)
							/* get config. */
#define	DTRACEIOC_STATUS	_IOR('x',11,dtrace_status_t)
							/* get status */
#define	DTRACEIOC_GO		_IOR('x',12,processorid_t)
							/* start tracing */
#define	DTRACEIOC_STOP		_IOWR('x',13,processorid_t)
							/* stop tracing */
#define	DTRACEIOC_AGGDESC	_IOW('x',15,dtrace_aggdesc_t *)
							/* get agg. desc. */
#define	DTRACEIOC_FORMAT	_IOWR('x',16,dtrace_fmtdesc_t)
							/* get format str */
#define	DTRACEIOC_DOFGET	_IOW('x',17,dof_hdr_t *)
							/* get DOF */
#define	DTRACEIOC_REPLICATE	_IOW('x',18,dtrace_repldesc_t)
							/* replicate enab */
#endif
1337 
1338 /*
1339  * DTrace Helpers
1340  *
1341  * In general, DTrace establishes probes in processes and takes actions on
1342  * processes without knowing their specific user-level structures.  Instead of
1343  * existing in the framework, process-specific knowledge is contained by the
1344  * enabling D program -- which can apply process-specific knowledge by making
1345  * appropriate use of DTrace primitives like copyin() and copyinstr() to
1346  * operate on user-level data.  However, there may exist some specific probes
1347  * of particular semantic relevance that the application developer may wish to
1348  * explicitly export.  For example, an application may wish to export a probe
1349  * at the point that it begins and ends certain well-defined transactions.  In
1350  * addition to providing probes, programs may wish to offer assistance for
1351  * certain actions.  For example, in highly dynamic environments (e.g., Java),
1352  * it may be difficult to obtain a stack trace in terms of meaningful symbol
1353  * names (the translation from instruction addresses to corresponding symbol
1354  * names may only be possible in situ); these environments may wish to define
1355  * a series of actions to be applied in situ to obtain a meaningful stack
1356  * trace.
1357  *
1358  * These two mechanisms -- user-level statically defined tracing and assisting
1359  * DTrace actions -- are provided via DTrace _helpers_.  Helpers are specified
1360  * via DOF, but unlike enabling DOF, helper DOF may contain definitions of
1361  * providers, probes and their arguments.  If a helper wishes to provide
1362  * action assistance, probe descriptions and corresponding DIF actions may be
1363  * specified in the helper DOF.  For such helper actions, however, the probe
1364  * description describes the specific helper:  all DTrace helpers have the
1365  * provider name "dtrace" and the module name "helper", and the name of the
1366  * helper is contained in the function name (for example, the ustack() helper
1367  * is named "ustack").  Any helper-specific name may be contained in the name
1368  * (for example, if a helper were to have a constructor, it might be named
1369  * "dtrace:helper:<helper>:init").  Helper actions are only called when the
1370  * action that they are helping is taken.  Helper actions may only return DIF
1371  * expressions, and may only call the following subroutines:
1372  *
1373  *    alloca()      <= Allocates memory out of the consumer's scratch space
1374  *    bcopy()       <= Copies memory to scratch space
1375  *    copyin()      <= Copies memory from user-level into consumer's scratch
1376  *    copyinto()    <= Copies memory into a specific location in scratch
1377  *    copyinstr()   <= Copies a string into a specific location in scratch
1378  *
1379  * Helper actions may only access the following built-in variables:
1380  *
1381  *    curthread     <= Current kthread_t pointer
1382  *    tid           <= Current thread identifier
1383  *    pid           <= Current process identifier
1384  *    ppid          <= Parent process identifier
1385  *    uid           <= Current user ID
1386  *    gid           <= Current group ID
1387  *    execname      <= Current executable name
1388  *    zonename      <= Current zone name
1389  *
1390  * Helper actions may not manipulate or allocate dynamic variables, but they
1391  * may have clause-local and statically-allocated global variables.  The
1392  * helper action variable state is specific to the helper action -- variables
1393  * used by the helper action may not be accessed outside of the helper
1394  * action, and the helper action may not access variables that lie outside
1395  * of it.  Helper actions may not load from kernel memory at-large; they are
1396  * restricted to loading current user state (via copyin() and variants) and
1397  * scratch space.  As with probe enablings, helper actions are executed in
1398  * program order.  The result of the helper action is the result of the last
1399  * executing helper expression.
1400  *
1401  * Helpers -- composed of either providers/probes or probes/actions (or both)
1402  * -- are added by opening the "helper" minor node, and issuing an ioctl(2)
1403  * (DTRACEHIOC_ADDDOF) that specifies the dof_helper_t structure. This
1404  * encapsulates the name and base address of the user-level library or
1405  * executable publishing the helpers and probes as well as the DOF that
1406  * contains the definitions of those helpers and probes.
1407  *
1408  * The DTRACEHIOC_ADD and DTRACEHIOC_REMOVE ioctls are left in place for
1409  * legacy helpers and should no longer be used.  No other ioctls are valid on
1410  * the helper minor node.
1411  */
1412 #ifdef illumos
1413 #define	DTRACEHIOC		(('d' << 24) | ('t' << 16) | ('h' << 8)) /* base: "dth" in bits 8-31 */
1414 #define	DTRACEHIOC_ADD		(DTRACEHIOC | 1)	/* add helper (legacy) */
1415 #define	DTRACEHIOC_REMOVE	(DTRACEHIOC | 2)	/* remove helper (legacy) */
1416 #define	DTRACEHIOC_ADDDOF	(DTRACEHIOC | 3)	/* add helper DOF */
1417 #else	/* !illumos */
1418 #define	DTRACEHIOC_ADD		_IOWR('z', 1, dof_hdr_t)/* add helper (legacy) */
1419 #define	DTRACEHIOC_REMOVE	_IOW('z', 2, int)	/* remove helper (legacy) */
1420 #define	DTRACEHIOC_ADDDOF	_IOWR('z', 3, dof_helper_t)/* add helper DOF */
1421 #endif	/* illumos */
1422 
1423 typedef struct dof_helper {		/* DTRACEHIOC_ADDDOF argument */
1424 	char dofhp_mod[DTRACE_MODNAMELEN];	/* executable or library name */
1425 	uint64_t dofhp_addr;			/* base address of object */
1426 	uint64_t dofhp_dof;			/* address of helper DOF */
1427 #if defined(__FreeBSD__) || defined(__NetBSD__)
1428 	pid_t dofhp_pid;			/* target process ID */
1429 	int dofhp_gen;		/* NOTE(review): presumably helper generation -- confirm */
1430 #endif	/* __FreeBSD__ || __NetBSD__ */
1431 } dof_helper_t;
1432 
1433 #define	DTRACEMNR_DTRACE	"dtrace"	/* node name for DTrace ops */
1434 #define	DTRACEMNR_HELPER	"helper"	/* node name for helpers */
1435 #define	DTRACEMNRN_DTRACE	0		/* minor # for DTrace ops */
1436 #define	DTRACEMNRN_HELPER	1		/* minor # for helpers */
1437 #define	DTRACEMNRN_CLONE	2		/* first clone minor # */
1438 
1439 #ifdef _KERNEL
1440 
1441 /*
1442  * DTrace Provider API
1443  *
1444  * The following functions are implemented by the DTrace framework and are
1445  * used to implement separate in-kernel DTrace providers.  Common functions
1446  * are provided in uts/common/os/dtrace.c.  ISA-dependent subroutines are
1447  * defined in uts/<isa>/dtrace/dtrace_asm.s or uts/<isa>/dtrace/dtrace_isa.c.
1448  *
1449  * The provider API has two halves:  the API that the providers consume from
1450  * DTrace, and the API that providers make available to DTrace.
1451  *
1452  * 1 Framework-to-Provider API
1453  *
1454  * 1.1  Overview
1455  *
1456  * The Framework-to-Provider API is represented by the dtrace_pops structure
1457  * that the provider passes to the framework when registering itself.  This
1458  * structure consists of the following members:
1459  *
1460  *   dtps_provide()          <-- Provide all probes, all modules
1461  *   dtps_provide_module()   <-- Provide all probes in specified module
1462  *   dtps_enable()           <-- Enable specified probe
1463  *   dtps_disable()          <-- Disable specified probe
1464  *   dtps_suspend()          <-- Suspend specified probe
1465  *   dtps_resume()           <-- Resume specified probe
1466  *   dtps_getargdesc()       <-- Get the argument description for args[X]
1467  *   dtps_getargval()        <-- Get the value for an argX or args[X] variable
1468  *   dtps_usermode()         <-- Find out if the probe was fired in user mode
1469  *   dtps_destroy()          <-- Destroy all state associated with this probe
1470  *
1471  * 1.2  void dtps_provide(void *arg, const dtrace_probedesc_t *spec)
1472  *
1473  * 1.2.1  Overview
1474  *
1475  *   Called to indicate that the provider should provide all probes.  If the
1476  *   specified description is non-NULL, dtps_provide() is being called because
1477  *   no probe matched a specified probe -- if the provider has the ability to
1478  *   create custom probes, it may wish to create a probe that matches the
1479  *   specified description.
1480  *
1481  * 1.2.2  Arguments and notes
1482  *
1483  *   The first argument is the cookie as passed to dtrace_register().  The
1484  *   second argument is a pointer to a probe description that the provider may
1485  *   wish to consider when creating custom probes.  The provider is expected to
1486  *   call back into the DTrace framework via dtrace_probe_create() to create
1487  *   any necessary probes.  dtps_provide() may be called even if the provider
1488  *   has made available all probes; the provider should check the return value
1489  *   of dtrace_probe_create() to handle this case.  Note that the provider need
1490  *   not implement both dtps_provide() and dtps_provide_module(); see
1491  *   "Arguments and Notes" for dtrace_register(), below.
1492  *
1493  * 1.2.3  Return value
1494  *
1495  *   None.
1496  *
1497  * 1.2.4  Caller's context
1498  *
1499  *   dtps_provide() is typically called from open() or ioctl() context, but may
1500  *   be called from other contexts as well.  The DTrace framework is locked in
1501  *   such a way that providers may not register or unregister.  This means that
1502  *   the provider may not call any DTrace API that affects its registration with
1503  *   the framework, including dtrace_register(), dtrace_unregister(),
1504  *   dtrace_invalidate(), and dtrace_condense().  However, the context is such
1505  *   that the provider may (and indeed, is expected to) call probe-related
1506  *   DTrace routines, including dtrace_probe_create(), dtrace_probe_lookup(),
1507  *   and dtrace_probe_arg().
1508  *
1509  * 1.3  void dtps_provide_module(void *arg, dtrace_modctl_t *mp)
1510  *
1511  * 1.3.1  Overview
1512  *
1513  *   Called to indicate that the provider should provide all probes in the
1514  *   specified module.
1515  *
1516  * 1.3.2  Arguments and notes
1517  *
1518  *   The first argument is the cookie as passed to dtrace_register().  The
1519  *   second argument is a pointer to a modctl structure that indicates the
1520  *   module for which probes should be created.
1521  *
1522  * 1.3.3  Return value
1523  *
1524  *   None.
1525  *
1526  * 1.3.4  Caller's context
1527  *
1528  *   dtps_provide_module() may be called from open() or ioctl() context, but
1529  *   may also be called from a module loading context.  mod_lock is held, and
1530  *   the DTrace framework is locked in such a way that providers may not
1531  *   register or unregister.  This means that the provider may not call any
1532  *   DTrace API that affects its registration with the framework, including
1533  *   dtrace_register(), dtrace_unregister(), dtrace_invalidate(), and
1534  *   dtrace_condense().  However, the context is such that the provider may (and
1535  *   indeed, is expected to) call probe-related DTrace routines, including
1536  *   dtrace_probe_create(), dtrace_probe_lookup(), and dtrace_probe_arg().  Note
1537  *   that the provider need not implement both dtps_provide() and
1538  *   dtps_provide_module(); see "Arguments and Notes" for dtrace_register(),
1539  *   below.
1540  *
1541  * 1.4  void dtps_enable(void *arg, dtrace_id_t id, void *parg)
1542  *
1543  * 1.4.1  Overview
1544  *
1545  *   Called to enable the specified probe.
1546  *
1547  * 1.4.2  Arguments and notes
1548  *
1549  *   The first argument is the cookie as passed to dtrace_register().  The
1550  *   second argument is the identifier of the probe to be enabled.  The third
1551  *   argument is the probe argument as passed to dtrace_probe_create().
1552  *   dtps_enable() will be called when a probe transitions from not being
1553  *   enabled at all to having one or more ECBs.  The number of ECBs associated
1554  *   with the probe may change without subsequent calls into the provider.
1555  *   When the number of ECBs drops to zero, the provider will be explicitly
1556  *   told to disable the probe via dtps_disable().  dtrace_probe() should never
1557  *   be called for a probe identifier that hasn't been explicitly enabled via
1558  *   dtps_enable().
1559  *
1560  * 1.4.3  Return value
1561  *
1562  *   None.
1563  *
1564  * 1.4.4  Caller's context
1565  *
1566  *   The DTrace framework is locked in such a way that it may not be called
1567  *   back into at all.  cpu_lock is held.  mod_lock is not held and may not
1568  *   be acquired.
1569  *
1570  * 1.5  void dtps_disable(void *arg, dtrace_id_t id, void *parg)
1571  *
1572  * 1.5.1  Overview
1573  *
1574  *   Called to disable the specified probe.
1575  *
1576  * 1.5.2  Arguments and notes
1577  *
1578  *   The first argument is the cookie as passed to dtrace_register().  The
1579  *   second argument is the identifier of the probe to be disabled.  The third
1580  *   argument is the probe argument as passed to dtrace_probe_create().
1581  *   dtps_disable() will be called when a probe transitions from being enabled
1582  *   to having zero ECBs.  dtrace_probe() should never be called for a probe
1583  *   identifier that has been explicitly disabled via dtps_disable().
1584  *
1585  * 1.5.3  Return value
1586  *
1587  *   None.
1588  *
1589  * 1.5.4  Caller's context
1590  *
1591  *   The DTrace framework is locked in such a way that it may not be called
1592  *   back into at all.  cpu_lock is held.  mod_lock is not held and may not
1593  *   be acquired.
1594  *
1595  * 1.6  void dtps_suspend(void *arg, dtrace_id_t id, void *parg)
1596  *
1597  * 1.6.1  Overview
1598  *
1599  *   Called to suspend the specified enabled probe.  This entry point is for
1600  *   providers that may need to suspend some or all of their probes when CPUs
1601  *   are being powered on or when the boot monitor is being entered for a
1602  *   prolonged period of time.
1603  *
1604  * 1.6.2  Arguments and notes
1605  *
1606  *   The first argument is the cookie as passed to dtrace_register().  The
1607  *   second argument is the identifier of the probe to be suspended.  The
1608  *   third argument is the probe argument as passed to dtrace_probe_create().
1609  *   dtps_suspend will only be called on an enabled probe.  Providers that
1610  *   provide a dtps_suspend entry point will want to take roughly the action
1611  *   that they take for dtps_disable.
1612  *
1613  * 1.6.3  Return value
1614  *
1615  *   None.
1616  *
1617  * 1.6.4  Caller's context
1618  *
1619  *   Interrupts are disabled.  The DTrace framework is in a state such that the
1620  *   specified probe cannot be disabled or destroyed for the duration of
1621  *   dtps_suspend().  As interrupts are disabled, the provider is afforded
1622  *   little latitude; the provider is expected to do no more than a store to
1623  *   memory.
1624  *
1625  * 1.7  void dtps_resume(void *arg, dtrace_id_t id, void *parg)
1626  *
1627  * 1.7.1  Overview
1628  *
1629  *   Called to resume the specified enabled probe.  This entry point is for
1630  *   providers that may need to resume some or all of their probes after the
1631  *   completion of an event that induced a call to dtps_suspend().
1632  *
1633  * 1.7.2  Arguments and notes
1634  *
1635  *   The first argument is the cookie as passed to dtrace_register().  The
1636  *   second argument is the identifier of the probe to be resumed.  The
1637  *   third argument is the probe argument as passed to dtrace_probe_create().
1638  *   dtps_resume will only be called on an enabled probe.  Providers that
1639  *   provide a dtps_resume entry point will want to take roughly the action
1640  *   that they take for dtps_enable.
1641  *
1642  * 1.7.3  Return value
1643  *
1644  *   None.
1645  *
1646  * 1.7.4  Caller's context
1647  *
1648  *   Interrupts are disabled.  The DTrace framework is in a state such that the
1649  *   specified probe cannot be disabled or destroyed for the duration of
1650  *   dtps_resume().  As interrupts are disabled, the provider is afforded
1651  *   little latitude; the provider is expected to do no more than a store to
1652  *   memory.
1653  *
1654  * 1.8  void dtps_getargdesc(void *arg, dtrace_id_t id, void *parg,
1655  *           dtrace_argdesc_t *desc)
1656  *
1657  * 1.8.1  Overview
1658  *
1659  *   Called to retrieve the argument description for an args[X] variable.
1660  *
1661  * 1.8.2  Arguments and notes
1662  *
1663  *   The first argument is the cookie as passed to dtrace_register(). The
1664  *   second argument is the identifier of the current probe. The third
1665  *   argument is the probe argument as passed to dtrace_probe_create(). The
1666  *   fourth argument is a pointer to the argument description.  This
1667  *   description is both an input and output parameter:  it contains the
1668  *   index of the desired argument in the dtargd_ndx field, and expects
1669  *   the other fields to be filled in upon return.  If there is no argument
1670  *   corresponding to the specified index, the dtargd_ndx field should be set
1671  *   to DTRACE_ARGNONE.
1672  *
1673  * 1.8.3  Return value
1674  *
1675  *   None.  The dtargd_ndx, dtargd_native, dtargd_xlate and dtargd_mapping
1676  *   members of the dtrace_argdesc_t structure are all output values.
1677  *
1678  * 1.8.4  Caller's context
1679  *
1680  *   dtps_getargdesc() is called from ioctl() context. mod_lock is held, and
1681  *   the DTrace framework is locked in such a way that providers may not
1682  *   register or unregister.  This means that the provider may not call any
1683  *   DTrace API that affects its registration with the framework, including
1684  *   dtrace_register(), dtrace_unregister(), dtrace_invalidate(), and
1685  *   dtrace_condense().
1686  *
1687  * 1.9  uint64_t dtps_getargval(void *arg, dtrace_id_t id, void *parg,
1688  *               int argno, int aframes)
1689  *
1690  * 1.9.1  Overview
1691  *
1692  *   Called to retrieve a value for an argX or args[X] variable.
1693  *
1694  * 1.9.2  Arguments and notes
1695  *
1696  *   The first argument is the cookie as passed to dtrace_register(). The
1697  *   second argument is the identifier of the current probe. The third
1698  *   argument is the probe argument as passed to dtrace_probe_create(). The
1699  *   fourth argument is the number of the argument (the X in the example in
1700  *   1.9.1). The fifth argument is the number of stack frames that were used
1701  *   to get from the actual place in the code that fired the probe to
1702  *   dtrace_probe() itself, the so-called artificial frames. This argument may
1703  *   be used to descend an appropriate number of frames to find the correct
1704  *   values. If this entry point is left NULL, the dtrace_getarg() built-in
1705  *   function is used.
1706  *
1707  * 1.9.3  Return value
1708  *
1709  *   The value of the argument.
1710  *
1711  * 1.9.4  Caller's context
1712  *
1713  *   This is called from within dtrace_probe() meaning that interrupts
1714  *   are disabled. No locks should be taken within this entry point.
1715  *
1716  * 1.10  int dtps_usermode(void *arg, dtrace_id_t id, void *parg)
1717  *
1718  * 1.10.1  Overview
1719  *
1720  *   Called to determine if the probe was fired in a user context.
1721  *
1722  * 1.10.2  Arguments and notes
1723  *
1724  *   The first argument is the cookie as passed to dtrace_register(). The
1725  *   second argument is the identifier of the current probe. The third
1726  *   argument is the probe argument as passed to dtrace_probe_create().  This
1727  *   entry point must not be left NULL for providers whose probes allow for
1728  *   mixed mode tracing, that is to say those probes that can fire during
1729  *   kernel- _or_ user-mode execution.
1730  *
1731  * 1.10.3  Return value
1732  *
1733  *   A bitwise OR that encapsulates both the mode (either DTRACE_MODE_KERNEL
1734  *   or DTRACE_MODE_USER) and the policy when the privilege of the enabling
1735  *   is insufficient for that mode (a combination of DTRACE_MODE_NOPRIV_DROP,
1736  *   DTRACE_MODE_NOPRIV_RESTRICT, and DTRACE_MODE_LIMITEDPRIV_RESTRICT).  If
1737  *   DTRACE_MODE_NOPRIV_DROP bit is set, insufficient privilege will result
1738  *   in the probe firing being silently ignored for the enabling; if the
1739  *   DTRACE_MODE_NOPRIV_RESTRICT bit is set, insufficient privilege will not
1740  *   prevent probe processing for the enabling, but restrictions will be in
1741  *   place that induce a UPRIV fault upon attempt to examine probe arguments
1742  *   or current process state.  If the DTRACE_MODE_LIMITEDPRIV_RESTRICT bit
1743  *   is set, similar restrictions will be placed upon operation if the
1744  *   privilege is sufficient to process the enabling, but does not otherwise
1745  *   entitle the enabling to all zones.  The DTRACE_MODE_NOPRIV_DROP and
1746  *   DTRACE_MODE_NOPRIV_RESTRICT are mutually exclusive (and one of these
1747  *   two policies must be specified), but either may be combined (or not)
1748  *   with DTRACE_MODE_LIMITEDPRIV_RESTRICT.
1749  *
1750  * 1.10.4  Caller's context
1751  *
1752  *   This is called from within dtrace_probe() meaning that interrupts
1753  *   are disabled. No locks should be taken within this entry point.
1754  *
1755  * 1.11 void dtps_destroy(void *arg, dtrace_id_t id, void *parg)
1756  *
1757  * 1.11.1 Overview
1758  *
1759  *   Called to destroy the specified probe.
1760  *
1761  * 1.11.2 Arguments and notes
1762  *
1763  *   The first argument is the cookie as passed to dtrace_register().  The
1764  *   second argument is the identifier of the probe to be destroyed.  The third
1765  *   argument is the probe argument as passed to dtrace_probe_create().  The
1766  *   provider should free all state associated with the probe.  The framework
1767  *   guarantees that dtps_destroy() is only called for probes that have either
1768  *   been disabled via dtps_disable() or were never enabled via dtps_enable().
1769  *   Once dtps_destroy() has been called for a probe, no further call will be
1770  *   made specifying the probe.
1771  *
1772  * 1.11.3 Return value
1773  *
1774  *   None.
1775  *
1776  * 1.11.4 Caller's context
1777  *
1778  *   The DTrace framework is locked in such a way that it may not be called
1779  *   back into at all.  mod_lock is held.  cpu_lock is not held, and may not be
1780  *   acquired.
1781  *
1782  *
1783  * 2 Provider-to-Framework API
1784  *
1785  * 2.1  Overview
1786  *
1787  * The Provider-to-Framework API provides the mechanism for the provider to
1788  * register itself with the DTrace framework, to create probes, to lookup
1789  * probes and (most importantly) to fire probes.  The Provider-to-Framework
1790  * API consists of:
1791  *
1792  *   dtrace_register()       <-- Register a provider with the DTrace framework
1793  *   dtrace_unregister()     <-- Remove a provider's DTrace registration
1794  *   dtrace_invalidate()     <-- Invalidate the specified provider
1795  *   dtrace_condense()       <-- Remove a provider's unenabled probes
1796  *   dtrace_attached()       <-- Indicates whether or not DTrace has attached
1797  *   dtrace_probe_create()   <-- Create a DTrace probe
1798  *   dtrace_probe_lookup()   <-- Lookup a DTrace probe based on its name
1799  *   dtrace_probe_arg()      <-- Return the probe argument for a specific probe
1800  *   dtrace_probe()          <-- Fire the specified probe
1801  *
1802  * 2.2  int dtrace_register(const char *name, const dtrace_pattr_t *pap,
1803  *          uint32_t priv, cred_t *cr, const dtrace_pops_t *pops, void *arg,
1804  *          dtrace_provider_id_t *idp)
1805  *
1806  * 2.2.1  Overview
1807  *
1808  *   dtrace_register() registers the calling provider with the DTrace
1809  *   framework.  It should generally be called by DTrace providers in their
1810  *   attach(9E) entry point.
1811  *
1812  * 2.2.2  Arguments and Notes
1813  *
1814  *   The first argument is the name of the provider.  The second argument is a
1815  *   pointer to the stability attributes for the provider.  The third argument
1816  *   is the privilege flags for the provider, and must be some combination of:
1817  *
1818  *     DTRACE_PRIV_NONE     <= All users may enable probes from this provider
1819  *
1820  *     DTRACE_PRIV_PROC     <= Any user with privilege of PRIV_DTRACE_PROC may
1821  *                             enable probes from this provider
1822  *
1823  *     DTRACE_PRIV_USER     <= Any user with privilege of PRIV_DTRACE_USER may
1824  *                             enable probes from this provider
1825  *
1826  *     DTRACE_PRIV_KERNEL   <= Any user with privilege of PRIV_DTRACE_KERNEL
1827  *                             may enable probes from this provider
1828  *
1829  *     DTRACE_PRIV_OWNER    <= This flag places an additional constraint on
1830  *                             the privilege requirements above. These probes
1831  *                             require either (a) a user ID matching the user
1832  *                             ID of the cred passed in the fourth argument
1833  *                             or (b) the PRIV_PROC_OWNER privilege.
1834  *
1835  *     DTRACE_PRIV_ZONEOWNER<= This flag places an additional constraint on
1836  *                             the privilege requirements above. These probes
1837  *                             require either (a) a zone ID matching the zone
1838  *                             ID of the cred passed in the fourth argument
1839  *                             or (b) the PRIV_PROC_ZONE privilege.
1840  *
1841  *   Note that these flags designate the _visibility_ of the probes, not
1842  *   the conditions under which they may or may not fire.
1843  *
1844  *   The fourth argument is the credential that is associated with the
1845  *   provider.  This argument should be NULL if the privilege flags don't
1846  *   include DTRACE_PRIV_OWNER or DTRACE_PRIV_ZONEOWNER.  If non-NULL, the
1847  *   framework stashes the uid and zoneid represented by this credential
1848  *   for use at probe-time, in implicit predicates.  These limit visibility
1849  *   of the probes to users and/or zones which have sufficient privilege to
1850  *   access them.
1851  *
1852  *   The fifth argument is a DTrace provider operations vector, which provides
1853  *   the implementation for the Framework-to-Provider API.  (See Section 1,
1854  *   above.)  This must be non-NULL, and each member must be non-NULL.  The
1855  *   exceptions to this are (1) the dtps_provide() and dtps_provide_module()
1856  *   members (if the provider so desires, _one_ of these members may be left
1857  *   NULL -- denoting that the provider only implements the other) and (2)
1858  *   the dtps_suspend() and dtps_resume() members, which must either both be
1859  *   NULL or both be non-NULL.
1860  *
1861  *   The sixth argument is a cookie to be specified as the first argument for
1862  *   each function in the Framework-to-Provider API.  This argument may have
1863  *   any value.
1864  *
1865  *   The final argument is a pointer to dtrace_provider_id_t.  If
1866  *   dtrace_register() successfully completes, the provider identifier will be
1867  *   stored in the memory pointed to by this argument.  This argument must be
1868  *   non-NULL.
1869  *
1870  * 2.2.3  Return value
1871  *
1872  *   On success, dtrace_register() returns 0 and stores the new provider's
1873  *   identifier into the memory pointed to by the idp argument.  On failure,
1874  *   dtrace_register() returns an errno:
1875  *
1876  *     EINVAL   The arguments passed to dtrace_register() were somehow invalid.
1877  *              This may be because a parameter that must be non-NULL was NULL,
1878  *              because the name was invalid (either empty or an illegal
1879  *              provider name) or because the attributes were invalid.
1880  *
1881  *   No other failure code is returned.
1882  *
1883  * 2.2.4  Caller's context
1884  *
1885  *   dtrace_register() may induce calls to dtrace_provide(); the provider must
1886  *   hold no locks across dtrace_register() that may also be acquired by
1887  *   dtrace_provide().  cpu_lock and mod_lock must not be held.
1888  *
1889  * 2.3  int dtrace_unregister(dtrace_provider_id_t id)
1890  *
1891  * 2.3.1  Overview
1892  *
1893  *   Unregisters the specified provider from the DTrace framework.  It should
1894  *   generally be called by DTrace providers in their detach(9E) entry point.
1895  *
1896  * 2.3.2  Arguments and Notes
1897  *
1898  *   The only argument is the provider identifier, as returned from a
1899  *   successful call to dtrace_register().  As a result of calling
1900  *   dtrace_unregister(), the DTrace framework will call back into the provider
1901  *   via the dtps_destroy() entry point.  Once dtrace_unregister() successfully
1902  *   completes, however, the DTrace framework will no longer make calls through
1903  *   the Framework-to-Provider API.
1904  *
1905  * 2.3.3  Return value
1906  *
1907  *   On success, dtrace_unregister returns 0.  On failure, dtrace_unregister()
1908  *   returns an errno:
1909  *
1910  *     EBUSY    There are currently processes that have the DTrace pseudodevice
1911  *              open, or there exists an anonymous enabling that hasn't yet
1912  *              been claimed.
1913  *
1914  *   No other failure code is returned.
1915  *
1916  * 2.3.4  Caller's context
1917  *
1918  *   Because a call to dtrace_unregister() may induce calls through the
1919  *   Framework-to-Provider API, the caller may not hold any lock across
1920  *   dtrace_unregister() that is also acquired in any of the Framework-to-
1921  *   Provider API functions.  Additionally, mod_lock may not be held.
1922  *
1923  * 2.4  void dtrace_invalidate(dtrace_provider_id_t id)
1924  *
1925  * 2.4.1  Overview
1926  *
1927  *   Invalidates the specified provider.  All subsequent probe lookups for the
1928  *   specified provider will fail, but its probes will not be removed.
1929  *
1930  * 2.4.2  Arguments and Notes
1931  *
1932  *   The only argument is the provider identifier, as returned from a
1933  *   successful call to dtrace_register().  In general, a provider's probes
1934  *   always remain valid; dtrace_invalidate() is a mechanism for invalidating
1935  *   an entire provider, regardless of whether or not its probes are enabled.
1936  *   Note that dtrace_invalidate() will _not_ prevent already enabled
1937  *   probes from firing -- it will merely prevent any new enablings of the
1938  *   provider's probes.
1939  *
1940  * 2.5 int dtrace_condense(dtrace_provider_id_t id)
1941  *
1942  * 2.5.1  Overview
1943  *
1944  *   Removes all the unenabled probes for the given provider. This function is
1945  *   not unlike dtrace_unregister(), except that it doesn't remove the
1946  *   provider -- just as many of its associated probes as it can.
1947  *
1948  * 2.5.2  Arguments and Notes
1949  *
1950  *   As with dtrace_unregister(), the sole argument is the provider identifier
1951  *   as returned from a successful call to dtrace_register().  As a result of
1952  *   calling dtrace_condense(), the DTrace framework will call back into the
1953  *   given provider's dtps_destroy() entry point for each of the provider's
1954  *   unenabled probes.
1955  *
1956  * 2.5.3  Return value
1957  *
1958  *   Currently, dtrace_condense() always returns 0.  However, consumers of this
1959  *   function should check the return value as appropriate; its behavior may
1960  *   change in the future.
1961  *
1962  * 2.5.4  Caller's context
1963  *
1964  *   As with dtrace_unregister(), the caller may not hold any lock across
1965  *   dtrace_condense() that is also acquired in the provider's entry points.
1966  *   Also, mod_lock may not be held.
1967  *
1968  * 2.6 int dtrace_attached()
1969  *
1970  * 2.6.1  Overview
1971  *
1972  *   Indicates whether or not DTrace has attached.
1973  *
1974  * 2.6.2  Arguments and Notes
1975  *
1976  *   For most providers, DTrace makes initial contact beyond registration.
1977  *   That is, once a provider has registered with DTrace, it waits to hear
1978  *   from DTrace to create probes.  However, some providers may wish to
1979  *   proactively create probes without first being told by DTrace to do so.
1980  *   If providers wish to do this, they must first call dtrace_attached() to
1981  *   determine if DTrace itself has attached.  If dtrace_attached() returns 0,
1982  *   the provider must not make any other Provider-to-Framework API call.
1983  *
1984  * 2.6.3  Return value
1985  *
1986  *   dtrace_attached() returns 1 if DTrace has attached, 0 otherwise.
1987  *
 * 2.7  dtrace_id_t dtrace_probe_create(dtrace_provider_t id, const char *mod,
1989  *	    const char *func, const char *name, int aframes, void *arg)
1990  *
1991  * 2.7.1  Overview
1992  *
1993  *   Creates a probe with specified module name, function name, and name.
1994  *
1995  * 2.7.2  Arguments and Notes
1996  *
1997  *   The first argument is the provider identifier, as returned from a
1998  *   successful call to dtrace_register().  The second, third, and fourth
1999  *   arguments are the module name, function name, and probe name,
2000  *   respectively.  Of these, module name and function name may both be NULL
2001  *   (in which case the probe is considered to be unanchored), or they may both
2002  *   be non-NULL.  The name must be non-NULL, and must point to a non-empty
2003  *   string.
2004  *
2005  *   The fifth argument is the number of artificial stack frames that will be
2006  *   found on the stack when dtrace_probe() is called for the new probe.  These
 *   artificial frames will automatically be pruned should the stack() or
2008  *   stackdepth() functions be called as part of one of the probe's ECBs.  If
 *   the provider doesn't add an artificial frame, this parameter should be
2010  *   zero.
2011  *
2012  *   The final argument is a probe argument that will be passed back to the
2013  *   provider when a probe-specific operation is called.  (e.g., via
2014  *   dtps_enable(), dtps_disable(), etc.)
2015  *
2016  *   Note that it is up to the provider to be sure that the probe that it
2017  *   creates does not already exist -- if the provider is unsure of the probe's
2018  *   existence, it should assure its absence with dtrace_probe_lookup() before
2019  *   calling dtrace_probe_create().
2020  *
2021  * 2.7.3  Return value
2022  *
2023  *   dtrace_probe_create() always succeeds, and always returns the identifier
2024  *   of the newly-created probe.
2025  *
2026  * 2.7.4  Caller's context
2027  *
2028  *   While dtrace_probe_create() is generally expected to be called from
2029  *   dtps_provide() and/or dtps_provide_module(), it may be called from other
2030  *   non-DTrace contexts.  Neither cpu_lock nor mod_lock may be held.
2031  *
2032  * 2.8  dtrace_id_t dtrace_probe_lookup(dtrace_provider_t id, const char *mod,
2033  *	    const char *func, const char *name)
2034  *
2035  * 2.8.1  Overview
2036  *
 *   Looks up a probe based on provider and one or more of module name,
2038  *   function name and probe name.
2039  *
2040  * 2.8.2  Arguments and Notes
2041  *
2042  *   The first argument is the provider identifier, as returned from a
2043  *   successful call to dtrace_register().  The second, third, and fourth
2044  *   arguments are the module name, function name, and probe name,
2045  *   respectively.  Any of these may be NULL; dtrace_probe_lookup() will return
2046  *   the identifier of the first probe that is provided by the specified
2047  *   provider and matches all of the non-NULL matching criteria.
 *   dtrace_probe_lookup() is generally used by a provider to check the
2049  *   existence of a probe before creating it with dtrace_probe_create().
2050  *
2051  * 2.8.3  Return value
2052  *
2053  *   If the probe exists, returns its identifier.  If the probe does not exist,
2054  *   return DTRACE_IDNONE.
2055  *
2056  * 2.8.4  Caller's context
2057  *
2058  *   While dtrace_probe_lookup() is generally expected to be called from
2059  *   dtps_provide() and/or dtps_provide_module(), it may also be called from
2060  *   other non-DTrace contexts.  Neither cpu_lock nor mod_lock may be held.
2061  *
2062  * 2.9  void *dtrace_probe_arg(dtrace_provider_t id, dtrace_id_t probe)
2063  *
2064  * 2.9.1  Overview
2065  *
2066  *   Returns the probe argument associated with the specified probe.
2067  *
2068  * 2.9.2  Arguments and Notes
2069  *
2070  *   The first argument is the provider identifier, as returned from a
2071  *   successful call to dtrace_register().  The second argument is a probe
2072  *   identifier, as returned from dtrace_probe_lookup() or
2073  *   dtrace_probe_create().  This is useful if a probe has multiple
2074  *   provider-specific components to it:  the provider can create the probe
2075  *   once with provider-specific state, and then add to the state by looking
2076  *   up the probe based on probe identifier.
2077  *
2078  * 2.9.3  Return value
2079  *
2080  *   Returns the argument associated with the specified probe.  If the
2081  *   specified probe does not exist, or if the specified probe is not provided
2082  *   by the specified provider, NULL is returned.
2083  *
2084  * 2.9.4  Caller's context
2085  *
2086  *   While dtrace_probe_arg() is generally expected to be called from
2087  *   dtps_provide() and/or dtps_provide_module(), it may also be called from
2088  *   other non-DTrace contexts.  Neither cpu_lock nor mod_lock may be held.
2089  *
2090  * 2.10  void dtrace_probe(dtrace_id_t probe, uintptr_t arg0, uintptr_t arg1,
2091  *		uintptr_t arg2, uintptr_t arg3, uintptr_t arg4)
2092  *
2093  * 2.10.1  Overview
2094  *
 *   The epicenter of DTrace:  fires the specified probe with the specified
2096  *   arguments.
2097  *
2098  * 2.10.2  Arguments and Notes
2099  *
2100  *   The first argument is a probe identifier as returned by
2101  *   dtrace_probe_create() or dtrace_probe_lookup().  The second through sixth
2102  *   arguments are the values to which the D variables "arg0" through "arg4"
2103  *   will be mapped.
2104  *
2105  *   dtrace_probe() should be called whenever the specified probe has fired --
2106  *   however the provider defines it.
2107  *
2108  * 2.10.3  Return value
2109  *
2110  *   None.
2111  *
2112  * 2.10.4  Caller's context
2113  *
2114  *   dtrace_probe() may be called in virtually any context:  kernel, user,
2115  *   interrupt, high-level interrupt, with arbitrary adaptive locks held, with
2116  *   dispatcher locks held, with interrupts disabled, etc.  The only latitude
2117  *   that must be afforded to DTrace is the ability to make calls within
2118  *   itself (and to its in-kernel subroutines) and the ability to access
2119  *   arbitrary (but mapped) memory.  On some platforms, this constrains
2120  *   context.  For example, on UltraSPARC, dtrace_probe() cannot be called
2121  *   from any context in which TL is greater than zero.  dtrace_probe() may
2122  *   also not be called from any routine which may be called by dtrace_probe()
2123  *   -- which includes functions in the DTrace framework and some in-kernel
 *   DTrace subroutines.  All such functions are prefixed with "dtrace_";
 *   providers that instrument the kernel arbitrarily should be sure to not
 *   instrument these routines.
2127  */
2128 
2129 typedef dtrace_modctl_t *mymodctl_p;
2130 
2131 typedef struct dtrace_pops {
2132 	void (*dtps_provide)(void *arg, const dtrace_probedesc_t *spec);
2133 	void (*dtps_provide_module)(void *arg, dtrace_modctl_t *mp);
2134 	int (*dtps_enable)(void *arg, dtrace_id_t id, void *parg);
2135 	void (*dtps_disable)(void *arg, dtrace_id_t id, void *parg);
2136 	void (*dtps_suspend)(void *arg, dtrace_id_t id, void *parg);
2137 	void (*dtps_resume)(void *arg, dtrace_id_t id, void *parg);
2138 	void (*dtps_getargdesc)(void *arg, dtrace_id_t id, void *parg,
2139 	    dtrace_argdesc_t *desc);
2140 	uint64_t (*dtps_getargval)(void *arg, dtrace_id_t id, void *parg,
2141 	    int argno, int aframes);
2142 	int (*dtps_usermode)(void *arg, dtrace_id_t id, void *parg);
2143 	void (*dtps_destroy)(void *arg, dtrace_id_t id, void *parg);
2144 } dtrace_pops_t;
2145 
/*
 * DTRACE_MODE_* flag bits.  Each value is a distinct single bit, so the
 * flags can be OR-ed together.
 * NOTE(review): going by the names, the two low bits say whether a probe
 * fired in kernel or user mode and the 0x10-0x40 bits choose between
 * dropping and restricting a consumer that lacks (or has only limited)
 * privilege.  No user of these flags is visible in this part of the file;
 * confirm the exact semantics against the framework.
 */
#define	DTRACE_MODE_KERNEL			0x01
#define	DTRACE_MODE_USER			0x02
#define	DTRACE_MODE_NOPRIV_DROP			0x10
#define	DTRACE_MODE_NOPRIV_RESTRICT		0x20
#define	DTRACE_MODE_LIMITEDPRIV_RESTRICT	0x40
2151 
2152 typedef uintptr_t	dtrace_provider_id_t;
2153 
2154 extern int dtrace_register(const char *, const dtrace_pattr_t *, uint32_t,
2155     cred_t *, const dtrace_pops_t *, void *, dtrace_provider_id_t *);
2156 extern int dtrace_unregister(dtrace_provider_id_t);
2157 extern int dtrace_condense(dtrace_provider_id_t);
2158 extern void dtrace_invalidate(dtrace_provider_id_t);
2159 extern dtrace_id_t dtrace_probe_lookup(dtrace_provider_id_t, const char *,
2160     const char *, const char *);
2161 extern dtrace_id_t dtrace_probe_create(dtrace_provider_id_t, const char *,
2162     const char *, const char *, int, void *);
2163 extern void *dtrace_probe_arg(dtrace_provider_id_t, dtrace_id_t);
2164 extern void dtrace_probe(dtrace_id_t, uintptr_t arg0, uintptr_t arg1,
2165     uintptr_t arg2, uintptr_t arg3, uintptr_t arg4);
2166 
2167 /*
2168  * DTrace Meta Provider API
2169  *
2170  * The following functions are implemented by the DTrace framework and are
2171  * used to implement meta providers. Meta providers plug into the DTrace
2172  * framework and are used to instantiate new providers on the fly. At
2173  * present, there is only one type of meta provider and only one meta
2174  * provider may be registered with the DTrace framework at a time. The
2175  * sole meta provider type provides user-land static tracing facilities
2176  * by taking meta probe descriptions and adding a corresponding provider
2177  * into the DTrace framework.
2178  *
2179  * 1 Framework-to-Provider
2180  *
2181  * 1.1 Overview
2182  *
2183  * The Framework-to-Provider API is represented by the dtrace_mops structure
2184  * that the meta provider passes to the framework when registering itself as
2185  * a meta provider. This structure consists of the following members:
2186  *
2187  *   dtms_create_probe()	<-- Add a new probe to a created provider
2188  *   dtms_provide_pid()		<-- Create a new provider for a given process
2189  *   dtms_remove_pid()		<-- Remove a previously created provider
2190  *
2191  * 1.2  void dtms_create_probe(void *arg, void *parg,
2192  *           dtrace_helper_probedesc_t *probedesc);
2193  *
2194  * 1.2.1  Overview
2195  *
2196  *   Called by the DTrace framework to create a new probe in a provider
2197  *   created by this meta provider.
2198  *
2199  * 1.2.2  Arguments and notes
2200  *
2201  *   The first argument is the cookie as passed to dtrace_meta_register().
2202  *   The second argument is the provider cookie for the associated provider;
2203  *   this is obtained from the return value of dtms_provide_pid(). The third
2204  *   argument is the helper probe description.
2205  *
2206  * 1.2.3  Return value
2207  *
2208  *   None
2209  *
2210  * 1.2.4  Caller's context
2211  *
2212  *   dtms_create_probe() is called from either ioctl() or module load context.
2213  *   The DTrace framework is locked in such a way that meta providers may not
2214  *   register or unregister. This means that the meta provider cannot call
2215  *   dtrace_meta_register() or dtrace_meta_unregister(). However, the context is
2216  *   such that the provider may (and is expected to) call provider-related
2217  *   DTrace provider APIs including dtrace_probe_create().
2218  *
 * 1.3  void *dtms_provide_pid(void *arg, dtrace_helper_provdesc_t *mprov,
2220  *	      pid_t pid)
2221  *
2222  * 1.3.1  Overview
2223  *
2224  *   Called by the DTrace framework to instantiate a new provider given the
2225  *   description of the provider and probes in the mprov argument. The
2226  *   meta provider should call dtrace_register() to insert the new provider
2227  *   into the DTrace framework.
2228  *
2229  * 1.3.2  Arguments and notes
2230  *
2231  *   The first argument is the cookie as passed to dtrace_meta_register().
2232  *   The second argument is a pointer to a structure describing the new
 *   helper provider. The third argument is the process identifier for the
 *   process associated with this new provider. Note that the name of the
 *   provider as passed to dtrace_register() should be the concatenation of
 *   the dthpv_provname member of the mprov argument and the process
 *   identifier as a string.
2238  *
2239  * 1.3.3  Return value
2240  *
2241  *   The cookie for the provider that the meta provider creates. This is
2242  *   the same value that it passed to dtrace_register().
2243  *
2244  * 1.3.4  Caller's context
2245  *
2246  *   dtms_provide_pid() is called from either ioctl() or module load context.
2247  *   The DTrace framework is locked in such a way that meta providers may not
2248  *   register or unregister. This means that the meta provider cannot call
2249  *   dtrace_meta_register() or dtrace_meta_unregister(). However, the context
2250  *   is such that the provider may -- and is expected to --  call
2251  *   provider-related DTrace provider APIs including dtrace_register().
2252  *
 * 1.4  void dtms_remove_pid(void *arg, dtrace_helper_provdesc_t *mprov,
2254  *	     pid_t pid)
2255  *
2256  * 1.4.1  Overview
2257  *
2258  *   Called by the DTrace framework to remove a provider that had previously
2259  *   been instantiated via the dtms_provide_pid() entry point. The meta
2260  *   provider need not remove the provider immediately, but this entry
2261  *   point indicates that the provider should be removed as soon as possible
2262  *   using the dtrace_unregister() API.
2263  *
2264  * 1.4.2  Arguments and notes
2265  *
2266  *   The first argument is the cookie as passed to dtrace_meta_register().
2267  *   The second argument is a pointer to a structure describing the helper
 *   provider. The third argument is the process identifier for the process
 *   associated with this provider.
2270  *
2271  * 1.4.3  Return value
2272  *
2273  *   None
2274  *
2275  * 1.4.4  Caller's context
2276  *
2277  *   dtms_remove_pid() is called from either ioctl() or exit() context.
2278  *   The DTrace framework is locked in such a way that meta providers may not
2279  *   register or unregister. This means that the meta provider cannot call
2280  *   dtrace_meta_register() or dtrace_meta_unregister(). However, the context
2281  *   is such that the provider may -- and is expected to -- call
2282  *   provider-related DTrace provider APIs including dtrace_unregister().
2283  */
/*
 * Description of a single helper probe, as handed to a meta provider's
 * dtms_create_probe() entry point.
 */
typedef struct dtrace_helper_probedesc {
	/* Probe name components. */
	char		*dthpb_mod;	/* probe module */
	char		*dthpb_func;	/* probe function */
	char		*dthpb_name;	/* probe name */

	/* Base address and the two offset arrays with their lengths. */
	uint64_t	dthpb_base;	/* base address */
	uint32_t	*dthpb_offs;	/* offsets array */
	uint32_t	*dthpb_enoffs;	/* is-enabled offsets array */
	uint32_t	dthpb_noffs;	/* number of entries in dthpb_offs */
	uint32_t	dthpb_nenoffs;	/* number of entries in dthpb_enoffs */

	/* Argument description. */
	uint8_t		*dthpb_args;	/* argument mapping array */
	uint8_t		dthpb_xargc;	/* translated argument count */
	uint8_t		dthpb_nargc;	/* native argument count */
	char		*dthpb_xtypes;	/* translated types strings */
	char		*dthpb_ntypes;	/* native types strings */
} dtrace_helper_probedesc_t;
2299 
2300 typedef struct dtrace_helper_provdesc {
2301 	char *dthpv_provname;			/* provider name */
2302 	dtrace_pattr_t dthpv_pattr;		/* stability attributes */
2303 } dtrace_helper_provdesc_t;
2304 
2305 typedef struct dtrace_mops {
2306 	void (*dtms_create_probe)(void *, void *, dtrace_helper_probedesc_t *);
2307 	void *(*dtms_provide_pid)(void *, dtrace_helper_provdesc_t *, pid_t);
2308 	void (*dtms_remove_pid)(void *, dtrace_helper_provdesc_t *, pid_t);
2309 } dtrace_mops_t;
2310 
2311 typedef uintptr_t	dtrace_meta_provider_id_t;
2312 
2313 extern int dtrace_meta_register(const char *, const dtrace_mops_t *, void *,
2314     dtrace_meta_provider_id_t *);
2315 extern int dtrace_meta_unregister(dtrace_meta_provider_id_t);
2316 
2317 /*
2318  * DTrace Kernel Hooks
2319  *
2320  * The following functions are implemented by the base kernel and form a set of
2321  * hooks used by the DTrace framework.  DTrace hooks are implemented in either
2322  * uts/common/os/dtrace_subr.c, an ISA-specific assembly file, or in a
2323  * uts/<platform>/os/dtrace_subr.c corresponding to each hardware platform.
2324  */
2325 
/*
 * Virtual-time accounting state.  The values form a two-bit mask: bit 0 is
 * set when DTrace virtual time is active and bit 1 when TNF is active.
 */
typedef enum dtrace_vtime_state {
	DTRACE_VTIME_INACTIVE		= 0,	/* neither DTrace nor TNF */
	DTRACE_VTIME_ACTIVE		= 1,	/* DTrace virtual time only */
	DTRACE_VTIME_INACTIVE_TNF	= 2,	/* TNF only */
	DTRACE_VTIME_ACTIVE_TNF		= 3	/* DTrace virtual time and TNF */
} dtrace_vtime_state_t;
2332 
2333 #ifdef illumos
2334 extern dtrace_vtime_state_t dtrace_vtime_active;
2335 #endif
2336 extern void dtrace_vtime_switch(kthread_t *next);
2337 extern void dtrace_vtime_enable_tnf(void);
2338 extern void dtrace_vtime_disable_tnf(void);
2339 extern void dtrace_vtime_enable(void);
2340 extern void dtrace_vtime_disable(void);
2341 
/*
 * Forward declarations: the register-state structures are only referenced
 * through pointers in this header.
 */
struct regs;
struct reg;

#ifdef illumos
/*
 * illumos-only hooks, all but the last exported as function pointers.
 * NOTE(review): going by the names these serve the fasttrap provider on
 * probe hit, return, fork, exec and exit -- confirm against the kernel
 * sources that set and call them.
 */
extern int (*dtrace_pid_probe_ptr)(struct reg *);
extern int (*dtrace_return_probe_ptr)(struct reg *);

extern void (*dtrace_fasttrap_fork_ptr)(proc_t *, proc_t *);
extern void (*dtrace_fasttrap_exec_ptr)(proc_t *);
extern void (*dtrace_fasttrap_exit_ptr)(proc_t *);

extern void dtrace_fasttrap_fork(proc_t *, proc_t *);
#endif
2353 
/*
 * Interrupt-state and memory-ordering primitives supplied by the base
 * kernel.  dtrace_interrupt_disable() returns a dtrace_icookie_t and
 * dtrace_interrupt_enable() takes one.
 * NOTE(review): presumably the cookie is the saved interrupt state to be
 * restored, and the membar pair orders stores and loads respectively --
 * confirm against the platform implementations.
 */
typedef uintptr_t dtrace_icookie_t;

extern dtrace_icookie_t dtrace_interrupt_disable(void);
extern void dtrace_interrupt_enable(dtrace_icookie_t cookie);

extern void dtrace_membar_producer(void);
extern void dtrace_membar_consumer(void);

/* Signature of the callback handed to dtrace_xcall(). */
typedef void (*dtrace_xcall_t)(void *);
2362 
2363 extern void (*dtrace_cpu_init)(processorid_t);
2364 #ifdef illumos
2365 extern void (*dtrace_modload)(dtrace_modctl_t *);
2366 extern void (*dtrace_modunload)(dtrace_modctl_t *);
2367 #endif
2368 extern void (*dtrace_helpers_cleanup)(void);
2369 extern void (*dtrace_helpers_fork)(proc_t *parent, proc_t *child);
2370 extern void (*dtrace_cpustart_init)(void);
2371 extern void (*dtrace_cpustart_fini)(void);
2372 extern void (*dtrace_closef)(void);
2373 
2374 extern void (*dtrace_debugger_init)(void);
2375 extern void (*dtrace_debugger_fini)(void);
2376 extern dtrace_cacheid_t dtrace_predcache_id;
2377 
2378 #ifdef illumos
2379 extern hrtime_t dtrace_gethrtime(void);
2380 #else
2381 void dtrace_debug_printf(const char *, ...) __printflike(1, 2);
2382 #endif
2383 extern void dtrace_sync(void);
2384 extern void dtrace_toxic_ranges(void (*)(uintptr_t, uintptr_t));
2385 extern void dtrace_xcall(processorid_t, dtrace_xcall_t, void *);
2386 extern void dtrace_vpanic(const char *, __va_list);
2387 extern void dtrace_panic(const char *, ...);
2388 
2389 extern int dtrace_safe_defer_signal(void);
2390 extern void dtrace_safe_synchronous_signal(void);
2391 
2392 extern int dtrace_mach_aframes(void);
2393 
2394 #if defined(__i386) || defined(__amd64)
2395 extern int dtrace_instr_size(uchar_t *instr);
2396 extern int dtrace_instr_size_isa(uchar_t *, model_t, int *);
2397 extern void dtrace_invop_callsite(void);
2398 #endif
2399 extern void dtrace_invop_add(int (*)(uintptr_t, uintptr_t *, uintptr_t));
2400 extern void dtrace_invop_remove(int (*)(uintptr_t, uintptr_t *, uintptr_t));
2401 
/*
 * SPARC-only hooks.
 * NOTE(review): the implementations are not visible here; see the SPARC
 * platform code for what each one does.
 */
#ifdef __sparc
extern int dtrace_blksuword32(uintptr_t addr, uint32_t *data, int tryagain);
extern void dtrace_getfsr(uint64_t *val);
#endif
2406 
2407 #ifndef illumos
2408 extern void dtrace_helpers_duplicate(proc_t *, proc_t *);
2409 extern void dtrace_helpers_destroy(proc_t *);
2410 #endif
2411 
/*
 * Test, set and clear bits in the cpuc_dtrace_flags member of the cpu_core[]
 * entry selected by cpu_number().  Each macro evaluates cpu_number() once;
 * SET and CLEAR are read-modify-write operations on that member.
 */
#define	DTRACE_CPUFLAG_ISSET(mask) \
	(cpu_core[cpu_number()].cpuc_dtrace_flags & (mask))

#define	DTRACE_CPUFLAG_SET(mask) \
	(cpu_core[cpu_number()].cpuc_dtrace_flags |= (mask))

#define	DTRACE_CPUFLAG_CLEAR(mask) \
	(cpu_core[cpu_number()].cpuc_dtrace_flags &= ~(mask))
2420 
2421 #endif /* _KERNEL */
2422 
2423 #endif	/* _ASM */
2424 
/*
 * Per-architecture DTRACE_INVOP_* codes and instruction-decoding constants.
 * The numbering is private to each architecture: DTRACE_INVOP_RET, for
 * example, is 5 on x86, 1 on PowerPC and 2 on AArch64.
 */
#if defined(__i386) || defined(__amd64)

#define	DTRACE_INVOP_PUSHL_EBP		1
#define	DTRACE_INVOP_POPL_EBP		2
#define	DTRACE_INVOP_LEAVE		3
#define	DTRACE_INVOP_NOP		4
#define	DTRACE_INVOP_RET		5

#elif defined(__powerpc__)

#define	DTRACE_INVOP_RET		1
#define	DTRACE_INVOP_BCTR		2
#define	DTRACE_INVOP_BLR		3
#define	DTRACE_INVOP_JUMP		4
#define	DTRACE_INVOP_MFLR_R0		5
#define	DTRACE_INVOP_NOP		6

#elif defined(__arm__)

/*
 * DTRACE_INVOP_MASK covers the low DTRACE_INVOP_SHIFT bits of a value and
 * DTRACE_INVOP_DATA() yields whatever lies above them.
 */
#define	DTRACE_INVOP_SHIFT	4
#define	DTRACE_INVOP_MASK	((1 << DTRACE_INVOP_SHIFT) - 1)
#define	DTRACE_INVOP_DATA(x)	((x) >> DTRACE_INVOP_SHIFT)

/*
 * NOTE(review): two code sets with overlapping values (1..3 and 1..11) are
 * defined for ARM; confirm which one each consumer expects.
 */
#define	DTRACE_INVOP_PUSHM		1
#define	DTRACE_INVOP_POPM		2
#define	DTRACE_INVOP_B			3

#define	DTRACE_INVOP_MOV_IP_SP		1
#define	DTRACE_INVOP_BX_LR		2
#define	DTRACE_INVOP_MOV_PC_LR		3
#define	DTRACE_INVOP_LDM		4
#define	DTRACE_INVOP_LDMIB		5
#define	DTRACE_INVOP_LDR_IMM		6
#define	DTRACE_INVOP_MOVW		7
#define	DTRACE_INVOP_MOV_IMM		8
#define	DTRACE_INVOP_CMP_IMM		9
#define	DTRACE_INVOP_B_LABEL		10
#define	DTRACE_INVOP_PUSH		11

#elif defined(__aarch64__)

#define	INSN_SIZE	4

/*
 * Unconditional branch (B).
 * NOTE(review): the A64 B encoding fixes only bits [31:26] and carries a
 * 26-bit immediate, whereas B_MASK and B_DATA_MASK cover 8 and 24 bits;
 * confirm that this narrower match is intended before relying on it.
 */
#define	B_MASK		0xff000000
#define	B_DATA_MASK	0x00ffffff
#define	B_INSTR		0x14000000

#define	RET_INSTR	0xd65f03c0

/* Load/store pair (LDP/STP) opcodes and field extraction. */
#define	LDP_STP_MASK	0xffc00000
#define	STP_32		0x29800000
#define	STP_64		0xa9800000
#define	LDP_32		0x28c00000
#define	LDP_64		0xa8c00000
#define	LDP_STP_PREIND	(1 << 24)
#define	LDP_STP_DIR	(1 << 22) /* Load instruction */
#define	ARG1_SHIFT	0
#define	ARG1_MASK	0x1f
#define	ARG2_SHIFT	10
#define	ARG2_MASK	0x1f
#define	OFFSET_SHIFT	15
#define	OFFSET_SIZE	7
#define	OFFSET_MASK	((1 << OFFSET_SIZE) - 1)

#define	DTRACE_INVOP_PUSHM	1
#define	DTRACE_INVOP_RET	2
#define	DTRACE_INVOP_B		3

#endif
2494 
2495 #ifdef	__cplusplus
2496 }
2497 #endif
2498 
2499 #endif	/* _SYS_DTRACE_H */
2500