1 /**************************************************************************
2  *
3  * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
4  * All Rights Reserved.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the
8  * "Software"), to deal in the Software without restriction, including
9  * without limitation the rights to use, copy, modify, merge, publish,
10  * distribute, sub license, and/or sell copies of the Software, and to
11  * permit persons to whom the Software is furnished to do so, subject to
12  * the following conditions:
13  *
14  * The above copyright notice and this permission notice (including the
15  * next paragraph) shall be included in all copies or substantial portions
16  * of the Software.
17  *
18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21  * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25  *
26  **************************************************************************/
27 
28 #ifndef _I915_REG_H_
29 #define _I915_REG_H_
30 
31 #define CMD_3D (3 << 29)
32 
33 #define I915_SET_FIELD( var, mask, value ) (var &= ~(mask), var |= value)
34 
35 #define PRIM3D			(CMD_3D | (0x1f<<24))
36 #define PRIM3D_INDIRECT_SEQUENTIAL      ((1<<23) | (0<<17))
37 #define PRIM3D_TRILIST		(PRIM3D | (0x0<<18))
38 #define PRIM3D_TRISTRIP		(PRIM3D | (0x1<<18))
39 #define PRIM3D_TRISTRIP_RVRSE	(PRIM3D | (0x2<<18))
40 #define PRIM3D_TRIFAN		(PRIM3D | (0x3<<18))
41 #define PRIM3D_POLY		(PRIM3D | (0x4<<18))
42 #define PRIM3D_LINELIST		(PRIM3D | (0x5<<18))
43 #define PRIM3D_LINESTRIP	(PRIM3D | (0x6<<18))
44 #define PRIM3D_RECTLIST		(PRIM3D | (0x7<<18))
45 #define PRIM3D_POINTLIST	(PRIM3D | (0x8<<18))
46 #define PRIM3D_DIB		(PRIM3D | (0x9<<18))
47 #define PRIM3D_CLEAR_RECT	(PRIM3D | (0xa<<18))
48 #define PRIM3D_ZONE_INIT	(PRIM3D | (0xd<<18))
49 #define PRIM3D_MASK		(0x1f<<18)
50 
51 
52 /* p137 */
53 #define _3DSTATE_AA_CMD			(CMD_3D | (0x06<<24))
54 #define AA_LINE_ECAAR_WIDTH_ENABLE	(1<<16)
55 #define AA_LINE_ECAAR_WIDTH_0_5		0
56 #define AA_LINE_ECAAR_WIDTH_1_0		(1<<14)
57 #define AA_LINE_ECAAR_WIDTH_2_0		(2<<14)
58 #define AA_LINE_ECAAR_WIDTH_4_0		(3<<14)
59 #define AA_LINE_REGION_WIDTH_ENABLE	(1<<8)
60 #define AA_LINE_REGION_WIDTH_0_5	0
61 #define AA_LINE_REGION_WIDTH_1_0	(1<<6)
62 #define AA_LINE_REGION_WIDTH_2_0	(2<<6)
63 #define AA_LINE_REGION_WIDTH_4_0	(3<<6)
64 
65 /* 3DSTATE_BACKFACE_STENCIL_OPS, p138*/
66 #define _3DSTATE_BACKFACE_STENCIL_OPS    (CMD_3D | (0x8<<24))
67 #define BFO_ENABLE_STENCIL_REF          (1<<23)
68 #define BFO_STENCIL_REF_SHIFT           15
69 #define BFO_STENCIL_REF_MASK            (0xff<<15)
70 #define BFO_ENABLE_STENCIL_FUNCS        (1<<14)
71 #define BFO_STENCIL_TEST_SHIFT          11
72 #define BFO_STENCIL_TEST_MASK           (0x7<<11)
73 #define BFO_STENCIL_FAIL_SHIFT          8
74 #define BFO_STENCIL_FAIL_MASK           (0x7<<8)
75 #define BFO_STENCIL_PASS_Z_FAIL_SHIFT   5
76 #define BFO_STENCIL_PASS_Z_FAIL_MASK    (0x7<<5)
77 #define BFO_STENCIL_PASS_Z_PASS_SHIFT   2
78 #define BFO_STENCIL_PASS_Z_PASS_MASK    (0x7<<2)
79 #define BFO_ENABLE_STENCIL_TWO_SIDE     (1<<1)
80 #define BFO_STENCIL_TWO_SIDE            (1<<0)
81 
82 /* 3DSTATE_BACKFACE_STENCIL_MASKS, p140 */
83 #define _3DSTATE_BACKFACE_STENCIL_MASKS    (CMD_3D | (0x9<<24))
84 #define BFM_ENABLE_STENCIL_TEST_MASK      (1<<17)
85 #define BFM_ENABLE_STENCIL_WRITE_MASK     (1<<16)
86 #define BFM_STENCIL_TEST_MASK_SHIFT       8
87 #define BFM_STENCIL_TEST_MASK_MASK        (0xff<<8)
88 #define BFM_STENCIL_WRITE_MASK_SHIFT      0
89 #define BFM_STENCIL_WRITE_MASK_MASK       (0xff<<0)
90 
91 /* 3DSTATE_BIN_CONTROL p141 */
92 
93 /* p143 */
94 #define _3DSTATE_BUF_INFO_CMD	(CMD_3D | (0x1d<<24) | (0x8e<<16) | 1)
95 /* Dword 1 */
96 #define BUF_3D_ID_COLOR_BACK	(0x3<<24)
97 #define BUF_3D_ID_DEPTH		(0x7<<24)
98 #define BUF_3D_USE_FENCE	(1<<23)
99 #define BUF_3D_TILED_SURFACE	(1<<22)
100 #define BUF_3D_TILE_WALK_X	0
101 #define BUF_3D_TILE_WALK_Y	(1<<21)
102 /* Dword 2 */
103 #define BUF_3D_ADDR(x)		((x) & ~0x3)
104 
105 /* 3DSTATE_CHROMA_KEY */
106 
107 /* 3DSTATE_CLEAR_PARAMETERS, p150 */
108 #define _3DSTATE_CLEAR_PARAMETERS   (CMD_3D | (0x1d<<24) | (0x9c<<16) | 5)
109 /* Dword 1 */
110 #define CLEARPARAM_CLEAR_RECT	    (1 << 16)
111 #define CLEARPARAM_ZONE_INIT	    (0 << 16)
112 #define CLEARPARAM_WRITE_COLOR	    (1 << 2)
113 #define CLEARPARAM_WRITE_DEPTH	    (1 << 1)
114 #define CLEARPARAM_WRITE_STENCIL    (1 << 0)
115 
116 /* 3DSTATE_CONSTANT_BLEND_COLOR, p153 */
117 #define _3DSTATE_CONST_BLEND_COLOR_CMD	(CMD_3D | (0x1d<<24) | (0x88<<16))
118 
119 /* 3DSTATE_COORD_SET_BINDINGS, p154 */
120 #define _3DSTATE_COORD_SET_BINDINGS      (CMD_3D | (0x16<<24))
121 #define CSB_TCB(iunit, eunit)           ((eunit)<<(iunit*3))
122 
123 /* p156 */
124 #define _3DSTATE_DFLT_DIFFUSE_CMD	(CMD_3D | (0x1d<<24) | (0x99<<16))
125 
126 /* p157 */
127 #define _3DSTATE_DFLT_SPEC_CMD		(CMD_3D | (0x1d<<24) | (0x9a<<16))
128 
129 /* p158 */
130 #define _3DSTATE_DFLT_Z_CMD		(CMD_3D | (0x1d<<24) | (0x98<<16))
131 
132 /* 3DSTATE_DEPTH_OFFSET_SCALE, p159 */
133 #define _3DSTATE_DEPTH_OFFSET_SCALE       (CMD_3D | (0x1d<<24) | (0x97<<16))
134 /* scale in dword 1 */
135 
136 /* The depth subrectangle is not supported, but must be disabled. */
137 /* 3DSTATE_DEPTH_SUBRECT_DISABLE, p160 */
138 #define _3DSTATE_DEPTH_SUBRECT_DISABLE	(CMD_3D | (0x1c<<24) | (0x11<<19) | (1 << 1) | (0 << 0))
139 
140 /* p161 */
141 #define _3DSTATE_DST_BUF_VARS_CMD	(CMD_3D | (0x1d<<24) | (0x85<<16))
142 /* Dword 1 */
143 #define TEX_DEFAULT_COLOR_OGL           (0<<30)
144 #define TEX_DEFAULT_COLOR_D3D           (1<<30)
145 #define ZR_EARLY_DEPTH                  (1<<29)
146 #define LOD_PRECLAMP_OGL                (1<<28)
147 #define LOD_PRECLAMP_D3D                (0<<28)
148 #define DITHER_FULL_ALWAYS              (0<<26)
149 #define DITHER_FULL_ON_FB_BLEND         (1<<26)
150 #define DITHER_CLAMPED_ALWAYS           (2<<26)
151 #define LINEAR_GAMMA_BLEND_32BPP        (1<<25)
152 #define DEBUG_DISABLE_ENH_DITHER        (1<<24)
153 #define DSTORG_HORT_BIAS(x)		((x)<<20)
154 #define DSTORG_VERT_BIAS(x)		((x)<<16)
155 #define COLOR_4_2_2_CHNL_WRT_ALL	0
156 #define COLOR_4_2_2_CHNL_WRT_Y		(1<<12)
157 #define COLOR_4_2_2_CHNL_WRT_CR		(2<<12)
158 #define COLOR_4_2_2_CHNL_WRT_CB		(3<<12)
159 #define COLOR_4_2_2_CHNL_WRT_CRCB	(4<<12)
160 #define COLR_BUF_8BIT			0
161 #define COLR_BUF_RGB555			(1<<8)
162 #define COLR_BUF_RGB565			(2<<8)
163 #define COLR_BUF_ARGB8888		(3<<8)
164 #define COLR_BUF_ARGB4444		(8<<8)
165 #define COLR_BUF_ARGB1555		(9<<8)
166 #define COLR_BUF_ARGB2AAA		(0xa<<8)
167 #define DEPTH_IS_Z			0
168 #define DEPTH_IS_W			(1<<6)
169 #define DEPTH_FRMT_16_FIXED		0
170 #define DEPTH_FRMT_16_FLOAT		(1<<2)
171 #define DEPTH_FRMT_24_FIXED_8_OTHER	(2<<2)
172 #define DEPTH_FRMT_24_FLOAT_8_OTHER	(3<<2)
173 #define VERT_LINE_STRIDE_1		(1<<1)
174 #define VERT_LINE_STRIDE_0		0
175 #define VERT_LINE_STRIDE_OFS_1		1
176 #define VERT_LINE_STRIDE_OFS_0		0
177 
178 /* p166 */
179 #define _3DSTATE_DRAW_RECT_CMD		(CMD_3D|(0x1d<<24)|(0x80<<16)|3)
180 /* Dword 1 */
181 #define DRAW_RECT_DIS_DEPTH_OFS		(1<<30)
182 #define DRAW_DITHER_OFS_X(x)		((x)<<26)
183 #define DRAW_DITHER_OFS_Y(x)		((x)<<24)
184 /* Dword 2 */
185 #define DRAW_YMIN(x)			((uint16_t)(x)<<16)
186 #define DRAW_XMIN(x)			((uint16_t)(x))
187 /* Dword 3 */
188 #define DRAW_YMAX(x)			((uint16_t)(x)<<16)
189 #define DRAW_XMAX(x)			((uint16_t)(x))
190 /* Dword 4 */
191 #define DRAW_YORG(x)			((uint16_t)(x)<<16)
192 #define DRAW_XORG(x)			((uint16_t)(x))
193 
194 /* 3DSTATE_FILTER_COEFFICIENTS_4X4, p170 */
195 
196 /* 3DSTATE_FILTER_COEFFICIENTS_6X5, p172 */
197 
198 /* _3DSTATE_FOG_COLOR, p173 */
199 #define _3DSTATE_FOG_COLOR_CMD		(CMD_3D|(0x15<<24))
200 #define FOG_COLOR_RED(x)		((x)<<16)
201 #define FOG_COLOR_GREEN(x)		((x)<<8)
202 #define FOG_COLOR_BLUE(x)		(x)
203 
204 /* _3DSTATE_FOG_MODE, p174 */
205 #define _3DSTATE_FOG_MODE_CMD		(CMD_3D|(0x1d<<24)|(0x89<<16)|2)
206 /* Dword 1 */
207 #define FMC1_FOGFUNC_MODIFY_ENABLE	(1<<31)
208 #define FMC1_FOGFUNC_VERTEX		(0<<28)
209 #define FMC1_FOGFUNC_PIXEL_EXP		(1<<28)
210 #define FMC1_FOGFUNC_PIXEL_EXP2		(2<<28)
211 #define FMC1_FOGFUNC_PIXEL_LINEAR	(3<<28)
212 #define FMC1_FOGFUNC_MASK		(3<<28)
213 #define FMC1_FOGINDEX_MODIFY_ENABLE     (1<<27)
214 #define FMC1_FOGINDEX_Z		        (0<<25)
215 #define FMC1_FOGINDEX_W			(1<<25)
216 #define FMC1_C1_C2_MODIFY_ENABLE	(1<<24)
217 #define FMC1_DENSITY_MODIFY_ENABLE	(1<<23)
218 #define FMC1_C1_ONE			(1<<13)
219 #define FMC1_C1_MASK		        (0xffff<<4)
220 /* Dword 2 */
221 #define FMC2_C2_ONE		        (1<<16)
222 /* Dword 3 */
223 #define FMC3_D_ONE			(1<<16)
224 
225 /* _3DSTATE_INDEPENDENT_ALPHA_BLEND, p177 */
226 #define _3DSTATE_INDEPENDENT_ALPHA_BLEND_CMD	(CMD_3D|(0x0b<<24))
227 #define IAB_MODIFY_ENABLE	        (1<<23)
228 #define IAB_ENABLE			(1<<22)
229 #define IAB_MODIFY_FUNC			(1<<21)
230 #define IAB_FUNC_SHIFT			16
231 #define IAB_MODIFY_SRC_FACTOR		(1<<11)
232 #define IAB_SRC_FACTOR_SHIFT		6
233 #define IAB_SRC_FACTOR_MASK		(BLENDFACT_MASK<<6)
234 #define IAB_MODIFY_DST_FACTOR	        (1<<5)
235 #define IAB_DST_FACTOR_SHIFT		0
236 #define IAB_DST_FACTOR_MASK		(BLENDFACT_MASK<<0)
237 
238 #define BLENDFACT_ZERO			0x01
239 #define BLENDFACT_ONE			0x02
240 #define BLENDFACT_SRC_COLR		0x03
241 #define BLENDFACT_INV_SRC_COLR		0x04
242 #define BLENDFACT_SRC_ALPHA		0x05
243 #define BLENDFACT_INV_SRC_ALPHA		0x06
244 #define BLENDFACT_DST_ALPHA		0x07
245 #define BLENDFACT_INV_DST_ALPHA		0x08
246 #define BLENDFACT_DST_COLR		0x09
247 #define BLENDFACT_INV_DST_COLR		0x0a
248 #define BLENDFACT_SRC_ALPHA_SATURATE	0x0b
249 #define BLENDFACT_CONST_COLOR		0x0c
250 #define BLENDFACT_INV_CONST_COLOR	0x0d
251 #define BLENDFACT_CONST_ALPHA		0x0e
252 #define BLENDFACT_INV_CONST_ALPHA	0x0f
253 #define BLENDFACT_MASK			0x0f
254 
255 #define BLENDFUNC_ADD			0x0
256 #define BLENDFUNC_SUBTRACT		0x1
257 #define BLENDFUNC_REVERSE_SUBTRACT	0x2
258 #define BLENDFUNC_MIN			0x3
259 #define BLENDFUNC_MAX			0x4
260 #define BLENDFUNC_MASK			0x7
261 
262 /* 3DSTATE_LOAD_INDIRECT, p180 */
263 
264 #define _3DSTATE_LOAD_INDIRECT	        (CMD_3D|(0x1d<<24)|(0x7<<16))
265 #define LI0_STATE_STATIC_INDIRECT       (0x01<<8)
266 #define LI0_STATE_DYNAMIC_INDIRECT      (0x02<<8)
267 #define LI0_STATE_SAMPLER               (0x04<<8)
268 #define LI0_STATE_MAP                   (0x08<<8)
269 #define LI0_STATE_PROGRAM               (0x10<<8)
270 #define LI0_STATE_CONSTANTS             (0x20<<8)
271 
272 #define SIS0_BUFFER_ADDRESS(x)          ((x)&~0x3)
273 #define SIS0_FORCE_LOAD                 (1<<1)
274 #define SIS0_BUFFER_VALID               (1<<0)
275 #define SIS1_BUFFER_LENGTH(x)           ((x)&0xff)
276 
277 #define DIS0_BUFFER_ADDRESS(x)          ((x)&~0x3)
278 #define DIS0_BUFFER_RESET               (1<<1)
279 #define DIS0_BUFFER_VALID               (1<<0)
280 
281 #define SSB0_BUFFER_ADDRESS(x)          ((x)&~0x3)
282 #define SSB0_FORCE_LOAD                 (1<<1)
283 #define SSB0_BUFFER_VALID               (1<<0)
284 #define SSB1_BUFFER_LENGTH(x)           ((x)&0xff)
285 
286 #define MSB0_BUFFER_ADDRESS(x)          ((x)&~0x3)
287 #define MSB0_FORCE_LOAD                 (1<<1)
288 #define MSB0_BUFFER_VALID               (1<<0)
289 #define MSB1_BUFFER_LENGTH(x)           ((x)&0xff)
290 
291 #define PSP0_BUFFER_ADDRESS(x)          ((x)&~0x3)
292 #define PSP0_FORCE_LOAD                 (1<<1)
293 #define PSP0_BUFFER_VALID               (1<<0)
294 #define PSP1_BUFFER_LENGTH(x)           ((x)&0xff)
295 
296 #define PSC0_BUFFER_ADDRESS(x)          ((x)&~0x3)
297 #define PSC0_FORCE_LOAD                 (1<<1)
298 #define PSC0_BUFFER_VALID               (1<<0)
299 #define PSC1_BUFFER_LENGTH(x)           ((x)&0xff)
300 
301 /* _3DSTATE_RASTERIZATION_RULES */
302 #define _3DSTATE_RASTER_RULES_CMD	(CMD_3D|(0x07<<24))
303 #define ENABLE_POINT_RASTER_RULE	(1<<15)
304 #define OGL_POINT_RASTER_RULE		(1<<13)
305 #define ENABLE_TEXKILL_3D_4D            (1<<10)
306 #define TEXKILL_3D                      (0<<9)
307 #define TEXKILL_4D                      (1<<9)
308 #define ENABLE_LINE_STRIP_PROVOKE_VRTX	(1<<8)
309 #define ENABLE_TRI_FAN_PROVOKE_VRTX	(1<<5)
310 #define LINE_STRIP_PROVOKE_VRTX(x)	((x)<<6)
311 #define TRI_FAN_PROVOKE_VRTX(x) 	((x)<<3)
312 
313 /* _3DSTATE_SCISSOR_ENABLE, p256 */
314 #define _3DSTATE_SCISSOR_ENABLE_CMD	(CMD_3D|(0x1c<<24)|(0x10<<19))
315 #define ENABLE_SCISSOR_RECT		((1<<1) | 1)
316 #define DISABLE_SCISSOR_RECT		(1<<1)
317 
318 /* _3DSTATE_SCISSOR_RECTANGLE_0, p257 */
319 #define _3DSTATE_SCISSOR_RECT_0_CMD	(CMD_3D|(0x1d<<24)|(0x81<<16)|1)
320 /* Dword 1 */
321 #define SCISSOR_RECT_0_YMIN(x)		((x)<<16)
322 #define SCISSOR_RECT_0_XMIN(x)		(x)
323 /* Dword 2 */
324 #define SCISSOR_RECT_0_YMAX(x)		((x)<<16)
325 #define SCISSOR_RECT_0_XMAX(x)		(x)
326 
327 /* p189 */
328 #define _3DSTATE_LOAD_STATE_IMMEDIATE_1   ((0x3<<29)|(0x1d<<24)|(0x04<<16))
329 #define I1_LOAD_S(n)                      (1<<(4+n))
330 
331 #define S0_VB_OFFSET_MASK              0xffffffc
332 #define S0_AUTO_CACHE_INV_DISABLE      (1<<0)
333 
334 #define S1_VERTEX_WIDTH_SHIFT          24
335 #define S1_VERTEX_WIDTH_MASK           (0x3f<<24)
336 #define S1_VERTEX_PITCH_SHIFT          16
337 #define S1_VERTEX_PITCH_MASK           (0x3f<<16)
338 
339 #define TEXCOORDFMT_2D                 0x0
340 #define TEXCOORDFMT_3D                 0x1
341 #define TEXCOORDFMT_4D                 0x2
342 #define TEXCOORDFMT_1D                 0x3
343 #define TEXCOORDFMT_2D_16              0x4
344 #define TEXCOORDFMT_4D_16              0x5
345 #define TEXCOORDFMT_NOT_PRESENT        0xf
346 #define S2_TEXCOORD_FMT0_MASK            0xf
347 #define S2_TEXCOORD_FMT1_SHIFT           4
348 #define S2_TEXCOORD_FMT(unit, type)    ((type)<<(unit*4))
349 #define S2_TEXCOORD_NONE               (~0)
350 
351 #define TEXCOORD_WRAP_SHORTEST_TCX	8
352 #define TEXCOORD_WRAP_SHORTEST_TCY	4
353 #define TEXCOORD_WRAP_SHORTEST_TCZ	2
354 #define TEXCOORD_PERSPECTIVE_DISABLE	1
355 
356 #define S3_WRAP_SHORTEST_TCX(unit)	(TEXCOORD_WRAP_SHORTEST_TCX << ((unit) * 4))
357 #define S3_WRAP_SHORTEST_TCY(unit)	(TEXCOORD_WRAP_SHORTEST_TCY << ((unit) * 4))
358 #define S3_WRAP_SHORTEST_TCZ(unit)	(TEXCOORD_WRAP_SHORTEST_TCZ << ((unit) * 4))
359 #define S3_PERSPECTIVE_DISABLE(unit)	(TEXCOORD_PERSPECTIVE_DISABLE << ((unit) * 4))
360 
361 /* S3 not interesting */
362 
363 #define S4_POINT_WIDTH_SHIFT           23
364 #define S4_POINT_WIDTH_MASK            (0x1ff<<23)
365 #define S4_LINE_WIDTH_SHIFT            19
366 #define S4_LINE_WIDTH_ONE              (0x2<<19)
367 #define S4_LINE_WIDTH_MASK             (0xf<<19)
368 #define S4_FLATSHADE_ALPHA             (1<<18)
369 #define S4_FLATSHADE_FOG               (1<<17)
370 #define S4_FLATSHADE_SPECULAR          (1<<16)
371 #define S4_FLATSHADE_COLOR             (1<<15)
372 #define S4_CULLMODE_BOTH	       (0<<13)
373 #define S4_CULLMODE_NONE	       (1<<13)
374 #define S4_CULLMODE_CW		       (2<<13)
375 #define S4_CULLMODE_CCW		       (3<<13)
376 #define S4_CULLMODE_MASK	       (3<<13)
377 #define S4_VFMT_POINT_WIDTH            (1<<12)
378 #define S4_VFMT_SPEC_FOG               (1<<11)
379 #define S4_VFMT_COLOR                  (1<<10)
380 #define S4_VFMT_DEPTH_OFFSET           (1<<9)
381 #define S4_VFMT_XYZ     	       (1<<6)
382 #define S4_VFMT_XYZW     	       (2<<6)
383 #define S4_VFMT_XY     		       (3<<6)
384 #define S4_VFMT_XYW     	       (4<<6)
385 #define S4_VFMT_XYZW_MASK              (7<<6)
386 #define S4_FORCE_DEFAULT_DIFFUSE       (1<<5)
387 #define S4_FORCE_DEFAULT_SPECULAR      (1<<4)
388 #define S4_LOCAL_DEPTH_OFFSET_ENABLE   (1<<3)
389 #define S4_VFMT_FOG_PARAM              (1<<2)
390 #define S4_SPRITE_POINT_ENABLE         (1<<1)
391 #define S4_LINE_ANTIALIAS_ENABLE       (1<<0)
392 
393 #define S4_VFMT_MASK (S4_VFMT_POINT_WIDTH   | 	\
394 		      S4_VFMT_SPEC_FOG      |	\
395 		      S4_VFMT_COLOR         |	\
396 		      S4_VFMT_DEPTH_OFFSET  |	\
397 		      S4_VFMT_XYZW_MASK     |	\
398 		      S4_VFMT_FOG_PARAM)
399 
400 #define S5_WRITEDISABLE_ALPHA          (1<<31)
401 #define S5_WRITEDISABLE_RED            (1<<30)
402 #define S5_WRITEDISABLE_GREEN          (1<<29)
403 #define S5_WRITEDISABLE_BLUE           (1<<28)
404 #define S5_WRITEDISABLE_MASK           (0xf<<28)
405 #define S5_FORCE_DEFAULT_POINT_SIZE    (1<<27)
406 #define S5_LAST_PIXEL_ENABLE           (1<<26)
407 #define S5_GLOBAL_DEPTH_OFFSET_ENABLE  (1<<25)
408 #define S5_FOG_ENABLE                  (1<<24)
409 #define S5_STENCIL_REF_SHIFT           16
410 #define S5_STENCIL_REF_MASK            (0xff<<16)
411 #define S5_STENCIL_TEST_FUNC_SHIFT     13
412 #define S5_STENCIL_TEST_FUNC_MASK      (0x7<<13)
413 #define S5_STENCIL_FAIL_SHIFT          10
414 #define S5_STENCIL_FAIL_MASK           (0x7<<10)
415 #define S5_STENCIL_PASS_Z_FAIL_SHIFT   7
416 #define S5_STENCIL_PASS_Z_FAIL_MASK    (0x7<<7)
417 #define S5_STENCIL_PASS_Z_PASS_SHIFT   4
418 #define S5_STENCIL_PASS_Z_PASS_MASK    (0x7<<4)
419 #define S5_STENCIL_WRITE_ENABLE        (1<<3)
420 #define S5_STENCIL_TEST_ENABLE         (1<<2)
421 #define S5_COLOR_DITHER_ENABLE         (1<<1)
422 #define S5_LOGICOP_ENABLE              (1<<0)
423 
424 #define S6_ALPHA_TEST_ENABLE           (1<<31)
425 #define S6_ALPHA_TEST_FUNC_SHIFT       28
426 #define S6_ALPHA_TEST_FUNC_MASK        (0x7<<28)
427 #define S6_ALPHA_REF_SHIFT             20
428 #define S6_ALPHA_REF_MASK              (0xff<<20)
429 #define S6_DEPTH_TEST_ENABLE           (1<<19)
430 #define S6_DEPTH_TEST_FUNC_SHIFT       16
431 #define S6_DEPTH_TEST_FUNC_MASK        (0x7<<16)
432 #define S6_CBUF_BLEND_ENABLE           (1<<15)
433 #define S6_CBUF_BLEND_FUNC_SHIFT       12
434 #define S6_CBUF_BLEND_FUNC_MASK        (0x7<<12)
435 #define S6_CBUF_SRC_BLEND_FACT_SHIFT   8
436 #define S6_CBUF_SRC_BLEND_FACT_MASK    (0xf<<8)
437 #define S6_CBUF_DST_BLEND_FACT_SHIFT   4
438 #define S6_CBUF_DST_BLEND_FACT_MASK    (0xf<<4)
439 #define S6_DEPTH_WRITE_ENABLE          (1<<3)
440 #define S6_COLOR_WRITE_ENABLE          (1<<2)
441 #define S6_TRISTRIP_PV_SHIFT           0
442 #define S6_TRISTRIP_PV_MASK            (0x3<<0)
443 
444 #define S7_DEPTH_OFFSET_CONST_MASK     ~0
445 
446 /* 3DSTATE_MAP_DEINTERLACER_PARAMETERS */
447 /* 3DSTATE_MAP_PALETTE_LOAD_32, p206 */
448 
449 /* _3DSTATE_MODES_4, p218 */
450 #define _3DSTATE_MODES_4_CMD		(CMD_3D|(0x0d<<24))
451 #define ENABLE_LOGIC_OP_FUNC		(1<<23)
452 #define LOGIC_OP_FUNC(x)		((x)<<18)
453 #define LOGICOP_MASK			(0xf<<18)
454 #define LOGICOP_COPY			0xc
455 #define MODE4_ENABLE_STENCIL_TEST_MASK	((1<<17)|(0xff00))
456 #define ENABLE_STENCIL_TEST_MASK	(1<<17)
457 #define STENCIL_TEST_MASK(x)		((x)<<8)
458 #define MODE4_ENABLE_STENCIL_WRITE_MASK	((1<<16)|(0x00ff))
459 #define ENABLE_STENCIL_WRITE_MASK	(1<<16)
460 #define STENCIL_WRITE_MASK(x)		((x)&0xff)
461 
462 /* _3DSTATE_MODES_5, p220 */
463 #define _3DSTATE_MODES_5_CMD		(CMD_3D|(0x0c<<24))
464 #define PIPELINE_FLUSH_RENDER_CACHE	(1<<18)
465 #define PIPELINE_FLUSH_TEXTURE_CACHE	(1<<16)
466 
467 /* p221 */
468 #define _3DSTATE_PIXEL_SHADER_CONSTANTS  (CMD_3D|(0x1d<<24)|(0x6<<16))
469 #define PS1_REG(n)                      (1<<(n))
470 #define PS2_CONST_X(n)                  (n)
471 #define PS3_CONST_Y(n)                  (n)
472 #define PS4_CONST_Z(n)                  (n)
473 #define PS5_CONST_W(n)                  (n)
474 
475 /* p222 */
476 
477 #define I915_MAX_TEX_INDIRECT 4
478 #define I915_MAX_TEX_INSN     32
479 #define I915_MAX_ALU_INSN     64
480 #define I915_MAX_DECL_INSN    27
481 #define I915_MAX_TEMPORARY    16
482 
483 /* Each instruction is 3 dwords long, though most don't require all
484  * this space.  Maximum of 123 instructions.  Smaller maxes per insn
485  * type.
486  */
487 #define _3DSTATE_PIXEL_SHADER_PROGRAM    (CMD_3D|(0x1d<<24)|(0x5<<16))
488 
489 #define REG_TYPE_R                 0	/* temporary regs, no need to
490 					 * dcl, must be written before
491 					 * read -- Preserved between
492 					 * phases.
493 					 */
494 #define REG_TYPE_T                 1	/* Interpolated values, must be
495 					 * dcl'ed before use.
496 					 *
497 					 * 0..7: texture coord,
498 					 * 8: diffuse spec,
499 					 * 9: specular color,
500 					 * 10: fog parameter in w.
501 					 */
502 #define REG_TYPE_CONST             2	/* Restriction: only one const
503 					 * can be referenced per
504 					 * instruction, though it may be
505 					 * selected for multiple inputs.
506 					 * Constants not initialized
507 					 * default to zero.
508 					 */
509 #define REG_TYPE_S                 3	/* sampler */
510 #define REG_TYPE_OC                4	/* output color (rgba) */
511 #define REG_TYPE_OD                5	/* output depth (w), xyz are
512 					 * temporaries.  If not written,
513 					 * interpolated depth is used?
514 					 */
515 #define REG_TYPE_U                 6	/* unpreserved temporaries */
516 #define REG_TYPE_MASK              0x7
517 #define REG_NR_MASK                0xf
518 
519 /* REG_TYPE_T:
520  */
521 #define T_TEX0     0
522 #define T_TEX1     1
523 #define T_TEX2     2
524 #define T_TEX3     3
525 #define T_TEX4     4
526 #define T_TEX5     5
527 #define T_TEX6     6
528 #define T_TEX7     7
529 #define T_DIFFUSE  8
530 #define T_SPECULAR 9
531 #define T_FOG_W    10		/* interpolated fog is in W coord */
532 
533 /* Arithmetic instructions */
534 
535 /* .replicate_swizzle == selection and replication of a particular
536  * scalar channel, ie., .xxxx, .yyyy, .zzzz or .wwww
537  */
538 #define A0_NOP    (0x0<<24)	/* no operation */
539 #define A0_ADD    (0x1<<24)	/* dst = src0 + src1 */
540 #define A0_MOV    (0x2<<24)	/* dst = src0 */
541 #define A0_MUL    (0x3<<24)	/* dst = src0 * src1 */
542 #define A0_MAD    (0x4<<24)	/* dst = src0 * src1 + src2 */
543 #define A0_DP2ADD (0x5<<24)	/* dst.xyzw = src0.xy dot src1.xy + src2.replicate_swizzle */
544 #define A0_DP3    (0x6<<24)	/* dst.xyzw = src0.xyz dot src1.xyz */
545 #define A0_DP4    (0x7<<24)	/* dst.xyzw = src0.xyzw dot src1.xyzw */
546 #define A0_FRC    (0x8<<24)	/* dst = src0 - floor(src0) */
547 #define A0_RCP    (0x9<<24)	/* dst.xyzw = 1/(src0.replicate_swizzle) */
548 #define A0_RSQ    (0xa<<24)	/* dst.xyzw = 1/(sqrt(abs(src0.replicate_swizzle))) */
549 #define A0_EXP    (0xb<<24)	/* dst.xyzw = exp2(src0.replicate_swizzle) */
550 #define A0_LOG    (0xc<<24)	/* dst.xyzw = log2(abs(src0.replicate_swizzle)) */
551 #define A0_CMP    (0xd<<24)	/* dst = (src0 >= 0.0) ? src1 : src2 */
552 #define A0_MIN    (0xe<<24)	/* dst = (src0 < src1) ? src0 : src1 */
553 #define A0_MAX    (0xf<<24)	/* dst = (src0 >= src1) ? src0 : src1 */
554 #define A0_FLR    (0x10<<24)	/* dst = floor(src0) */
555 #define A0_MOD    (0x11<<24)	/* dst = src0 fmod 1.0 */
556 #define A0_TRC    (0x12<<24)	/* dst = int(src0) */
557 #define A0_SGE    (0x13<<24)	/* dst = src0 >= src1 ? 1.0 : 0.0 */
558 #define A0_SLT    (0x14<<24)	/* dst = src0 < src1 ? 1.0 : 0.0 */
559 #define A0_DEST_SATURATE                 (1<<22)
560 #define A0_DEST_TYPE_SHIFT                19
561 /* Allow: R, OC, OD, U */
562 #define A0_DEST_NR_SHIFT                 14
563 /* Allow R: 0..15, OC,OD: 0..0, U: 0..2 */
564 #define A0_DEST_CHANNEL_X                (1<<10)
565 #define A0_DEST_CHANNEL_Y                (2<<10)
566 #define A0_DEST_CHANNEL_Z                (4<<10)
567 #define A0_DEST_CHANNEL_W                (8<<10)
568 #define A0_DEST_CHANNEL_ALL              (0xf<<10)
569 #define A0_DEST_CHANNEL_SHIFT            10
570 #define A0_SRC0_TYPE_SHIFT               7
571 #define A0_SRC0_NR_SHIFT                 2
572 
573 #define A0_DEST_CHANNEL_XY              (A0_DEST_CHANNEL_X|A0_DEST_CHANNEL_Y)
574 #define A0_DEST_CHANNEL_XYZ             (A0_DEST_CHANNEL_XY|A0_DEST_CHANNEL_Z)
575 
576 #define SRC_X        0
577 #define SRC_Y        1
578 #define SRC_Z        2
579 #define SRC_W        3
580 #define SRC_ZERO     4
581 #define SRC_ONE      5
582 
583 #define A1_SRC0_CHANNEL_X_NEGATE         (1<<31)
584 #define A1_SRC0_CHANNEL_X_SHIFT          28
585 #define A1_SRC0_CHANNEL_Y_NEGATE         (1<<27)
586 #define A1_SRC0_CHANNEL_Y_SHIFT          24
587 #define A1_SRC0_CHANNEL_Z_NEGATE         (1<<23)
588 #define A1_SRC0_CHANNEL_Z_SHIFT          20
589 #define A1_SRC0_CHANNEL_W_NEGATE         (1<<19)
590 #define A1_SRC0_CHANNEL_W_SHIFT          16
591 #define A1_SRC1_TYPE_SHIFT               13
592 #define A1_SRC1_NR_SHIFT                 8
593 #define A1_SRC1_CHANNEL_X_NEGATE         (1<<7)
594 #define A1_SRC1_CHANNEL_X_SHIFT          4
595 #define A1_SRC1_CHANNEL_Y_NEGATE         (1<<3)
596 #define A1_SRC1_CHANNEL_Y_SHIFT          0
597 
598 #define A2_SRC1_CHANNEL_Z_NEGATE         (1<<31)
599 #define A2_SRC1_CHANNEL_Z_SHIFT          28
600 #define A2_SRC1_CHANNEL_W_NEGATE         (1<<27)
601 #define A2_SRC1_CHANNEL_W_SHIFT          24
602 #define A2_SRC2_TYPE_SHIFT               21
603 #define A2_SRC2_NR_SHIFT                 16
604 #define A2_SRC2_CHANNEL_X_NEGATE         (1<<15)
605 #define A2_SRC2_CHANNEL_X_SHIFT          12
606 #define A2_SRC2_CHANNEL_Y_NEGATE         (1<<11)
607 #define A2_SRC2_CHANNEL_Y_SHIFT          8
608 #define A2_SRC2_CHANNEL_Z_NEGATE         (1<<7)
609 #define A2_SRC2_CHANNEL_Z_SHIFT          4
610 #define A2_SRC2_CHANNEL_W_NEGATE         (1<<3)
611 #define A2_SRC2_CHANNEL_W_SHIFT          0
612 
613 /* Texture instructions */
614 #define T0_TEXLD     (0x15<<24)	/* Sample texture using predeclared
615 				 * sampler and address, and output
616 				 * filtered texel data to destination
617 				 * register */
618 #define T0_TEXLDP    (0x16<<24)	/* Same as texld but performs a
619 				 * perspective divide of the texture
620 				 * coordinate .xyz values by .w before
621 				 * sampling. */
622 #define T0_TEXLDB    (0x17<<24)	/* Same as texld but biases the
623 				 * computed LOD by w.  Only S4.6 two's
624 				 * comp is used.  This implies that a
625 				 * float to fixed conversion is
626 				 * done. */
627 #define T0_TEXKILL   (0x18<<24)	/* Does not perform a sampling
628 				 * operation.  Simply kills the pixel
629 				 * if any channel of the address
630 				 * register is < 0.0. */
631 #define T0_DEST_TYPE_SHIFT                19
632 /* Allow: R, OC, OD, U */
633 /* Note: U (unpreserved) regs do not retain their values between
634  * phases (cannot be used for feedback)
635  *
636  * Note: oC and OD registers can only be used as the destination of a
637  * texture instruction once per phase (this is an implementation
638  * restriction).
639  */
640 #define T0_DEST_NR_SHIFT                 14
641 /* Allow R: 0..15, OC,OD: 0..0, U: 0..2 */
642 #define T0_SAMPLER_NR_SHIFT              0	/* This field ignored for TEXKILL */
643 #define T0_SAMPLER_NR_MASK               (0xf<<0)
644 
645 #define T1_ADDRESS_REG_TYPE_SHIFT        24	/* Reg to use as texture coord */
646 /* Allow R, T, OC, OD -- R, OC, OD are 'dependent' reads, new program phase */
647 #define T1_ADDRESS_REG_NR_SHIFT          17
648 #define T2_MBZ                           0
649 
650 /* Declaration instructions */
651 #define D0_DCL       (0x19<<24)	/* Declare a t (interpolated attrib)
652 				 * register or an s (sampler)
653 				 * register. */
654 #define D0_SAMPLE_TYPE_SHIFT              22
655 #define D0_SAMPLE_TYPE_2D                 (0x0<<22)
656 #define D0_SAMPLE_TYPE_CUBE               (0x1<<22)
657 #define D0_SAMPLE_TYPE_VOLUME             (0x2<<22)
658 #define D0_SAMPLE_TYPE_MASK               (0x3<<22)
659 
660 #define D0_TYPE_SHIFT                19
661 /* Allow: T, S */
662 #define D0_NR_SHIFT                  14
663 /* Allow T: 0..10, S: 0..15 */
664 #define D0_CHANNEL_X                (1<<10)
665 #define D0_CHANNEL_Y                (2<<10)
666 #define D0_CHANNEL_Z                (4<<10)
667 #define D0_CHANNEL_W                (8<<10)
668 #define D0_CHANNEL_ALL              (0xf<<10)
669 #define D0_CHANNEL_NONE             (0<<10)
670 
671 #define D0_CHANNEL_XY               (D0_CHANNEL_X|D0_CHANNEL_Y)
672 #define D0_CHANNEL_XYZ              (D0_CHANNEL_XY|D0_CHANNEL_Z)
673 
674 /* I915 Errata: Do not allow (xz), (xw), (xzw) combinations for diffuse
675  * or specular declarations.
676  *
677  * For T dcls, only allow: (x), (xy), (xyz), (w), (xyzw)
678  *
679  * Must be zero for S (sampler) dcls
680  */
681 #define D1_MBZ                          0
682 #define D2_MBZ                          0
683 
684 /* p207.
685  * The DWORD count is 3 times the number of bits set in MS1_MAPMASK_MASK
686  */
687 #define _3DSTATE_MAP_STATE               (CMD_3D|(0x1d<<24)|(0x0<<16))
688 
689 #define MS1_MAPMASK_SHIFT               0
690 #define MS1_MAPMASK_MASK                (0x8fff<<0)
691 
692 #define MS2_UNTRUSTED_SURFACE           (1<<31)
693 #define MS2_ADDRESS_MASK                0xfffffffc
694 #define MS2_VERTICAL_LINE_STRIDE        (1<<1)
695 #define MS2_VERTICAL_OFFSET             (1<<1)
696 
697 #define MS3_HEIGHT_SHIFT              21
698 #define MS3_WIDTH_SHIFT               10
699 #define MS3_PALETTE_SELECT            (1<<9)
700 #define MS3_MAPSURF_FORMAT_SHIFT      7
701 #define MS3_MAPSURF_FORMAT_MASK       (0x7<<7)
702 #define    MAPSURF_8BIT			   (1<<7)
703 #define    MAPSURF_16BIT		   (2<<7)
704 #define    MAPSURF_32BIT		   (3<<7)
705 #define    MAPSURF_422			   (5<<7)
706 #define    MAPSURF_COMPRESSED		   (6<<7)
707 #define    MAPSURF_4BIT_INDEXED		   (7<<7)
708 #define MS3_MT_FORMAT_MASK         (0x7 << 3)
709 #define MS3_MT_FORMAT_SHIFT        3
710 #define    MT_4BIT_IDX_ARGB8888	           (7<<3)	/* SURFACE_4BIT_INDEXED */
711 #define    MT_8BIT_I8		           (0<<3)	/* SURFACE_8BIT */
712 #define    MT_8BIT_L8		           (1<<3)
713 #define    MT_8BIT_A8		           (4<<3)
714 #define    MT_8BIT_MONO8	           (5<<3)
715 #define    MT_16BIT_RGB565		   (0<<3)	/* SURFACE_16BIT */
716 #define    MT_16BIT_ARGB1555		   (1<<3)
717 #define    MT_16BIT_ARGB4444		   (2<<3)
718 #define    MT_16BIT_AY88		   (3<<3)
719 #define    MT_16BIT_88DVDU	           (5<<3)
720 #define    MT_16BIT_BUMP_655LDVDU	   (6<<3)
721 #define    MT_16BIT_I16	                   (7<<3)
722 #define    MT_16BIT_L16	                   (8<<3)
723 #define    MT_16BIT_A16	                   (9<<3)
724 #define    MT_32BIT_ARGB8888		   (0<<3)	/* SURFACE_32BIT */
725 #define    MT_32BIT_ABGR8888		   (1<<3)
726 #define    MT_32BIT_XRGB8888		   (2<<3)
727 #define    MT_32BIT_XBGR8888		   (3<<3)
728 #define    MT_32BIT_QWVU8888		   (4<<3)
729 #define    MT_32BIT_AXVU8888		   (5<<3)
730 #define    MT_32BIT_LXVU8888	           (6<<3)
731 #define    MT_32BIT_XLVU8888	           (7<<3)
732 #define    MT_32BIT_ARGB2101010	           (8<<3)
733 #define    MT_32BIT_ABGR2101010	           (9<<3)
734 #define    MT_32BIT_AWVU2101010	           (0xA<<3)
735 #define    MT_32BIT_GR1616	           (0xB<<3)
736 #define    MT_32BIT_VU1616	           (0xC<<3)
737 #define    MT_32BIT_xI824	           (0xD<<3)
738 #define    MT_32BIT_xA824	           (0xE<<3)
739 #define    MT_32BIT_xL824	           (0xF<<3)
740 #define    MT_422_YCRCB_SWAPY	           (0<<3)	/* SURFACE_422 */
741 #define    MT_422_YCRCB_NORMAL	           (1<<3)
742 #define    MT_422_YCRCB_SWAPUV	           (2<<3)
743 #define    MT_422_YCRCB_SWAPUVY	           (3<<3)
744 #define    MT_COMPRESS_DXT1		   (0<<3)	/* SURFACE_COMPRESSED */
745 #define    MT_COMPRESS_DXT2_3	           (1<<3)
746 #define    MT_COMPRESS_DXT4_5	           (2<<3)
747 #define    MT_COMPRESS_FXT1		   (3<<3)
748 #define    MT_COMPRESS_DXT1_RGB		   (4<<3)
749 #define MS3_USE_FENCE_REGS              (1<<2)
750 #define MS3_TILED_SURFACE             (1<<1)
751 #define MS3_TILE_WALK                 (1<<0)
752 
753 /* The pitch is the pitch measured in DWORDS, minus 1 */
754 #define MS4_PITCH_SHIFT                 21
755 #define MS4_CUBE_FACE_ENA_NEGX          (1<<20)
756 #define MS4_CUBE_FACE_ENA_POSX          (1<<19)
757 #define MS4_CUBE_FACE_ENA_NEGY          (1<<18)
758 #define MS4_CUBE_FACE_ENA_POSY          (1<<17)
759 #define MS4_CUBE_FACE_ENA_NEGZ          (1<<16)
760 #define MS4_CUBE_FACE_ENA_POSZ          (1<<15)
761 #define MS4_CUBE_FACE_ENA_MASK          (0x3f<<15)
762 #define MS4_MAX_LOD_SHIFT		9
763 #define MS4_MAX_LOD_MASK		(0x3f<<9)
764 #define MS4_MIP_LAYOUT_LEGACY           (0<<8)
765 #define MS4_MIP_LAYOUT_BELOW_LPT        (0<<8)
766 #define MS4_MIP_LAYOUT_RIGHT_LPT        (1<<8)
767 #define MS4_VOLUME_DEPTH_SHIFT          0
768 #define MS4_VOLUME_DEPTH_MASK           (0xff<<0)
769 
770 /* p244.
771  * The DWORD count is 3 times the number of bits set in SS1_MAPMASK_MASK.
772  */
773 #define _3DSTATE_SAMPLER_STATE         (CMD_3D|(0x1d<<24)|(0x1<<16))
774 
775 #define SS1_MAPMASK_SHIFT               0
776 #define SS1_MAPMASK_MASK                (0x8fff<<0)
777 
778 #define SS2_REVERSE_GAMMA_ENABLE        (1<<31)
779 #define SS2_PACKED_TO_PLANAR_ENABLE     (1<<30)
780 #define SS2_COLORSPACE_CONVERSION       (1<<29)
781 #define SS2_CHROMAKEY_SHIFT             27
782 #define SS2_BASE_MIP_LEVEL_SHIFT        22
783 #define SS2_BASE_MIP_LEVEL_MASK         (0x1f<<22)
784 #define SS2_MIP_FILTER_SHIFT            20
785 #define SS2_MIP_FILTER_MASK             (0x3<<20)
786 #define   MIPFILTER_NONE       	0
787 #define   MIPFILTER_NEAREST	1
788 #define   MIPFILTER_LINEAR	3
789 #define SS2_MAG_FILTER_SHIFT          17
790 #define SS2_MAG_FILTER_MASK           (0x7<<17)
791 #define   FILTER_NEAREST	0
792 #define   FILTER_LINEAR		1
793 #define   FILTER_ANISOTROPIC	2
794 #define   FILTER_4X4_1    	3
795 #define   FILTER_4X4_2    	4
796 #define   FILTER_4X4_FLAT 	5
797 #define   FILTER_6X5_MONO   	6	/* XXX - check */
798 #define SS2_MIN_FILTER_SHIFT          14
799 #define SS2_MIN_FILTER_MASK           (0x7<<14)
800 #define SS2_LOD_BIAS_SHIFT            5
801 #define SS2_LOD_BIAS_ONE              (0x10<<5)
802 #define SS2_LOD_BIAS_MASK             (0x1ff<<5)
803 /* Shadow requires:
804  *  MT_X8{I,L,A}24 or MT_{I,L,A}16 texture format
805  *  FILTER_4X4_x  MIN and MAG filters
806  */
807 #define SS2_SHADOW_ENABLE             (1<<4)
808 #define SS2_MAX_ANISO_MASK            (1<<3)
809 #define SS2_MAX_ANISO_2               (0<<3)
810 #define SS2_MAX_ANISO_4               (1<<3)
811 #define SS2_SHADOW_FUNC_SHIFT         0
812 #define SS2_SHADOW_FUNC_MASK          (0x7<<0)
813 /* SS2_SHADOW_FUNC values: see COMPAREFUNC_* */
814 
815 #define SS3_MIN_LOD_SHIFT            24
816 #define SS3_MIN_LOD_ONE              (0x10<<24)
817 #define SS3_MIN_LOD_MASK             (0xff<<24)
818 #define SS3_KILL_PIXEL_ENABLE        (1<<17)
819 #define SS3_TCX_ADDR_MODE_SHIFT      12
820 #define SS3_TCX_ADDR_MODE_MASK       (0x7<<12)
821 #define   TEXCOORDMODE_WRAP		0
822 #define   TEXCOORDMODE_MIRROR		1
823 #define   TEXCOORDMODE_CLAMP_EDGE	2
824 #define   TEXCOORDMODE_CUBE       	3
825 #define   TEXCOORDMODE_CLAMP_BORDER	4
826 #define   TEXCOORDMODE_MIRROR_ONCE      5
827 #define SS3_TCY_ADDR_MODE_SHIFT      9
828 #define SS3_TCY_ADDR_MODE_MASK       (0x7<<9)
829 #define SS3_TCZ_ADDR_MODE_SHIFT      6
830 #define SS3_TCZ_ADDR_MODE_MASK       (0x7<<6)
831 #define SS3_NORMALIZED_COORDS        (1<<5)
832 #define SS3_TEXTUREMAP_INDEX_SHIFT   1
833 #define SS3_TEXTUREMAP_INDEX_MASK    (0xf<<1)
834 #define SS3_DEINTERLACER_ENABLE      (1<<0)
835 
836 #define SS4_BORDER_COLOR_MASK        (~0)
837 
838 /* 3DSTATE_SPAN_STIPPLE, p258
839  */
840 #define _3DSTATE_STIPPLE           ((0x3<<29)|(0x1d<<24)|(0x83<<16))
841 #define ST1_ENABLE               (1<<16)
842 #define ST1_MASK                 (0xffff)
843 
844 #define FLUSH_MAP_CACHE    (1<<0)
845 #define FLUSH_RENDER_CACHE (1<<1)
846 
847 #endif
848 /* -*- c-basic-offset: 4 -*- */
849 /*
850  * Copyright © 2006,2010 Intel Corporation
851  *
852  * Permission is hereby granted, free of charge, to any person obtaining a
853  * copy of this software and associated documentation files (the "Software"),
854  * to deal in the Software without restriction, including without limitation
855  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
856  * and/or sell copies of the Software, and to permit persons to whom the
857  * Software is furnished to do so, subject to the following conditions:
858  *
859  * The above copyright notice and this permission notice (including the next
860  * paragraph) shall be included in all copies or substantial portions of the
861  * Software.
862  *
863  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
864  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
865  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
866  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
867  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
868  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
869  * SOFTWARE.
870  *
871  * Authors:
872  *    Eric Anholt <eric@anholt.net>
873  *    Chris Wilson <chris@chris-wilson.co.uk>
874  *
875  */
876 
877 /* Each instruction is 3 dwords long, though most don't require all
878  * this space.  Maximum of 123 instructions.  Smaller maxes per insn
879  * type.
880  */
881 #define _3DSTATE_PIXEL_SHADER_PROGRAM    (CMD_3D|(0x1d<<24)|(0x5<<16))
882 
883 #define REG_TYPE_R                 0 /* temporary regs, no need to
884 				      * dcl, must be written before
885 				      * read -- Preserved between
886 				      * phases.
887 				      */
888 #define REG_TYPE_T                 1 /* Interpolated values, must be
889 				      * dcl'ed before use.
890 				      *
891 				      * 0..7: texture coord,
892 				      * 8: diffuse spec,
893 				      * 9: specular color,
894 				      * 10: fog parameter in w.
895 				      */
896 #define REG_TYPE_CONST             2 /* Restriction: only one const
897 				      * can be referenced per
898 				      * instruction, though it may be
899 				      * selected for multiple inputs.
900 				      * Constants not initialized
901 				      * default to zero.
902 				      */
903 #define REG_TYPE_S                 3 /* sampler */
904 #define REG_TYPE_OC                4 /* output color (rgba) */
905 #define REG_TYPE_OD                5 /* output depth (w), xyz are
906 				      * temporaries.  If not written,
907 				      * interpolated depth is used?
908 				      */
909 #define REG_TYPE_U                 6 /* unpreserved temporaries */
910 #define REG_TYPE_MASK              0x7
911 #define REG_TYPE_SHIFT		   4
912 #define REG_NR_MASK                0xf
913 
914 /* REG_TYPE_T:
915 */
916 #define T_TEX0     0
917 #define T_TEX1     1
918 #define T_TEX2     2
919 #define T_TEX3     3
920 #define T_TEX4     4
921 #define T_TEX5     5
922 #define T_TEX6     6
923 #define T_TEX7     7
924 #define T_DIFFUSE  8
925 #define T_SPECULAR 9
926 #define T_FOG_W    10		/* interpolated fog is in W coord */
927 
928 /* Arithmetic instructions */
929 
930 /* .replicate_swizzle == selection and replication of a particular
931  * scalar channel, ie., .xxxx, .yyyy, .zzzz or .wwww
932  */
933 #define A0_NOP    (0x0<<24)		/* no operation */
934 #define A0_ADD    (0x1<<24)		/* dst = src0 + src1 */
935 #define A0_MOV    (0x2<<24)		/* dst = src0 */
936 #define A0_MUL    (0x3<<24)		/* dst = src0 * src1 */
937 #define A0_MAD    (0x4<<24)		/* dst = src0 * src1 + src2 */
938 #define A0_DP2ADD (0x5<<24)		/* dst.xyzw = src0.xy dot src1.xy + src2.replicate_swizzle */
939 #define A0_DP3    (0x6<<24)		/* dst.xyzw = src0.xyz dot src1.xyz */
940 #define A0_DP4    (0x7<<24)		/* dst.xyzw = src0.xyzw dot src1.xyzw */
941 #define A0_FRC    (0x8<<24)		/* dst = src0 - floor(src0) */
942 #define A0_RCP    (0x9<<24)		/* dst.xyzw = 1/(src0.replicate_swizzle) */
943 #define A0_RSQ    (0xa<<24)		/* dst.xyzw = 1/(sqrt(abs(src0.replicate_swizzle))) */
944 #define A0_EXP    (0xb<<24)		/* dst.xyzw = exp2(src0.replicate_swizzle) */
945 #define A0_LOG    (0xc<<24)		/* dst.xyzw = log2(abs(src0.replicate_swizzle)) */
946 #define A0_CMP    (0xd<<24)		/* dst = (src0 >= 0.0) ? src1 : src2 */
947 #define A0_MIN    (0xe<<24)		/* dst = (src0 < src1) ? src0 : src1 */
948 #define A0_MAX    (0xf<<24)		/* dst = (src0 >= src1) ? src0 : src1 */
949 #define A0_FLR    (0x10<<24)		/* dst = floor(src0) */
950 #define A0_MOD    (0x11<<24)		/* dst = src0 fmod 1.0 */
951 #define A0_TRC    (0x12<<24)		/* dst = int(src0) */
952 #define A0_SGE    (0x13<<24)		/* dst = src0 >= src1 ? 1.0 : 0.0 */
953 #define A0_SLT    (0x14<<24)		/* dst = src0 < src1 ? 1.0 : 0.0 */
954 #define A0_DEST_SATURATE                 (1<<22)
955 #define A0_DEST_TYPE_SHIFT                19
956 /* Allow: R, OC, OD, U */
957 #define A0_DEST_NR_SHIFT                 14
958 /* Allow R: 0..15, OC,OD: 0..0, U: 0..2 */
959 #define A0_DEST_CHANNEL_X                (1<<10)
960 #define A0_DEST_CHANNEL_Y                (2<<10)
961 #define A0_DEST_CHANNEL_Z                (4<<10)
962 #define A0_DEST_CHANNEL_W                (8<<10)
963 #define A0_DEST_CHANNEL_ALL              (0xf<<10)
964 #define A0_DEST_CHANNEL_SHIFT            10
965 #define A0_SRC0_TYPE_SHIFT               7
966 #define A0_SRC0_NR_SHIFT                 2
967 
968 #define A0_DEST_CHANNEL_XY              (A0_DEST_CHANNEL_X|A0_DEST_CHANNEL_Y)
969 #define A0_DEST_CHANNEL_XYZ             (A0_DEST_CHANNEL_XY|A0_DEST_CHANNEL_Z)
970 
971 #define SRC_X        0
972 #define SRC_Y        1
973 #define SRC_Z        2
974 #define SRC_W        3
975 #define SRC_ZERO     4
976 #define SRC_ONE      5
977 
978 #define A1_SRC0_CHANNEL_X_NEGATE         (1<<31)
979 #define A1_SRC0_CHANNEL_X_SHIFT          28
980 #define A1_SRC0_CHANNEL_Y_NEGATE         (1<<27)
981 #define A1_SRC0_CHANNEL_Y_SHIFT          24
982 #define A1_SRC0_CHANNEL_Z_NEGATE         (1<<23)
983 #define A1_SRC0_CHANNEL_Z_SHIFT          20
984 #define A1_SRC0_CHANNEL_W_NEGATE         (1<<19)
985 #define A1_SRC0_CHANNEL_W_SHIFT          16
986 #define A1_SRC1_TYPE_SHIFT               13
987 #define A1_SRC1_NR_SHIFT                 8
988 #define A1_SRC1_CHANNEL_X_NEGATE         (1<<7)
989 #define A1_SRC1_CHANNEL_X_SHIFT          4
990 #define A1_SRC1_CHANNEL_Y_NEGATE         (1<<3)
991 #define A1_SRC1_CHANNEL_Y_SHIFT          0
992 
993 #define A2_SRC1_CHANNEL_Z_NEGATE         (1<<31)
994 #define A2_SRC1_CHANNEL_Z_SHIFT          28
995 #define A2_SRC1_CHANNEL_W_NEGATE         (1<<27)
996 #define A2_SRC1_CHANNEL_W_SHIFT          24
997 #define A2_SRC2_TYPE_SHIFT               21
998 #define A2_SRC2_NR_SHIFT                 16
999 #define A2_SRC2_CHANNEL_X_NEGATE         (1<<15)
1000 #define A2_SRC2_CHANNEL_X_SHIFT          12
1001 #define A2_SRC2_CHANNEL_Y_NEGATE         (1<<11)
1002 #define A2_SRC2_CHANNEL_Y_SHIFT          8
1003 #define A2_SRC2_CHANNEL_Z_NEGATE         (1<<7)
1004 #define A2_SRC2_CHANNEL_Z_SHIFT          4
1005 #define A2_SRC2_CHANNEL_W_NEGATE         (1<<3)
1006 #define A2_SRC2_CHANNEL_W_SHIFT          0
1007 
1008 /* Texture instructions */
1009 #define T0_TEXLD     (0x15<<24)	/* Sample texture using predeclared
1010 				 * sampler and address, and output
1011 				 * filtered texel data to destination
1012 				 * register */
1013 #define T0_TEXLDP    (0x16<<24)	/* Same as texld but performs a
1014 				 * perspective divide of the texture
1015 				 * coordinate .xyz values by .w before
1016 				 * sampling. */
1017 #define T0_TEXLDB    (0x17<<24)	/* Same as texld but biases the
1018 				 * computed LOD by w.  Only S4.6 two's
1019 				 * comp is used.  This implies that a
1020 				 * float to fixed conversion is
1021 				 * done. */
1022 #define T0_TEXKILL   (0x18<<24)	/* Does not perform a sampling
1023 				 * operation.  Simply kills the pixel
1024 				 * if any channel of the address
1025 				 * register is < 0.0. */
1026 #define T0_DEST_TYPE_SHIFT                19
1027 /* Allow: R, OC, OD, U */
1028 /* Note: U (unpreserved) regs do not retain their values between
1029  * phases (cannot be used for feedback)
1030  *
1031  * Note: oC and OD registers can only be used as the destination of a
1032  * texture instruction once per phase (this is an implementation
1033  * restriction).
1034  */
1035 #define T0_DEST_NR_SHIFT                 14
1036 /* Allow R: 0..15, OC,OD: 0..0, U: 0..2 */
1037 #define T0_SAMPLER_NR_SHIFT              0 /* This field ignored for TEXKILL */
1038 #define T0_SAMPLER_NR_MASK               (0xf<<0)
1039 
1040 #define T1_ADDRESS_REG_TYPE_SHIFT        24 /* Reg to use as texture coord */
1041 /* Allow R, T, OC, OD -- R, OC, OD are 'dependent' reads, new program phase */
1042 #define T1_ADDRESS_REG_NR_SHIFT          17
1043 #define T2_MBZ                           0
1044 
1045 /* Declaration instructions */
1046 #define D0_DCL       (0x19<<24)	/* Declare a t (interpolated attrib)
1047 				 * register or an s (sampler)
1048 				 * register. */
1049 #define D0_SAMPLE_TYPE_SHIFT              22
1050 #define D0_SAMPLE_TYPE_2D                 (0x0<<22)
1051 #define D0_SAMPLE_TYPE_CUBE               (0x1<<22)
1052 #define D0_SAMPLE_TYPE_VOLUME             (0x2<<22)
1053 #define D0_SAMPLE_TYPE_MASK               (0x3<<22)
1054 
1055 #define D0_TYPE_SHIFT                19
1056 /* Allow: T, S */
1057 #define D0_NR_SHIFT                  14
1058 /* Allow T: 0..10, S: 0..15 */
1059 #define D0_CHANNEL_X                (1<<10)
1060 #define D0_CHANNEL_Y                (2<<10)
1061 #define D0_CHANNEL_Z                (4<<10)
1062 #define D0_CHANNEL_W                (8<<10)
1063 #define D0_CHANNEL_ALL              (0xf<<10)
1064 #define D0_CHANNEL_NONE             (0<<10)
1065 
1066 #define D0_CHANNEL_XY               (D0_CHANNEL_X|D0_CHANNEL_Y)
1067 #define D0_CHANNEL_XYZ              (D0_CHANNEL_XY|D0_CHANNEL_Z)
1068 
1069 /* I915 Errata: Do not allow (xz), (xw), (xzw) combinations for diffuse
1070  * or specular declarations.
1071  *
1072  * For T dcls, only allow: (x), (xy), (xyz), (w), (xyzw)
1073  *
1074  * Must be zero for S (sampler) dcls
1075  */
1076 #define D1_MBZ                          0
1077 #define D2_MBZ                          0
1078 
1079 
1080 /* MASK_* are the unshifted bitmasks of the destination mask in arithmetic
1081  * operations
1082  */
1083 #define MASK_X			0x1
1084 #define MASK_Y			0x2
1085 #define MASK_Z			0x4
1086 #define MASK_W			0x8
1087 #define MASK_XYZ		(MASK_X | MASK_Y | MASK_Z)
1088 #define MASK_XYZW		(MASK_XYZ | MASK_W)
1089 #define MASK_SATURATE		0x10
1090 
1091 /* Temporary, undeclared regs. Preserved between phases */
1092 #define FS_R0			((REG_TYPE_R << REG_TYPE_SHIFT) | 0)
1093 #define FS_R1			((REG_TYPE_R << REG_TYPE_SHIFT) | 1)
1094 #define FS_R2			((REG_TYPE_R << REG_TYPE_SHIFT) | 2)
1095 #define FS_R3			((REG_TYPE_R << REG_TYPE_SHIFT) | 3)
1096 
1097 /* Texture coordinate regs.  Must be declared. */
1098 #define FS_T0			((REG_TYPE_T << REG_TYPE_SHIFT) | 0)
1099 #define FS_T1			((REG_TYPE_T << REG_TYPE_SHIFT) | 1)
1100 #define FS_T2			((REG_TYPE_T << REG_TYPE_SHIFT) | 2)
1101 #define FS_T3			((REG_TYPE_T << REG_TYPE_SHIFT) | 3)
1102 #define FS_T4			((REG_TYPE_T << REG_TYPE_SHIFT) | 4)
1103 #define FS_T5			((REG_TYPE_T << REG_TYPE_SHIFT) | 5)
1104 #define FS_T6			((REG_TYPE_T << REG_TYPE_SHIFT) | 6)
1105 #define FS_T7			((REG_TYPE_T << REG_TYPE_SHIFT) | 7)
1106 #define FS_T8			((REG_TYPE_T << REG_TYPE_SHIFT) | 8)
1107 #define FS_T9			((REG_TYPE_T << REG_TYPE_SHIFT) | 9)
1108 #define FS_T10			((REG_TYPE_T << REG_TYPE_SHIFT) | 10)
1109 
1110 /* Constant values */
1111 #define FS_C0			((REG_TYPE_CONST << REG_TYPE_SHIFT) | 0)
1112 #define FS_C1			((REG_TYPE_CONST << REG_TYPE_SHIFT) | 1)
1113 #define FS_C2			((REG_TYPE_CONST << REG_TYPE_SHIFT) | 2)
1114 #define FS_C3			((REG_TYPE_CONST << REG_TYPE_SHIFT) | 3)
1115 #define FS_C4			((REG_TYPE_CONST << REG_TYPE_SHIFT) | 4)
1116 #define FS_C5			((REG_TYPE_CONST << REG_TYPE_SHIFT) | 5)
1117 #define FS_C6			((REG_TYPE_CONST << REG_TYPE_SHIFT) | 6)
1118 #define FS_C7			((REG_TYPE_CONST << REG_TYPE_SHIFT) | 7)
1119 
1120 /* Sampler regs */
1121 #define FS_S0			((REG_TYPE_S << REG_TYPE_SHIFT) | 0)
1122 #define FS_S1			((REG_TYPE_S << REG_TYPE_SHIFT) | 1)
1123 #define FS_S2			((REG_TYPE_S << REG_TYPE_SHIFT) | 2)
1124 #define FS_S3			((REG_TYPE_S << REG_TYPE_SHIFT) | 3)
1125 
1126 /* Output color */
1127 #define FS_OC			((REG_TYPE_OC << REG_TYPE_SHIFT) | 0)
1128 
1129 /* Output depth */
1130 #define FS_OD			((REG_TYPE_OD << REG_TYPE_SHIFT) | 0)
1131 
1132 /* Unpreserved temporary regs */
1133 #define FS_U0			((REG_TYPE_U << REG_TYPE_SHIFT) | 0)
1134 #define FS_U1			((REG_TYPE_U << REG_TYPE_SHIFT) | 1)
1135 #define FS_U2			((REG_TYPE_U << REG_TYPE_SHIFT) | 2)
1136 #define FS_U3			((REG_TYPE_U << REG_TYPE_SHIFT) | 3)
1137 
1138 #define X_CHANNEL_SHIFT (REG_TYPE_SHIFT + 3)
1139 #define Y_CHANNEL_SHIFT (X_CHANNEL_SHIFT + 4)
1140 #define Z_CHANNEL_SHIFT (Y_CHANNEL_SHIFT + 4)
1141 #define W_CHANNEL_SHIFT (Z_CHANNEL_SHIFT + 4)
1142 
1143 #define REG_CHANNEL_MASK 0xf
1144 
1145 #define REG_NR(reg)		((reg) & REG_NR_MASK)
1146 #define REG_TYPE(reg)		(((reg) >> REG_TYPE_SHIFT) & REG_TYPE_MASK)
1147 #define REG_X(reg)		(((reg) >> X_CHANNEL_SHIFT) & REG_CHANNEL_MASK)
1148 #define REG_Y(reg)		(((reg) >> Y_CHANNEL_SHIFT) & REG_CHANNEL_MASK)
1149 #define REG_Z(reg)		(((reg) >> Z_CHANNEL_SHIFT) & REG_CHANNEL_MASK)
1150 #define REG_W(reg)		(((reg) >> W_CHANNEL_SHIFT) & REG_CHANNEL_MASK)
1151 
1152 enum gen3_fs_channel {
1153 	X_CHANNEL_VAL = 0,
1154 	Y_CHANNEL_VAL,
1155 	Z_CHANNEL_VAL,
1156 	W_CHANNEL_VAL,
1157 	ZERO_CHANNEL_VAL,
1158 	ONE_CHANNEL_VAL,
1159 
1160 	NEG_X_CHANNEL_VAL = X_CHANNEL_VAL | 0x8,
1161 	NEG_Y_CHANNEL_VAL = Y_CHANNEL_VAL | 0x8,
1162 	NEG_Z_CHANNEL_VAL = Z_CHANNEL_VAL | 0x8,
1163 	NEG_W_CHANNEL_VAL = W_CHANNEL_VAL | 0x8,
1164 	NEG_ONE_CHANNEL_VAL = ONE_CHANNEL_VAL | 0x8
1165 };
1166 
1167 #define gen3_fs_operand(reg, x, y, z, w) \
1168 	(reg) | \
1169 (x##_CHANNEL_VAL << X_CHANNEL_SHIFT) | \
1170 (y##_CHANNEL_VAL << Y_CHANNEL_SHIFT) | \
1171 (z##_CHANNEL_VAL << Z_CHANNEL_SHIFT) | \
1172 (w##_CHANNEL_VAL << W_CHANNEL_SHIFT)
1173 
1174 /**
1175  * Construct an operand description for using a register with no swizzling
1176  */
1177 #define gen3_fs_operand_reg(reg)					\
1178 	gen3_fs_operand(reg, X, Y, Z, W)
1179 
1180 #define gen3_fs_operand_reg_negate(reg)					\
1181 	gen3_fs_operand(reg, NEG_X, NEG_Y, NEG_Z, NEG_W)
1182 
1183 /**
1184  * Returns an operand containing (0.0, 0.0, 0.0, 0.0).
1185  */
1186 #define gen3_fs_operand_zero() gen3_fs_operand(FS_R0, ZERO, ZERO, ZERO, ZERO)
1187 
1188 /**
1189  * Returns an unused operand
1190  */
1191 #define gen3_fs_operand_none() gen3_fs_operand_zero()
1192 
1193 /**
1194  * Returns an operand containing (1.0, 1.0, 1.0, 1.0).
1195  */
1196 #define gen3_fs_operand_one() gen3_fs_operand(FS_R0, ONE, ONE, ONE, ONE)
1197 
1198 #define gen3_get_hardware_channel_val(val, shift, negate) \
1199 	(((val & 0x7) << shift) | ((val & 0x8) ? negate : 0))
1200 
1201 /**
1202  * Outputs a fragment shader command to declare a sampler or texture register.
1203  */
1204 #define gen3_fs_dcl(reg)						\
1205 	do {									\
1206 		OUT_BATCH(D0_DCL | \
1207 			  (REG_TYPE(reg) << D0_TYPE_SHIFT) | \
1208 			  (REG_NR(reg) << D0_NR_SHIFT) | \
1209 			  ((REG_TYPE(reg) != REG_TYPE_S) ? D0_CHANNEL_ALL : 0)); \
1210 		OUT_BATCH(0); \
1211 		OUT_BATCH(0); \
1212 	} while (0)
1213 
1214 #define gen3_fs_texld(dest_reg, sampler_reg, address_reg)		\
1215 	do {									\
1216 		OUT_BATCH(T0_TEXLD | \
1217 			  (REG_TYPE(dest_reg) << T0_DEST_TYPE_SHIFT) | \
1218 			  (REG_NR(dest_reg) << T0_DEST_NR_SHIFT) | \
1219 			  (REG_NR(sampler_reg) << T0_SAMPLER_NR_SHIFT)); \
1220 		OUT_BATCH((REG_TYPE(address_reg) << T1_ADDRESS_REG_TYPE_SHIFT) | \
1221 			  (REG_NR(address_reg) << T1_ADDRESS_REG_NR_SHIFT)); \
1222 		OUT_BATCH(0); \
1223 	} while (0)
1224 
1225 #define gen3_fs_texldp(dest_reg, sampler_reg, address_reg)		\
1226 	do {									\
1227 		OUT_BATCH(T0_TEXLDP | \
1228 			  (REG_TYPE(dest_reg) << T0_DEST_TYPE_SHIFT) | \
1229 			  (REG_NR(dest_reg) << T0_DEST_NR_SHIFT) | \
1230 			  (REG_NR(sampler_reg) << T0_SAMPLER_NR_SHIFT)); \
1231 		OUT_BATCH((REG_TYPE(address_reg) << T1_ADDRESS_REG_TYPE_SHIFT) | \
1232 			  (REG_NR(address_reg) << T1_ADDRESS_REG_NR_SHIFT)); \
1233 		OUT_BATCH(0); \
1234 	} while (0)
1235 
1236 #define gen3_fs_arith_masked(op, dest_reg, dest_mask, operand0, operand1, operand2)	\
1237 	_gen3_fs_arith_masked(A0_##op, dest_reg, dest_mask, operand0, operand1, operand2)
1238 
1239 #define gen3_fs_arith(op, dest_reg, operand0, operand1, operand2)	\
1240 	_gen3_fs_arith(A0_##op, dest_reg, operand0, operand1, operand2)
1241 
1242 #define _gen3_fs_arith_masked(cmd, dest_reg, dest_mask, operand0, operand1, operand2) \
1243 	do { \
1244 		/* Set up destination register and write mask */ \
1245 		OUT_BATCH(cmd | \
1246 			  (REG_TYPE(dest_reg) << A0_DEST_TYPE_SHIFT) | \
1247 			  (REG_NR(dest_reg) << A0_DEST_NR_SHIFT) | \
1248 			  (((dest_mask) & ~MASK_SATURATE) << A0_DEST_CHANNEL_SHIFT) | \
1249 			  (((dest_mask) & MASK_SATURATE) ? A0_DEST_SATURATE : 0) | \
1250 			  /* Set up operand 0 */ \
1251 			  (REG_TYPE(operand0) << A0_SRC0_TYPE_SHIFT) | \
1252 			  (REG_NR(operand0) << A0_SRC0_NR_SHIFT)); \
1253 		OUT_BATCH(gen3_get_hardware_channel_val(REG_X(operand0), \
1254 							A1_SRC0_CHANNEL_X_SHIFT, \
1255 							A1_SRC0_CHANNEL_X_NEGATE) | \
1256 			  gen3_get_hardware_channel_val(REG_Y(operand0), \
1257 							A1_SRC0_CHANNEL_Y_SHIFT, \
1258 							A1_SRC0_CHANNEL_Y_NEGATE) | \
1259 			  gen3_get_hardware_channel_val(REG_Z(operand0), \
1260 							A1_SRC0_CHANNEL_Z_SHIFT, \
1261 							A1_SRC0_CHANNEL_Z_NEGATE) | \
1262 			  gen3_get_hardware_channel_val(REG_W(operand0), \
1263 							A1_SRC0_CHANNEL_W_SHIFT, \
1264 							A1_SRC0_CHANNEL_W_NEGATE) | \
1265 			  /* Set up operand 1 */ \
1266 			  (REG_TYPE(operand1) << A1_SRC1_TYPE_SHIFT) | \
1267 			  (REG_NR(operand1) << A1_SRC1_NR_SHIFT) | \
1268 			  gen3_get_hardware_channel_val(REG_X(operand1), \
1269 							A1_SRC1_CHANNEL_X_SHIFT, \
1270 							A1_SRC1_CHANNEL_X_NEGATE) | \
1271 			  gen3_get_hardware_channel_val(REG_Y(operand1), \
1272 							A1_SRC1_CHANNEL_Y_SHIFT, \
1273 							A1_SRC1_CHANNEL_Y_NEGATE)); \
1274 		OUT_BATCH(gen3_get_hardware_channel_val(REG_Z(operand1), \
1275 							A2_SRC1_CHANNEL_Z_SHIFT, \
1276 							A2_SRC1_CHANNEL_Z_NEGATE) | \
1277 			  gen3_get_hardware_channel_val(REG_W(operand1), \
1278 							A2_SRC1_CHANNEL_W_SHIFT, \
1279 							A2_SRC1_CHANNEL_W_NEGATE) | \
1280 			  /* Set up operand 2 */ \
1281 			  (REG_TYPE(operand2) << A2_SRC2_TYPE_SHIFT) | \
1282 			  (REG_NR(operand2) << A2_SRC2_NR_SHIFT) | \
1283 			  gen3_get_hardware_channel_val(REG_X(operand2), \
1284 							A2_SRC2_CHANNEL_X_SHIFT, \
1285 							A2_SRC2_CHANNEL_X_NEGATE) | \
1286 			  gen3_get_hardware_channel_val(REG_Y(operand2), \
1287 							A2_SRC2_CHANNEL_Y_SHIFT, \
1288 							A2_SRC2_CHANNEL_Y_NEGATE) | \
1289 			  gen3_get_hardware_channel_val(REG_Z(operand2), \
1290 							A2_SRC2_CHANNEL_Z_SHIFT, \
1291 							A2_SRC2_CHANNEL_Z_NEGATE) | \
1292 			  gen3_get_hardware_channel_val(REG_W(operand2), \
1293 							A2_SRC2_CHANNEL_W_SHIFT, \
1294 							A2_SRC2_CHANNEL_W_NEGATE)); \
1295 	} while (0)
1296 
1297 #define _gen3_fs_arith(cmd, dest_reg, operand0, operand1, operand2) do {\
1298 	/* Set up destination register and write mask */ \
1299 	OUT_BATCH(cmd | \
1300 		  (REG_TYPE(dest_reg) << A0_DEST_TYPE_SHIFT) | \
1301 		  (REG_NR(dest_reg) << A0_DEST_NR_SHIFT) | \
1302 		  (A0_DEST_CHANNEL_ALL) | \
1303 		  /* Set up operand 0 */ \
1304 		  (REG_TYPE(operand0) << A0_SRC0_TYPE_SHIFT) | \
1305 		  (REG_NR(operand0) << A0_SRC0_NR_SHIFT)); \
1306 	OUT_BATCH(gen3_get_hardware_channel_val(REG_X(operand0), \
1307 						A1_SRC0_CHANNEL_X_SHIFT, \
1308 						A1_SRC0_CHANNEL_X_NEGATE) | \
1309 		  gen3_get_hardware_channel_val(REG_Y(operand0), \
1310 						A1_SRC0_CHANNEL_Y_SHIFT, \
1311 						A1_SRC0_CHANNEL_Y_NEGATE) | \
1312 		  gen3_get_hardware_channel_val(REG_Z(operand0), \
1313 						A1_SRC0_CHANNEL_Z_SHIFT, \
1314 						A1_SRC0_CHANNEL_Z_NEGATE) | \
1315 		  gen3_get_hardware_channel_val(REG_W(operand0), \
1316 						A1_SRC0_CHANNEL_W_SHIFT, \
1317 						A1_SRC0_CHANNEL_W_NEGATE) | \
1318 		  /* Set up operand 1 */ \
1319 		  (REG_TYPE(operand1) << A1_SRC1_TYPE_SHIFT) | \
1320 		  (REG_NR(operand1) << A1_SRC1_NR_SHIFT) | \
1321 		  gen3_get_hardware_channel_val(REG_X(operand1), \
1322 						A1_SRC1_CHANNEL_X_SHIFT, \
1323 						A1_SRC1_CHANNEL_X_NEGATE) | \
1324 		  gen3_get_hardware_channel_val(REG_Y(operand1), \
1325 						A1_SRC1_CHANNEL_Y_SHIFT, \
1326 						A1_SRC1_CHANNEL_Y_NEGATE)); \
1327 	OUT_BATCH(gen3_get_hardware_channel_val(REG_Z(operand1), \
1328 						A2_SRC1_CHANNEL_Z_SHIFT, \
1329 						A2_SRC1_CHANNEL_Z_NEGATE) | \
1330 		  gen3_get_hardware_channel_val(REG_W(operand1), \
1331 						A2_SRC1_CHANNEL_W_SHIFT, \
1332 						A2_SRC1_CHANNEL_W_NEGATE) | \
1333 		  /* Set up operand 2 */ \
1334 		  (REG_TYPE(operand2) << A2_SRC2_TYPE_SHIFT) | \
1335 		  (REG_NR(operand2) << A2_SRC2_NR_SHIFT) | \
1336 		  gen3_get_hardware_channel_val(REG_X(operand2), \
1337 						A2_SRC2_CHANNEL_X_SHIFT, \
1338 						A2_SRC2_CHANNEL_X_NEGATE) | \
1339 		  gen3_get_hardware_channel_val(REG_Y(operand2), \
1340 						A2_SRC2_CHANNEL_Y_SHIFT, \
1341 						A2_SRC2_CHANNEL_Y_NEGATE) | \
1342 		  gen3_get_hardware_channel_val(REG_Z(operand2), \
1343 						A2_SRC2_CHANNEL_Z_SHIFT, \
1344 						A2_SRC2_CHANNEL_Z_NEGATE) | \
1345 		  gen3_get_hardware_channel_val(REG_W(operand2), \
1346 						A2_SRC2_CHANNEL_W_SHIFT, \
1347 						A2_SRC2_CHANNEL_W_NEGATE)); \
1348 } while (0)
1349 
1350 #define gen3_fs_mov(dest_reg, operand0)					\
1351 	gen3_fs_arith(MOV, dest_reg, \
1352 		      operand0,			\
1353 		      gen3_fs_operand_none(),			\
1354 		      gen3_fs_operand_none())
1355 
1356 #define gen3_fs_mov_masked(dest_reg, dest_mask, operand0)		\
1357 	gen3_fs_arith_masked (MOV, dest_reg, dest_mask, \
1358 			      operand0, \
1359 			      gen3_fs_operand_none(), \
1360 			      gen3_fs_operand_none())
1361 
1362 
1363 #define gen3_fs_frc(dest_reg, operand0)					\
1364 	gen3_fs_arith (FRC, dest_reg, \
1365 		       operand0,			\
1366 		       gen3_fs_operand_none(),			\
1367 		       gen3_fs_operand_none())
1368 
1369 /** Add operand0 and operand1 and put the result in dest_reg */
1370 #define gen3_fs_add(dest_reg, operand0, operand1)			\
1371 	gen3_fs_arith (ADD, dest_reg, \
1372 		       operand0, operand1,	\
1373 		       gen3_fs_operand_none())
1374 
1375 /** Multiply operand0 and operand1 and put the result in dest_reg */
1376 #define gen3_fs_mul(dest_reg, operand0, operand1)			\
1377 	gen3_fs_arith (MUL, dest_reg, \
1378 		       operand0, operand1,	\
1379 		       gen3_fs_operand_none())
1380 
1381 /** Computes 1/(operand0.replicate_swizzle) puts the result in dest_reg */
1382 #define gen3_fs_rcp(dest_reg, dest_mask, operand0)		\
1383 	do {									\
1384 		if (dest_mask) {							\
1385 			gen3_fs_arith_masked (RCP, dest_reg, dest_mask, \
1386 					      operand0,			\
1387 					      gen3_fs_operand_none (),			\
1388 					      gen3_fs_operand_none ());			\
1389 		} else { \
1390 			gen3_fs_arith (RCP, dest_reg, \
1391 				       operand0, \
1392 				       gen3_fs_operand_none (), \
1393 				       gen3_fs_operand_none ()); \
1394 		} \
1395 	} while (0)
1396 
1397 /** Computes 1/sqrt(operand0.replicate_swizzle) puts the result in dest_reg */
1398 #define gen3_fs_rsq(dest_reg, dest_mask, operand0)		\
1399 	do {									\
1400 		if (dest_mask) {							\
1401 			gen3_fs_arith_masked (RSQ, dest_reg, dest_mask, \
1402 					      operand0,			\
1403 					      gen3_fs_operand_none (),			\
1404 					      gen3_fs_operand_none ());			\
1405 		} else { \
1406 			gen3_fs_arith (RSQ, dest_reg, \
1407 				       operand0, \
1408 				       gen3_fs_operand_none (), \
1409 				       gen3_fs_operand_none ()); \
1410 		} \
1411 	} while (0)
1412 
1413 /** Puts the minimum of operand0 and operand1 in dest_reg */
1414 #define gen3_fs_min(dest_reg, operand0, operand1)			\
1415 	gen3_fs_arith (MIN, dest_reg, \
1416 		       operand0, operand1, \
1417 		       gen3_fs_operand_none())
1418 
1419 /** Puts the maximum of operand0 and operand1 in dest_reg */
1420 #define gen3_fs_max(dest_reg, operand0, operand1)			\
1421 	gen3_fs_arith (MAX, dest_reg, \
1422 		       operand0, operand1, \
1423 		       gen3_fs_operand_none())
1424 
1425 #define gen3_fs_cmp(dest_reg, operand0, operand1, operand2)		\
1426 	gen3_fs_arith (CMP, dest_reg, operand0, operand1, operand2)
1427 
1428 /** Perform operand0 * operand1 + operand2 and put the result in dest_reg */
1429 #define gen3_fs_mad(dest_reg, dest_mask, op0, op1, op2)	\
1430 	do {									\
1431 		if (dest_mask) {							\
1432 			gen3_fs_arith_masked (MAD, dest_reg, dest_mask, op0, op1, op2); \
1433 		} else { \
1434 			gen3_fs_arith (MAD, dest_reg, op0, op1, op2); \
1435 		} \
1436 	} while (0)
1437 
1438 #define gen3_fs_dp2add(dest_reg, dest_mask, op0, op1, op2)	\
1439 	do {									\
1440 		if (dest_mask) {							\
1441 			gen3_fs_arith_masked (DP2ADD, dest_reg, dest_mask, op0, op1, op2); \
1442 		} else { \
1443 			gen3_fs_arith (DP2ADD, dest_reg, op0, op1, op2); \
1444 		} \
1445 	} while (0)
1446 
1447 /**
1448  * Perform a 3-component dot-product of operand0 and operand1 and put the
1449  * resulting scalar in the channels of dest_reg specified by the dest_mask.
1450  */
1451 #define gen3_fs_dp3(dest_reg, dest_mask, op0, op1)	\
1452 	do {									\
1453 		if (dest_mask) {							\
1454 			gen3_fs_arith_masked (DP3, dest_reg, dest_mask, \
1455 					      op0, op1,\
1456 					      gen3_fs_operand_none());			\
1457 		} else { \
1458 			gen3_fs_arith (DP3, dest_reg, op0, op1,\
1459 				       gen3_fs_operand_none());			\
1460 		} \
1461 	} while (0)
1462 
1463 /**
1464  * Perform a 4-component dot-product of operand0 and operand1 and put the
1465  * resulting scalar in the channels of dest_reg specified by the dest_mask.
1466  */
1467 #define gen3_fs_dp4(dest_reg, dest_mask, op0, op1)	\
1468 	do {									\
1469 		if (dest_mask) {							\
1470 			gen3_fs_arith_masked (DP4, dest_reg, dest_mask, \
1471 					      op0, op1,\
1472 					      gen3_fs_operand_none());			\
1473 		} else { \
1474 			gen3_fs_arith (DP4, dest_reg, op0, op1,\
1475 				       gen3_fs_operand_none());			\
1476 		} \
1477 	} while (0)
1478 
1479 #define SHADER_TRAPEZOIDS (1 << 24)
1480