1 /**********************************************************
2  * Copyright 2008-2009 VMware, Inc.  All rights reserved.
3  *
4  * Permission is hereby granted, free of charge, to any person
5  * obtaining a copy of this software and associated documentation
6  * files (the "Software"), to deal in the Software without
7  * restriction, including without limitation the rights to use, copy,
8  * modify, merge, publish, distribute, sublicense, and/or sell copies
9  * of the Software, and to permit persons to whom the Software is
10  * furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice shall be
13  * included in all copies or substantial portions of the Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  *
24  **********************************************************/
25 
26 #ifndef SVGA_CONTEXT_H
27 #define SVGA_CONTEXT_H
28 
29 
30 #include "pipe/p_context.h"
31 #include "pipe/p_defines.h"
32 #include "pipe/p_state.h"
33 
34 #include "util/os_time.h"
35 
36 #include "util/u_blitter.h"
37 #include "util/list.h"
38 
39 #include "tgsi/tgsi_scan.h"
40 
41 #include "svga_screen.h"
42 #include "svga_state.h"
43 #include "svga_winsys.h"
44 #include "svga_hw_reg.h"
45 #include "svga3d_shaderdefs.h"
46 #include "svga_debug.h"
47 
48 /** Non-GPU queries for gallium HUD */
49 enum svga_hud {
50 /* per-frame counters */
51    SVGA_QUERY_NUM_DRAW_CALLS = PIPE_QUERY_DRIVER_SPECIFIC,
52    SVGA_QUERY_NUM_FALLBACKS,
53    SVGA_QUERY_NUM_FLUSHES,
54    SVGA_QUERY_NUM_VALIDATIONS,
55    SVGA_QUERY_MAP_BUFFER_TIME,
56    SVGA_QUERY_NUM_BUFFERS_MAPPED,
57    SVGA_QUERY_NUM_TEXTURES_MAPPED,
58    SVGA_QUERY_NUM_BYTES_UPLOADED,
59    SVGA_QUERY_NUM_COMMAND_BUFFERS,
60    SVGA_QUERY_COMMAND_BUFFER_SIZE,
61    SVGA_QUERY_FLUSH_TIME,
62    SVGA_QUERY_SURFACE_WRITE_FLUSHES,
63    SVGA_QUERY_NUM_READBACKS,
64    SVGA_QUERY_NUM_RESOURCE_UPDATES,
65    SVGA_QUERY_NUM_BUFFER_UPLOADS,
66    SVGA_QUERY_NUM_CONST_BUF_UPDATES,
67    SVGA_QUERY_NUM_CONST_UPDATES,
68    SVGA_QUERY_NUM_SHADER_RELOCATIONS,
69    SVGA_QUERY_NUM_SURFACE_RELOCATIONS,
70 
71 /* running total counters */
72    SVGA_QUERY_MEMORY_USED,
73    SVGA_QUERY_NUM_SHADERS,
74    SVGA_QUERY_NUM_RESOURCES,
75    SVGA_QUERY_NUM_STATE_OBJECTS,
76    SVGA_QUERY_NUM_SURFACE_VIEWS,
77    SVGA_QUERY_NUM_GENERATE_MIPMAP,
78    SVGA_QUERY_NUM_FAILED_ALLOCATIONS,
79    SVGA_QUERY_NUM_COMMANDS_PER_DRAW,
80    SVGA_QUERY_SHADER_MEM_USED,
81 
82 /*SVGA_QUERY_MAX has to be last because it is size of an array*/
83    SVGA_QUERY_MAX
84 };
85 
86 /**
87  * Maximum supported number of constant buffers per shader
88  */
89 #define SVGA_MAX_CONST_BUFS 14
90 
91 /**
92  * Maximum constant buffer size that can be set in the
93  * DXSetSingleConstantBuffer command is
94  * DX10 constant buffer element count * 4 4-bytes components
95  */
96 #define SVGA_MAX_CONST_BUF_SIZE (4096 * 4 * sizeof(int))
97 
98 #define CONST0_UPLOAD_ALIGNMENT 256
99 
100 struct draw_vertex_shader;
101 struct draw_fragment_shader;
102 struct svga_shader_variant;
103 struct SVGACmdMemory;
104 struct util_bitmask;
105 
106 
107 struct svga_cache_context;
108 struct svga_tracked_state;
109 
110 struct svga_blend_state {
111    unsigned need_white_fragments:1;
112    unsigned independent_blend_enable:1;
113    unsigned alpha_to_coverage:1;
114    unsigned alpha_to_one:1;
115    unsigned blend_color_alpha:1;  /**< set blend color to alpha value */
116    unsigned logicop_enabled:1;
117    unsigned logicop_mode:5;
118 
119    /** Per-render target state */
120    struct {
121       uint8_t writemask;
122 
123       boolean blend_enable;
124       uint8_t srcblend;
125       uint8_t dstblend;
126       uint8_t blendeq;
127 
128       boolean separate_alpha_blend_enable;
129       uint8_t srcblend_alpha;
130       uint8_t dstblend_alpha;
131       uint8_t blendeq_alpha;
132    } rt[PIPE_MAX_COLOR_BUFS];
133 
134    SVGA3dBlendStateId id;  /**< vgpu10 */
135 };
136 
137 struct svga_depth_stencil_state {
138    unsigned zfunc:8;
139    unsigned zenable:1;
140    unsigned zwriteenable:1;
141 
142    unsigned alphatestenable:1;
143    unsigned alphafunc:8;
144 
145    struct {
146       unsigned enabled:1;
147       unsigned func:8;
148       unsigned fail:8;
149       unsigned zfail:8;
150       unsigned pass:8;
151    } stencil[2];
152 
153    /* SVGA3D has one ref/mask/writemask triple shared between front &
154     * back face stencil.  We really need two:
155     */
156    unsigned stencil_mask:8;
157    unsigned stencil_writemask:8;
158 
159    float    alpharef;
160 
161    SVGA3dDepthStencilStateId id;  /**< vgpu10 */
162 };
163 
164 #define SVGA_UNFILLED_DISABLE 0
165 #define SVGA_UNFILLED_LINE    1
166 #define SVGA_UNFILLED_POINT   2
167 
168 #define SVGA_PIPELINE_FLAG_POINTS   (1<<PIPE_PRIM_POINTS)
169 #define SVGA_PIPELINE_FLAG_LINES    (1<<PIPE_PRIM_LINES)
170 #define SVGA_PIPELINE_FLAG_TRIS     (1<<PIPE_PRIM_TRIANGLES)
171 
172 struct svga_rasterizer_state {
173    struct pipe_rasterizer_state templ; /* needed for draw module */
174 
175    unsigned shademode:8;
176    unsigned cullmode:8;
177    unsigned scissortestenable:1;
178    unsigned multisampleantialias:1;
179    unsigned antialiasedlineenable:1;
180    unsigned lastpixel:1;
181    unsigned pointsprite:1;
182 
183    unsigned linepattern;
184 
185    float slopescaledepthbias;
186    float depthbias;
187    float pointsize;
188    float linewidth;
189 
190    unsigned hw_fillmode:2;         /* PIPE_POLYGON_MODE_x */
191 
192    /** Which prims do we need help for?  Bitmask of (1 << PIPE_PRIM_x) flags */
193    unsigned need_pipeline:16;
194 
195    SVGA3dRasterizerStateId id;    /**< vgpu10 */
196 
197    /** For debugging: */
198    const char* need_pipeline_tris_str;
199    const char* need_pipeline_lines_str;
200    const char* need_pipeline_points_str;
201 };
202 
203 struct svga_sampler_state {
204    unsigned mipfilter;
205    unsigned magfilter;
206    unsigned minfilter;
207    unsigned aniso_level;
208    float lod_bias;
209    unsigned addressu;
210    unsigned addressv;
211    unsigned addressw;
212    unsigned bordercolor;
213    unsigned normalized_coords:1;
214    unsigned compare_mode:1;
215    unsigned compare_func:3;
216 
217    unsigned min_lod;
218    unsigned view_min_lod;
219    unsigned view_max_lod;
220 
221    SVGA3dSamplerId id[2];
222 };
223 
224 
225 struct svga_pipe_sampler_view
226 {
227    struct pipe_sampler_view base;
228 
229    SVGA3dShaderResourceViewId id;
230 };
231 
232 
233 static inline struct svga_pipe_sampler_view *
svga_pipe_sampler_view(struct pipe_sampler_view * v)234 svga_pipe_sampler_view(struct pipe_sampler_view *v)
235 {
236    return (struct svga_pipe_sampler_view *) v;
237 }
238 
239 
240 struct svga_velems_state {
241    unsigned count;
242    struct pipe_vertex_element velem[PIPE_MAX_ATTRIBS];
243    SVGA3dDeclType decl_type[PIPE_MAX_ATTRIBS]; /**< vertex attrib formats */
244 
245    /** Bitmasks indicating which attributes need format conversion */
246    unsigned adjust_attrib_range;     /**< range adjustment */
247    unsigned attrib_is_pure_int;      /**< pure int */
248    unsigned adjust_attrib_w_1;       /**< set w = 1 */
249    unsigned adjust_attrib_itof;      /**< int->float */
250    unsigned adjust_attrib_utof;      /**< uint->float */
251    unsigned attrib_is_bgra;          /**< R / B swizzling */
252    unsigned attrib_puint_to_snorm;   /**< 10_10_10_2 packed uint -> snorm */
253    unsigned attrib_puint_to_uscaled; /**< 10_10_10_2 packed uint -> uscaled */
254    unsigned attrib_puint_to_sscaled; /**< 10_10_10_2 packed uint -> sscaled */
255 
256    boolean need_swvfetch;
257 
258    SVGA3dElementLayoutId id; /**< VGPU10 */
259 };
260 
261 struct svga_constant_buffer {
262    struct svga_winsys_surface *handle;
263    unsigned size;
264 };
265 
266 /* Use to calculate differences between state emitted to hardware and
267  * current driver-calculated state.
268  */
269 struct svga_state
270 {
271    const struct svga_blend_state *blend;
272    const struct svga_depth_stencil_state *depth;
273    const struct svga_rasterizer_state *rast;
274    const struct svga_sampler_state *sampler[PIPE_SHADER_TYPES][PIPE_MAX_SAMPLERS];
275    const struct svga_velems_state *velems;
276 
277    struct pipe_sampler_view *sampler_views[PIPE_SHADER_TYPES][PIPE_MAX_SAMPLERS]; /* or texture ID's? */
278    struct svga_fragment_shader *fs;
279    struct svga_vertex_shader *vs;
280    struct svga_geometry_shader *user_gs; /* user-specified GS */
281    struct svga_geometry_shader *gs;      /* derived GS */
282    /* derived tessellation control shader */
283    struct svga_tcs_shader *tcs;
284    /* derived tessellation evaluation shader */
285    struct svga_tes_shader *tes;
286    struct svga_compute_shader *cs;
287 
288    struct pipe_vertex_buffer vb[PIPE_MAX_ATTRIBS];
289    /** Constant buffers for each shader.
290     * The size should probably always match with that of
291     * svga_shader_emitter_v10.num_shader_consts.
292     */
293    struct pipe_constant_buffer constbufs[PIPE_SHADER_TYPES][SVGA_MAX_CONST_BUFS];
294 
295    struct pipe_framebuffer_state framebuffer;
296    float depthscale;
297 
298    /* Hack to limit the number of different render targets between
299     * flushes.  Helps avoid blowing out our surface cache in EXA.
300     */
301    int nr_fbs;
302 
303    struct pipe_poly_stipple poly_stipple;
304    struct pipe_scissor_state scissor[SVGA3D_DX_MAX_VIEWPORTS];
305    struct pipe_blend_color blend_color;
306    struct pipe_stencil_ref stencil_ref;
307    struct pipe_clip_state clip;
308    struct pipe_viewport_state viewport[SVGA3D_DX_MAX_VIEWPORTS];
309 
310    unsigned num_samplers[PIPE_SHADER_TYPES];
311    unsigned num_sampler_views[PIPE_SHADER_TYPES];
312    unsigned num_vertex_buffers;
313    enum pipe_prim_type reduced_prim;
314 
315    unsigned vertex_id_bias;
316 
317    struct {
318       unsigned flag_1d;
319       unsigned flag_srgb;
320    } tex_flags;
321 
322    unsigned sample_mask;
323    unsigned vertices_per_patch;
324    float default_tesslevels[6]; /* tessellation (outer[4] + inner[2]) levels */
325    struct {
326       /* Determine the layout of the grid (in block units) to be used. */
327       unsigned size[3];
328       /* If DispatchIndirect is used, this will has grid size info*/
329       struct pipe_resource *indirect;
330    } grid_info;
331 };
332 
333 struct svga_prescale {
334    float translate[4];
335    float scale[4];
336    boolean enabled;
337 };
338 
339 struct svga_depthrange {
340    float zmin;
341    float zmax;
342 };
343 
344 /* Updated by calling svga_update_state( SVGA_STATE_HW_CLEAR )
345  */
346 struct svga_hw_clear_state
347 {
348    struct pipe_framebuffer_state framebuffer;
349 
350    /* VGPU9 only */
351    SVGA3dRect viewport;
352    struct svga_depthrange depthrange;
353 
354    /* VGPU10 state */
355    SVGA3dViewport viewports[SVGA3D_DX_MAX_VIEWPORTS];
356    struct svga_prescale prescale[SVGA3D_DX_MAX_VIEWPORTS];
357    struct pipe_scissor_state scissors[SVGA3D_DX_MAX_VIEWPORTS];
358    unsigned num_prescale;
359 
360    unsigned num_rendertargets;
361    struct pipe_surface *rtv[SVGA3D_MAX_RENDER_TARGETS];
362    struct pipe_surface *dsv;
363 };
364 
365 struct svga_hw_view_state
366 {
367    struct pipe_resource *texture;
368    struct svga_sampler_view *v;
369    unsigned min_lod;
370    unsigned max_lod;
371    boolean dirty;
372 };
373 
374 /* Updated by calling svga_update_state( SVGA_STATE_HW_DRAW )
375  */
376 struct svga_hw_draw_state
377 {
378    /** VGPU9 rasterization state */
379    unsigned rs[SVGA3D_RS_MAX];
380    /** VGPU9 texture sampler and bindings state */
381    unsigned ts[SVGA3D_PIXEL_SAMPLERREG_MAX][SVGA3D_TS_MAX];
382 
383    /** VGPU9 texture views */
384    unsigned num_views;
385    unsigned num_backed_views; /* views with backing copy of texture */
386    struct svga_hw_view_state views[PIPE_MAX_SAMPLERS];
387 
388    /** VGPU9 constant buffer values */
389    float cb[PIPE_SHADER_TYPES][SVGA3D_CONSTREG_MAX][4];
390 
391    /** Currently bound shaders */
392    struct svga_shader_variant *fs;
393    struct svga_shader_variant *vs;
394    struct svga_shader_variant *gs;
395    struct svga_shader_variant *tcs;
396    struct svga_shader_variant *tes;
397    struct svga_shader_variant *cs;
398 
399    /** Currently bound constant buffer, per shader stage */
400    struct pipe_resource *constbuf[PIPE_SHADER_TYPES][SVGA_MAX_CONST_BUFS];
401    struct svga_constant_buffer constbufoffsets[PIPE_SHADER_TYPES][SVGA_MAX_CONST_BUFS];
402 
403    /** Bitmask of enabled constant buffers */
404    unsigned enabled_constbufs[PIPE_SHADER_TYPES];
405 
406    /**
407     * These are used to reduce the number of times we call u_upload_unmap()
408     * while updating the zero-th/default VGPU10 constant buffer.
409     */
410    struct pipe_resource *const0_buffer;
411    struct svga_winsys_surface *const0_handle;
412 
413    /** VGPU10 HW state (used to prevent emitting redundant state) */
414    SVGA3dDepthStencilStateId depth_stencil_id;
415    unsigned stencil_ref;
416    SVGA3dBlendStateId blend_id;
417    float blend_factor[4];
418    unsigned blend_sample_mask;
419    SVGA3dRasterizerStateId rasterizer_id;
420    SVGA3dElementLayoutId layout_id;
421    SVGA3dPrimitiveType topology;
422 
423    /** Vertex buffer state */
424    SVGA3dVertexBuffer vbuffer_attrs[PIPE_MAX_ATTRIBS];
425    struct pipe_resource *vbuffers[PIPE_MAX_ATTRIBS];
426    unsigned num_vbuffers;
427 
428    struct pipe_resource *ib;  /**< index buffer for drawing */
429    SVGA3dSurfaceFormat ib_format;
430    unsigned ib_offset;
431 
432    unsigned num_samplers[PIPE_SHADER_TYPES];
433    SVGA3dSamplerId samplers[PIPE_SHADER_TYPES][PIPE_MAX_SAMPLERS];
434 
435    unsigned num_sampler_views[PIPE_SHADER_TYPES];
436    struct pipe_sampler_view
437       *sampler_views[PIPE_SHADER_TYPES][PIPE_MAX_SAMPLERS];
438 
439    /* used for rebinding */
440    unsigned default_constbuf_size[PIPE_SHADER_TYPES];
441 
442    boolean rasterizer_discard; /* set if rasterization is disabled */
443    boolean has_backed_views;   /* set if any of the rtv/dsv is a backed surface view */
444 };
445 
446 
447 /* Updated by calling svga_update_state( SVGA_STATE_NEED_SWTNL )
448  */
449 struct svga_sw_state
450 {
451    /* which parts we need */
452    boolean need_swvfetch;
453    boolean need_pipeline;
454    boolean need_swtnl;
455 
456    /* Flag to make sure that need sw is on while
457     * updating state within a swtnl call.
458     */
459    boolean in_swtnl_draw;
460 };
461 
462 
463 /* Queue some state updates (like rss) and submit them to hardware in
464  * a single packet.
465  */
466 struct svga_hw_queue;
467 
468 struct svga_query;
469 struct svga_qmem_alloc_entry;
470 
471 struct svga_context
472 {
473    struct pipe_context pipe;
474    struct svga_winsys_context *swc;
475    struct blitter_context *blitter;
476    struct u_upload_mgr *const0_upload;
477    struct u_upload_mgr *tex_upload;
478 
479    struct {
480       boolean no_swtnl;
481       boolean force_swtnl;
482       boolean use_min_mipmap;
483 
484       /* incremented for each shader */
485       unsigned shader_id;
486 
487       boolean no_line_width;
488       boolean force_hw_line_stipple;
489 
490       /** To report perf/conformance/etc issues to the gallium frontend */
491       struct pipe_debug_callback callback;
492    } debug;
493 
494    struct {
495       struct draw_context *draw;
496       struct vbuf_render *backend;
497       unsigned hw_prim;
498       boolean new_vbuf;
499       boolean new_vdecl;
500    } swtnl;
501 
502    /* Bitmask of blend state objects IDs */
503    struct util_bitmask *blend_object_id_bm;
504 
505    /* Bitmask of depth/stencil state objects IDs */
506    struct util_bitmask *ds_object_id_bm;
507 
508    /* Bitmask of input element object IDs */
509    struct util_bitmask *input_element_object_id_bm;
510 
511    /* Bitmask of rasterizer object IDs */
512    struct util_bitmask *rast_object_id_bm;
513 
514    /* Bitmask of sampler state objects IDs */
515    struct util_bitmask *sampler_object_id_bm;
516 
517    /* Bitmask of sampler view IDs */
518    struct util_bitmask *sampler_view_id_bm;
519 
520    /* Bitmask of used shader IDs */
521    struct util_bitmask *shader_id_bm;
522 
523    /* Bitmask of used surface view IDs */
524    struct util_bitmask *surface_view_id_bm;
525 
526    /* Bitmask of used stream output IDs */
527    struct util_bitmask *stream_output_id_bm;
528 
529    /* Bitmask of used query IDs */
530    struct util_bitmask *query_id_bm;
531 
532    struct {
533       uint64_t dirty[SVGA_STATE_MAX];
534 
535       /** bitmasks of which const buffers are changed */
536       unsigned dirty_constbufs[PIPE_SHADER_TYPES];
537 
538       unsigned texture_timestamp;
539 
540       struct svga_sw_state          sw;
541       struct svga_hw_draw_state     hw_draw;
542       struct svga_hw_clear_state    hw_clear;
543    } state;
544 
545    struct svga_state curr;      /* state from the gallium frontend */
546    uint64_t dirty;              /* statechanges since last update_state() */
547 
548    union {
549       struct {
550          unsigned rendertargets:1;
551          unsigned texture_samplers:1;
552          unsigned constbufs:1;
553          unsigned vs:1;
554          unsigned fs:1;
555          unsigned gs:1;
556          unsigned tcs:1;
557          unsigned tes:1;
558          unsigned cs:1;
559          unsigned query:1;
560       } flags;
561       unsigned val;
562    } rebind;
563 
564    struct svga_hwtnl *hwtnl;
565 
566    /** Queries states */
567    struct svga_winsys_gb_query *gb_query;     /**< gb query object, one per context */
568    unsigned gb_query_len;                     /**< gb query object size */
569    struct util_bitmask *gb_query_alloc_mask;  /**< gb query object allocation mask */
570    struct svga_qmem_alloc_entry *gb_query_map[SVGA_QUERY_MAX];
571                                               /**< query mem block mapping */
572    struct svga_query *sq[SVGA_QUERY_MAX+12];  /**< queries currently in progress */
573                                               /* The last 12 entries are for streamout
574                                                * queries for stream 0..3
575                                                */
576 
577    /** List of buffers with queued transfers */
578    struct list_head dirty_buffers;
579 
580    /** performance / info queries for HUD */
581    struct {
582       uint64_t num_draw_calls;          /**< SVGA_QUERY_DRAW_CALLS */
583       uint64_t num_fallbacks;           /**< SVGA_QUERY_NUM_FALLBACKS */
584       uint64_t num_flushes;             /**< SVGA_QUERY_NUM_FLUSHES */
585       uint64_t num_validations;         /**< SVGA_QUERY_NUM_VALIDATIONS */
586       uint64_t map_buffer_time;         /**< SVGA_QUERY_MAP_BUFFER_TIME */
587       uint64_t num_buffers_mapped;      /**< SVGA_QUERY_NUM_BUFFERS_MAPPED */
588       uint64_t num_textures_mapped;     /**< SVGA_QUERY_NUM_TEXTURES_MAPPED */
589       uint64_t num_command_buffers;     /**< SVGA_QUERY_NUM_COMMAND_BUFFERS */
590       uint64_t command_buffer_size;     /**< SVGA_QUERY_COMMAND_BUFFER_SIZE */
591       uint64_t flush_time;              /**< SVGA_QUERY_FLUSH_TIME */
592       uint64_t surface_write_flushes;   /**< SVGA_QUERY_SURFACE_WRITE_FLUSHES */
593       uint64_t num_readbacks;           /**< SVGA_QUERY_NUM_READBACKS */
594       uint64_t num_resource_updates;    /**< SVGA_QUERY_NUM_RESOURCE_UPDATES */
595       uint64_t num_buffer_uploads;      /**< SVGA_QUERY_NUM_BUFFER_UPLOADS */
596       uint64_t num_const_buf_updates;   /**< SVGA_QUERY_NUM_CONST_BUF_UPDATES */
597       uint64_t num_const_updates;       /**< SVGA_QUERY_NUM_CONST_UPDATES */
598       uint64_t num_shaders;             /**< SVGA_QUERY_NUM_SHADERS */
599 
600       /** The following are summed for SVGA_QUERY_NUM_STATE_OBJECTS */
601       uint64_t num_blend_objects;
602       uint64_t num_depthstencil_objects;
603       uint64_t num_rasterizer_objects;
604       uint64_t num_sampler_objects;
605       uint64_t num_samplerview_objects;
606       uint64_t num_vertexelement_objects;
607 
608       uint64_t num_surface_views;       /**< SVGA_QUERY_NUM_SURFACE_VIEWS */
609       uint64_t num_bytes_uploaded;      /**< SVGA_QUERY_NUM_BYTES_UPLOADED */
610       uint64_t num_generate_mipmap;     /**< SVGA_QUERY_NUM_GENERATE_MIPMAP */
611       uint64_t shader_mem_used;         /**< SVGA_QUERY_SHADER_MEM_USED */
612 
613       boolean uses_time;                /**< os_time_get() calls needed? */
614    } hud;
615 
616    /** The currently bound stream output targets */
617    boolean in_streamout;                /* Set if streamout is active */
618    unsigned num_so_targets;
619    struct svga_winsys_surface *so_surfaces[SVGA3D_DX_MAX_SOTARGETS];
620    struct pipe_stream_output_target *so_targets[SVGA3D_DX_MAX_SOTARGETS];
621    struct svga_stream_output *current_so;
622 
623    /**
624     * The following states are used in the workaround for auto draw with
625     * stream instancing.
626     */
627 
628    /* Last bound SO targets that can be used to get vertex count */
629    struct pipe_stream_output_target *vcount_so_targets[SVGA3D_DX_MAX_SOTARGETS];
630    unsigned vcount_buffer_stream;       /* SO buffer to stream index mask */
631    struct pipe_query *so_queries[4];    /* SO stat queries for each stream */
632 
633    /** A blend state with blending disabled, for falling back to when blending
634     * is illegal (e.g. an integer texture is bound)
635     */
636    struct svga_blend_state *noop_blend;
637 
638    struct {
639       struct pipe_resource *texture;
640       struct svga_pipe_sampler_view *sampler_view;
641       void *sampler;
642    } polygon_stipple;
643 
644    /** Alternate rasterizer states created for point sprite */
645    struct svga_rasterizer_state *rasterizer_no_cull[2];
646 
647    /** Depth stencil state created to disable depth stencil test */
648    struct svga_depth_stencil_state *depthstencil_disable;
649 
650    /** Current conditional rendering predicate */
651    struct {
652       SVGA3dQueryId query_id;
653       boolean cond;
654    } pred;
655 
656    boolean render_condition;
657    boolean disable_rasterizer; /* Set if to disable rasterization */
658    uint8_t patch_vertices;
659 
660    struct {
661       struct svga_tcs_shader *passthrough_tcs;
662       struct svga_vertex_shader *vs;
663       struct svga_tes_shader *tes;
664       unsigned vertices_per_patch;
665       boolean passthrough;
666    } tcs;
667 
668 };
669 
670 /* A flag for each frontend state object:
671  */
672 #define SVGA_NEW_BLEND               ((uint64_t) 0x1)
673 #define SVGA_NEW_DEPTH_STENCIL_ALPHA ((uint64_t) 0x2)
674 #define SVGA_NEW_RAST                ((uint64_t) 0x4)
675 #define SVGA_NEW_SAMPLER             ((uint64_t) 0x8)
676 #define SVGA_NEW_TEXTURE             ((uint64_t) 0x10)
677 #define SVGA_NEW_VBUFFER             ((uint64_t) 0x20)
678 #define SVGA_NEW_VELEMENT            ((uint64_t) 0x40)
679 #define SVGA_NEW_FS                  ((uint64_t) 0x80)
680 #define SVGA_NEW_VS                  ((uint64_t) 0x100)
681 #define SVGA_NEW_FS_CONST_BUFFER     ((uint64_t) 0x200)
682 #define SVGA_NEW_VS_CONST_BUFFER     ((uint64_t) 0x400)
683 #define SVGA_NEW_FRAME_BUFFER        ((uint64_t) 0x800)
684 #define SVGA_NEW_STIPPLE             ((uint64_t) 0x1000)
685 #define SVGA_NEW_SCISSOR             ((uint64_t) 0x2000)
686 #define SVGA_NEW_BLEND_COLOR         ((uint64_t) 0x4000)
687 #define SVGA_NEW_CLIP                ((uint64_t) 0x8000)
688 #define SVGA_NEW_VIEWPORT            ((uint64_t) 0x10000)
689 #define SVGA_NEW_PRESCALE            ((uint64_t) 0x20000)
690 #define SVGA_NEW_REDUCED_PRIMITIVE   ((uint64_t) 0x40000)
691 #define SVGA_NEW_TEXTURE_BINDING     ((uint64_t) 0x80000)
692 #define SVGA_NEW_NEED_PIPELINE       ((uint64_t) 0x100000)
693 #define SVGA_NEW_NEED_SWVFETCH       ((uint64_t) 0x200000)
694 #define SVGA_NEW_NEED_SWTNL          ((uint64_t) 0x400000)
695 #define SVGA_NEW_FS_VARIANT          ((uint64_t) 0x800000)
696 #define SVGA_NEW_VS_VARIANT          ((uint64_t) 0x1000000)
697 #define SVGA_NEW_TEXTURE_FLAGS       ((uint64_t) 0x4000000)
698 #define SVGA_NEW_STENCIL_REF         ((uint64_t) 0x8000000)
699 #define SVGA_NEW_GS                  ((uint64_t) 0x10000000)
700 #define SVGA_NEW_GS_CONST_BUFFER     ((uint64_t) 0x20000000)
701 #define SVGA_NEW_GS_VARIANT          ((uint64_t) 0x40000000)
702 #define SVGA_NEW_TEXTURE_CONSTS      ((uint64_t) 0x80000000)
703 #define SVGA_NEW_TCS                 ((uint64_t) 0x100000000)
704 #define SVGA_NEW_TES                 ((uint64_t) 0x200000000)
705 #define SVGA_NEW_TCS_VARIANT         ((uint64_t) 0x400000000)
706 #define SVGA_NEW_TES_VARIANT         ((uint64_t) 0x800000000)
707 #define SVGA_NEW_TCS_CONST_BUFFER    ((uint64_t) 0x1000000000)
708 #define SVGA_NEW_TES_CONST_BUFFER    ((uint64_t) 0x2000000000)
709 #define SVGA_NEW_TCS_PARAM           ((uint64_t) 0x4000000000)
710 #define SVGA_NEW_FS_CONSTS           ((uint64_t) 0x8000000000)
711 #define SVGA_NEW_VS_CONSTS           ((uint64_t) 0x10000000000)
712 #define SVGA_NEW_GS_CONSTS           ((uint64_t) 0x20000000000)
713 #define SVGA_NEW_TCS_CONSTS          ((uint64_t) 0x40000000000)
714 #define SVGA_NEW_TES_CONSTS          ((uint64_t) 0x800000000000)
715 #define SVGA_NEW_ALL                 ((uint64_t) 0xFFFFFFFFFFFFFFFF)
716 
717 #define SVGA_NEW_CONST_BUFFER \
718    (SVGA_NEW_FS_CONST_BUFFER | SVGA_NEW_VS_CONST_BUFFER | \
719     SVGA_NEW_GS_CONST_BUFFER | \
720     SVGA_NEW_TCS_CONST_BUFFER | SVGA_NEW_TES_CONST_BUFFER)
721 
722 
723 void svga_init_state_functions( struct svga_context *svga );
724 void svga_init_flush_functions( struct svga_context *svga );
725 void svga_init_string_functions( struct svga_context *svga );
726 void svga_init_blit_functions(struct svga_context *svga);
727 
728 void svga_init_blend_functions( struct svga_context *svga );
729 void svga_init_depth_stencil_functions( struct svga_context *svga );
730 void svga_init_misc_functions( struct svga_context *svga );
731 void svga_init_rasterizer_functions( struct svga_context *svga );
732 void svga_init_sampler_functions( struct svga_context *svga );
733 void svga_init_cs_functions( struct svga_context *svga );
734 void svga_init_fs_functions( struct svga_context *svga );
735 void svga_init_vs_functions( struct svga_context *svga );
736 void svga_init_gs_functions( struct svga_context *svga );
737 void svga_init_ts_functions( struct svga_context *svga );
738 void svga_init_vertex_functions( struct svga_context *svga );
739 void svga_init_constbuffer_functions( struct svga_context *svga );
740 void svga_init_draw_functions( struct svga_context *svga );
741 void svga_init_query_functions( struct svga_context *svga );
742 void svga_init_surface_functions(struct svga_context *svga);
743 void svga_init_stream_output_functions( struct svga_context *svga );
744 void svga_init_clear_functions( struct svga_context *svga );
745 
746 void svga_cleanup_vertex_state( struct svga_context *svga );
747 void svga_cleanup_sampler_state( struct svga_context *svga );
748 void svga_cleanup_tss_binding( struct svga_context *svga );
749 void svga_cleanup_framebuffer( struct svga_context *svga );
750 void svga_cleanup_tcs_state( struct svga_context *svga );
751 
752 void svga_context_flush( struct svga_context *svga,
753                          struct pipe_fence_handle **pfence );
754 
755 void svga_context_finish(struct svga_context *svga);
756 
757 void svga_hwtnl_flush_retry( struct svga_context *svga );
758 void svga_hwtnl_flush_buffer( struct svga_context *svga,
759                               struct pipe_resource *buffer );
760 boolean svga_hwtnl_has_pending_prim(struct svga_hwtnl *);
761 
762 void svga_surfaces_flush(struct svga_context *svga);
763 
764 struct pipe_context *
765 svga_context_create(struct pipe_screen *screen,
766                     void *priv, unsigned flags);
767 
768 void svga_toggle_render_condition(struct svga_context *svga,
769                                   boolean render_condition_enabled,
770                                   boolean on);
771 
772 /***********************************************************************
773  * Inline conversion functions.  These are better-typed than the
774  * macros used previously:
775  */
776 static inline struct svga_context *
svga_context(struct pipe_context * pipe)777 svga_context( struct pipe_context *pipe )
778 {
779    return (struct svga_context *)pipe;
780 }
781 
782 static inline struct svga_winsys_screen *
svga_sws(struct svga_context * svga)783 svga_sws(struct svga_context *svga)
784 {
785    return svga_screen(svga->pipe.screen)->sws;
786 }
787 
788 static inline boolean
svga_have_gb_objects(const struct svga_context * svga)789 svga_have_gb_objects(const struct svga_context *svga)
790 {
791    return svga_screen(svga->pipe.screen)->sws->have_gb_objects;
792 }
793 
794 static inline boolean
svga_have_gb_dma(const struct svga_context * svga)795 svga_have_gb_dma(const struct svga_context *svga)
796 {
797    return svga_screen(svga->pipe.screen)->sws->have_gb_dma;
798 }
799 
800 static inline boolean
svga_have_vgpu10(const struct svga_context * svga)801 svga_have_vgpu10(const struct svga_context *svga)
802 {
803    return svga_screen(svga->pipe.screen)->sws->have_vgpu10;
804 }
805 
806 static inline boolean
svga_have_sm4_1(const struct svga_context * svga)807 svga_have_sm4_1(const struct svga_context *svga)
808 {
809    return svga_screen(svga->pipe.screen)->sws->have_sm4_1;
810 }
811 
812 static inline boolean
svga_have_sm5(const struct svga_context * svga)813 svga_have_sm5(const struct svga_context *svga)
814 {
815    return svga_screen(svga->pipe.screen)->sws->have_sm5;
816 }
817 
818 static inline boolean
svga_need_to_rebind_resources(const struct svga_context * svga)819 svga_need_to_rebind_resources(const struct svga_context *svga)
820 {
821    return svga_screen(svga->pipe.screen)->sws->need_to_rebind_resources;
822 }
823 
824 static inline boolean
svga_rects_equal(const SVGA3dRect * r1,const SVGA3dRect * r2)825 svga_rects_equal(const SVGA3dRect *r1, const SVGA3dRect *r2)
826 {
827    return memcmp(r1, r2, sizeof(*r1)) == 0;
828 }
829 
830 /**
831  * If the Gallium HUD is enabled, this will return the current time.
832  * Otherwise, just return zero.
833  */
834 static inline int64_t
svga_get_time(struct svga_context * svga)835 svga_get_time(struct svga_context *svga)
836 {
837    return svga->hud.uses_time ? os_time_get() : 0;
838 }
839 
840 /*
841  * The SVGA_TRY_XX family of macros can be used to optionally replace a
842  * function call with an error value, the purpose is to trigger and test
843  * retry path handling.
844  */
845 #ifdef DEBUG
846 
847 /*
848  * Optionally replace a function call with a PIPE_ERROR_OUT_OF_MEMORY
849  * return value
850  */
851 #define SVGA_TRY(_func) \
852    ((SVGA_DEBUG & DEBUG_RETRY) ? PIPE_ERROR_OUT_OF_MEMORY : (_func))
853 
854 /* Optionally replace a function call with a NULL return value */
855 #define SVGA_TRY_PTR(_func) \
856    ((SVGA_DEBUG & DEBUG_RETRY) ? NULL : (_func))
857 
858 /*
859  * Optionally replace a function call with a NULL return value, and set
860  * the _retry parameter to TRUE.
861  */
862 #define SVGA_TRY_MAP(_func, _retry) \
863    ((SVGA_DEBUG & DEBUG_RETRY) ? (_retry) = TRUE, NULL : (_func))
864 #else
865 
866 #define SVGA_TRY(_func) (_func)
867 
868 #define SVGA_TRY_PTR(_func) (_func)
869 
870 #define SVGA_TRY_MAP(_func, _retry) (_func)
871 #endif
872 
873 /**
874  * Enter retry processing after hitting out-of-command space
875  */
876 static inline void
svga_retry_enter(struct svga_context * svga)877 svga_retry_enter(struct svga_context *svga)
878 {
879    /* We shouldn't nest retries, but currently we do. */
880    if ((SVGA_DEBUG & DEBUG_RETRY) && svga->swc->in_retry) {
881       debug_printf("WARNING: Recursive retry. Level: %u.\n",
882                    svga->swc->in_retry);
883    }
884    svga->swc->in_retry++;
885 }
886 
887 /**
888  * Exit retry processing after hitting out-of-command space
889  */
890 static inline void
svga_retry_exit(struct svga_context * svga)891 svga_retry_exit(struct svga_context *svga)
892 {
893    assert(svga->swc->in_retry > 0);
894    svga->swc->in_retry--;
895 }
896 
897 /**
898  * Perform a function call, and on failure flush the context and retry,
899  * asserting that the retry succeeded. On return, the boolean argument
900  * _retried indicates whether the function call was retried or not.
901  */
902 #define SVGA_RETRY_CHECK(_svga, _func, _retried)       \
903    do {                                                \
904       enum pipe_error ret;                             \
905                                                        \
906       ret = SVGA_TRY(_func);                           \
907       (_retried) = (ret != PIPE_OK);                   \
908       if (_retried) {                                  \
909          svga_retry_enter(_svga);                      \
910          svga_context_flush(_svga, NULL);              \
911          ret = (_func);                                \
912          assert(ret == PIPE_OK);                       \
913          svga_retry_exit(_svga);                       \
914       }                                                \
915    } while(0)
916 
917 /**
918  * Perform a function call, and on failure flush the context and retry,
919  * asserting that the retry succeeded.
920  */
921 #define SVGA_RETRY(_svga, _func)                \
922    do {                                         \
923       UNUSED boolean retried;                   \
924                                                 \
925       SVGA_RETRY_CHECK(_svga, _func, retried);  \
926    } while(0)
927 
928 /**
929  * Perform a function call, and on out-of-memory, flush the context and
930  * retry. The retry return value is stored in _ret for reuse.
931  */
932 #define SVGA_RETRY_OOM(_svga, _ret, _func)              \
933    do {                                                 \
934       (_ret) = SVGA_TRY(_func);                         \
935       if ((_ret) == PIPE_ERROR_OUT_OF_MEMORY) {         \
936          svga_retry_enter(_svga);                       \
937          svga_context_flush(_svga, NULL);               \
938          (_ret) = (_func);                              \
939          svga_retry_exit(_svga);                        \
940       }                                                 \
941    } while (0);
942 
943 #endif
944