1 /**********************************************************
2  * Copyright 2008-2009 VMware, Inc.  All rights reserved.
3  *
4  * Permission is hereby granted, free of charge, to any person
5  * obtaining a copy of this software and associated documentation
6  * files (the "Software"), to deal in the Software without
7  * restriction, including without limitation the rights to use, copy,
8  * modify, merge, publish, distribute, sublicense, and/or sell copies
9  * of the Software, and to permit persons to whom the Software is
10  * furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice shall be
13  * included in all copies or substantial portions of the Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  *
24  **********************************************************/
25 
26 #include "svga_cmd.h"
27 
28 #include "util/u_inlines.h"
29 #include "util/u_prim.h"
30 #include "indices/u_indices.h"
31 
32 #include "svga_hw_reg.h"
33 #include "svga_draw.h"
34 #include "svga_draw_private.h"
35 #include "svga_context.h"
36 #include "svga_shader.h"
37 
38 
39 #define DBG 0
40 
41 
42 static enum pipe_error
generate_indices(struct svga_hwtnl * hwtnl,unsigned nr,unsigned index_size,u_generate_func generate,struct pipe_resource ** out_buf)43 generate_indices(struct svga_hwtnl *hwtnl,
44                  unsigned nr,
45                  unsigned index_size,
46                  u_generate_func generate, struct pipe_resource **out_buf)
47 {
48    struct pipe_context *pipe = &hwtnl->svga->pipe;
49    struct pipe_transfer *transfer;
50    unsigned size = index_size * nr;
51    struct pipe_resource *dst = NULL;
52    void *dst_map = NULL;
53 
54    dst = pipe_buffer_create(pipe->screen, PIPE_BIND_INDEX_BUFFER,
55                             PIPE_USAGE_IMMUTABLE, size);
56    if (!dst)
57       goto fail;
58 
59    dst_map = pipe_buffer_map(pipe, dst, PIPE_MAP_WRITE, &transfer);
60    if (!dst_map)
61       goto fail;
62 
63    generate(0, nr, dst_map);
64 
65    pipe_buffer_unmap(pipe, transfer);
66 
67    *out_buf = dst;
68    return PIPE_OK;
69 
70 fail:
71    if (dst_map)
72       pipe_buffer_unmap(pipe, transfer);
73 
74    if (dst)
75       pipe->screen->resource_destroy(pipe->screen, dst);
76 
77    return PIPE_ERROR_OUT_OF_MEMORY;
78 }
79 
80 
81 static boolean
compare(unsigned cached_nr,unsigned nr,unsigned type)82 compare(unsigned cached_nr, unsigned nr, unsigned type)
83 {
84    if (type == U_GENERATE_REUSABLE)
85       return cached_nr >= nr;
86    else
87       return cached_nr == nr;
88 }
89 
90 
91 static enum pipe_error
retrieve_or_generate_indices(struct svga_hwtnl * hwtnl,enum pipe_prim_type prim,unsigned gen_type,unsigned gen_nr,unsigned gen_size,u_generate_func generate,struct pipe_resource ** out_buf)92 retrieve_or_generate_indices(struct svga_hwtnl *hwtnl,
93                              enum pipe_prim_type prim,
94                              unsigned gen_type,
95                              unsigned gen_nr,
96                              unsigned gen_size,
97                              u_generate_func generate,
98                              struct pipe_resource **out_buf)
99 {
100    enum pipe_error ret = PIPE_OK;
101    int i;
102 
103    SVGA_STATS_TIME_PUSH(svga_sws(hwtnl->svga), SVGA_STATS_TIME_GENERATEINDICES);
104 
105    for (i = 0; i < IDX_CACHE_MAX; i++) {
106       if (hwtnl->index_cache[prim][i].buffer != NULL &&
107           hwtnl->index_cache[prim][i].generate == generate) {
108          if (compare(hwtnl->index_cache[prim][i].gen_nr, gen_nr, gen_type)) {
109             pipe_resource_reference(out_buf,
110                                     hwtnl->index_cache[prim][i].buffer);
111 
112             if (DBG)
113                debug_printf("%s retrieve %d/%d\n", __FUNCTION__, i, gen_nr);
114 
115             goto done;
116          }
117          else if (gen_type == U_GENERATE_REUSABLE) {
118             pipe_resource_reference(&hwtnl->index_cache[prim][i].buffer,
119                                     NULL);
120 
121             if (DBG)
122                debug_printf("%s discard %d/%d\n", __FUNCTION__,
123                             i, hwtnl->index_cache[prim][i].gen_nr);
124 
125             break;
126          }
127       }
128    }
129 
130    if (i == IDX_CACHE_MAX) {
131       unsigned smallest = 0;
132       unsigned smallest_size = ~0;
133 
134       for (i = 0; i < IDX_CACHE_MAX && smallest_size; i++) {
135          if (hwtnl->index_cache[prim][i].buffer == NULL) {
136             smallest = i;
137             smallest_size = 0;
138          }
139          else if (hwtnl->index_cache[prim][i].gen_nr < smallest) {
140             smallest = i;
141             smallest_size = hwtnl->index_cache[prim][i].gen_nr;
142          }
143       }
144 
145       assert(smallest != IDX_CACHE_MAX);
146 
147       pipe_resource_reference(&hwtnl->index_cache[prim][smallest].buffer,
148                               NULL);
149 
150       if (DBG)
151          debug_printf("%s discard smallest %d/%d\n", __FUNCTION__,
152                       smallest, smallest_size);
153 
154       i = smallest;
155    }
156 
157    ret = generate_indices(hwtnl, gen_nr, gen_size, generate, out_buf);
158    if (ret != PIPE_OK)
159       goto done;
160 
161    hwtnl->index_cache[prim][i].generate = generate;
162    hwtnl->index_cache[prim][i].gen_nr = gen_nr;
163    pipe_resource_reference(&hwtnl->index_cache[prim][i].buffer, *out_buf);
164 
165    if (DBG)
166       debug_printf("%s cache %d/%d\n", __FUNCTION__,
167                    i, hwtnl->index_cache[prim][i].gen_nr);
168 
169 done:
170    SVGA_STATS_TIME_POP(svga_sws(hwtnl->svga));
171    return ret;
172 }
173 
174 
175 static enum pipe_error
simple_draw_arrays(struct svga_hwtnl * hwtnl,enum pipe_prim_type prim,unsigned start,unsigned count,unsigned start_instance,unsigned instance_count,ubyte vertices_per_patch)176 simple_draw_arrays(struct svga_hwtnl *hwtnl,
177                    enum pipe_prim_type prim, unsigned start, unsigned count,
178                    unsigned start_instance, unsigned instance_count,
179                    ubyte vertices_per_patch)
180 {
181    SVGA3dPrimitiveRange range;
182    unsigned hw_prim;
183    unsigned hw_count;
184 
185    hw_prim = svga_translate_prim(prim, count, &hw_count, vertices_per_patch);
186    if (hw_count == 0)
187       return PIPE_ERROR_BAD_INPUT;
188 
189    range.primType = hw_prim;
190    range.primitiveCount = hw_count;
191    range.indexArray.surfaceId = SVGA3D_INVALID_ID;
192    range.indexArray.offset = 0;
193    range.indexArray.stride = 0;
194    range.indexWidth = 0;
195    range.indexBias = start;
196 
197    /* Min/max index should be calculated prior to applying bias, so we
198     * end up with min_index = 0, max_index = count - 1 and everybody
199     * looking at those numbers knows to adjust them by
200     * range.indexBias.
201     */
202    return svga_hwtnl_prim(hwtnl, &range, count,
203                           0, count - 1, NULL,
204                           start_instance, instance_count,
205                           NULL, NULL);
206 }
207 
208 
209 enum pipe_error
svga_hwtnl_draw_arrays(struct svga_hwtnl * hwtnl,enum pipe_prim_type prim,unsigned start,unsigned count,unsigned start_instance,unsigned instance_count,ubyte vertices_per_patch)210 svga_hwtnl_draw_arrays(struct svga_hwtnl *hwtnl,
211                        enum pipe_prim_type prim, unsigned start, unsigned count,
212                        unsigned start_instance, unsigned instance_count,
213                        ubyte vertices_per_patch)
214 {
215    enum pipe_prim_type gen_prim;
216    unsigned gen_size, gen_nr;
217    enum indices_mode gen_type;
218    u_generate_func gen_func;
219    enum pipe_error ret = PIPE_OK;
220    unsigned api_pv = hwtnl->api_pv;
221    struct svga_context *svga = hwtnl->svga;
222 
223    SVGA_STATS_TIME_PUSH(svga_sws(svga), SVGA_STATS_TIME_HWTNLDRAWARRAYS);
224 
225    if (svga->curr.rast->templ.fill_front !=
226        svga->curr.rast->templ.fill_back) {
227       assert(hwtnl->api_fillmode == PIPE_POLYGON_MODE_FILL);
228    }
229 
230    if (svga->curr.rast->templ.flatshade &&
231          svga_fs_variant(svga->state.hw_draw.fs)->constant_color_output) {
232       /* The fragment color is a constant, not per-vertex so the whole
233        * primitive will be the same color (except for possible blending).
234        * We can ignore the current provoking vertex state and use whatever
235        * the hardware wants.
236        */
237       api_pv = hwtnl->hw_pv;
238 
239       if (hwtnl->api_fillmode == PIPE_POLYGON_MODE_FILL) {
240          /* Do some simple primitive conversions to avoid index buffer
241           * generation below.  Note that polygons and quads are not directly
242           * supported by the svga device.  Also note, we can only do this
243           * for flat/constant-colored rendering because of provoking vertex.
244           */
245          if (prim == PIPE_PRIM_POLYGON) {
246             prim = PIPE_PRIM_TRIANGLE_FAN;
247          }
248          else if (prim == PIPE_PRIM_QUADS && count == 4) {
249             prim = PIPE_PRIM_TRIANGLE_FAN;
250          }
251       }
252    }
253 
254    if (svga_need_unfilled_fallback(hwtnl, prim)) {
255       /* Convert unfilled polygons into points, lines, triangles */
256       gen_type = u_unfilled_generator(prim,
257                                       start,
258                                       count,
259                                       hwtnl->api_fillmode,
260                                       &gen_prim,
261                                       &gen_size, &gen_nr, &gen_func);
262    }
263    else {
264       /* Convert PIPE_PRIM_LINE_LOOP to PIPE_PRIM_LINESTRIP,
265        * convert PIPE_PRIM_POLYGON to PIPE_PRIM_TRIANGLE_FAN,
266        * etc, if needed (as determined by svga_hw_prims mask).
267        */
268       gen_type = u_index_generator(svga_hw_prims,
269                                    prim,
270                                    start,
271                                    count,
272                                    api_pv,
273                                    hwtnl->hw_pv,
274                                    &gen_prim, &gen_size, &gen_nr, &gen_func);
275    }
276 
277    if (gen_type == U_GENERATE_LINEAR) {
278       ret = simple_draw_arrays(hwtnl, gen_prim, start, count,
279                                start_instance, instance_count,
280                                vertices_per_patch);
281    }
282    else {
283       struct pipe_resource *gen_buf = NULL;
284 
285       /* Need to draw as indexed primitive.
286        * Potentially need to run the gen func to build an index buffer.
287        */
288       ret = retrieve_or_generate_indices(hwtnl,
289                                          prim,
290                                          gen_type,
291                                          gen_nr,
292                                          gen_size, gen_func, &gen_buf);
293       if (ret == PIPE_OK) {
294          pipe_debug_message(&svga->debug.callback, PERF_INFO,
295                             "generating temporary index buffer for drawing %s",
296                             u_prim_name(prim));
297 
298          ret = svga_hwtnl_simple_draw_range_elements(hwtnl,
299                                                      gen_buf,
300                                                      gen_size,
301                                                      start,
302                                                      0,
303                                                      count - 1,
304                                                      gen_prim, 0, gen_nr,
305                                                      start_instance,
306                                                      instance_count,
307                                                      vertices_per_patch);
308       }
309 
310       if (gen_buf) {
311          pipe_resource_reference(&gen_buf, NULL);
312       }
313    }
314 
315    SVGA_STATS_TIME_POP(svga_sws(svga));
316    return ret;
317 }
318