1 /*
2 * Copyright 2002-2005 Jason Edmeades
3 * Copyright 2002-2005 Raphael Junqueira
4 * Copyright 2004 Christian Costa
5 * Copyright 2005 Oliver Stieber
6 * Copyright 2007-2011, 2013-2014 Stefan Dösinger for CodeWeavers
7 * Copyright 2009-2010 Henri Verbeet for CodeWeavers
8 *
9 * This library is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
13 *
14 * This library is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
18 *
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with this library; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
22 *
23 */
24
25 #include "config.h"
26 #include "wine/port.h"
27
28 #include "wined3d_private.h"
29
30 WINE_DEFAULT_DEBUG_CHANNEL(d3d);
31
/* Internal flag bits that this file tests and updates in wined3d_buffer.flags. */
#define WINED3D_BUFFER_HASDESC      0x01    /* A vertex description has been found. */
#define WINED3D_BUFFER_USE_BO       0x02    /* Use a buffer object for this buffer. */
#define WINED3D_BUFFER_PIN_SYSMEM   0x04    /* Keep a system memory copy for this buffer. */
#define WINED3D_BUFFER_DISCARD      0x08    /* A DISCARD lock has occurred since the last preload. */
#define WINED3D_BUFFER_APPLESYNC    0x10    /* Using sync as in GL_APPLE_flush_buffer_range. */

/* Thresholds that bound how often vertex data conversion is attempted. */
#define VB_MAXDECLCHANGES     100   /* After that number of decl changes we stop converting */
#define VB_RESETDECLCHANGE    1000  /* Reset the decl changecount after that number of draws */
#define VB_MAXFULLCONVERSIONS 5     /* Number of full conversions before we stop converting */
#define VB_RESETFULLCONVS     20    /* Reset full conversion counts after that number of draws */
42
wined3d_buffer_evict_sysmem(struct wined3d_buffer * buffer)43 static void wined3d_buffer_evict_sysmem(struct wined3d_buffer *buffer)
44 {
45 if (buffer->flags & WINED3D_BUFFER_PIN_SYSMEM)
46 {
47 TRACE("Not evicting system memory for buffer %p.\n", buffer);
48 return;
49 }
50
51 TRACE("Evicting system memory for buffer %p.\n", buffer);
52 wined3d_buffer_invalidate_location(buffer, WINED3D_LOCATION_SYSMEM);
53 wined3d_resource_free_sysmem(&buffer->resource);
54 }
55
buffer_invalidate_bo_range(struct wined3d_buffer * buffer,unsigned int offset,unsigned int size)56 static void buffer_invalidate_bo_range(struct wined3d_buffer *buffer, unsigned int offset, unsigned int size)
57 {
58 if (!offset && (!size || size == buffer->resource.size))
59 goto invalidate_all;
60
61 if (offset > buffer->resource.size || size > buffer->resource.size - offset)
62 {
63 WARN("Invalid range specified, invalidating entire buffer.\n");
64 goto invalidate_all;
65 }
66
67 if (!wined3d_array_reserve((void **)&buffer->maps, &buffer->maps_size,
68 buffer->modified_areas + 1, sizeof(*buffer->maps)))
69 {
70 ERR("Failed to allocate maps array, invalidating entire buffer.\n");
71 goto invalidate_all;
72 }
73
74 buffer->maps[buffer->modified_areas].offset = offset;
75 buffer->maps[buffer->modified_areas].size = size;
76 ++buffer->modified_areas;
77 return;
78
79 invalidate_all:
80 buffer->modified_areas = 1;
81 buffer->maps[0].offset = 0;
82 buffer->maps[0].size = buffer->resource.size;
83 }
84
buffer_clear_dirty_areas(struct wined3d_buffer * This)85 static inline void buffer_clear_dirty_areas(struct wined3d_buffer *This)
86 {
87 This->modified_areas = 0;
88 }
89
buffer_is_dirty(const struct wined3d_buffer * buffer)90 static BOOL buffer_is_dirty(const struct wined3d_buffer *buffer)
91 {
92 return !!buffer->modified_areas;
93 }
94
buffer_is_fully_dirty(const struct wined3d_buffer * buffer)95 static BOOL buffer_is_fully_dirty(const struct wined3d_buffer *buffer)
96 {
97 return buffer->modified_areas == 1
98 && !buffer->maps->offset && buffer->maps->size == buffer->resource.size;
99 }
100
/* Mark the given location(s) as up to date. Validating the buffer object
 * location also discards the list of modified areas. */
static void wined3d_buffer_validate_location(struct wined3d_buffer *buffer, DWORD location)
{
    TRACE("buffer %p, location %s.\n", buffer, wined3d_debug_location(location));

    buffer->locations |= location;
    if (location & WINED3D_LOCATION_BUFFER)
        buffer_clear_dirty_areas(buffer);

    TRACE("New locations flags are %s.\n", wined3d_debug_location(buffer->locations));
}
112
/* Mark the given location(s) as out of date. When the buffer object
 * location is among them, [offset, offset + size) is additionally recorded
 * as a modified area. An error is logged if no location remains valid. */
static void wined3d_buffer_invalidate_range(struct wined3d_buffer *buffer, DWORD location,
        unsigned int offset, unsigned int size)
{
    const BOOL touches_bo = !!(location & WINED3D_LOCATION_BUFFER);

    TRACE("buffer %p, location %s, offset %u, size %u.\n",
            buffer, wined3d_debug_location(location), offset, size);

    if (touches_bo)
        buffer_invalidate_bo_range(buffer, offset, size);

    buffer->locations &= ~location;

    TRACE("New locations flags are %s.\n", wined3d_debug_location(buffer->locations));

    if (buffer->locations)
        return;

    ERR("Buffer %p does not have any up to date location.\n", buffer);
}
129
/* Invalidate the given location(s) for the whole buffer; an offset/size
 * pair of 0/0 is what buffer_invalidate_bo_range() treats as "everything". */
void wined3d_buffer_invalidate_location(struct wined3d_buffer *buffer, DWORD location)
{
    const unsigned int whole_offset = 0, whole_size = 0;

    wined3d_buffer_invalidate_range(buffer, location, whole_offset, whole_size);
}
134
135 /* Context activation is done by the caller. */
buffer_bind(struct wined3d_buffer * buffer,struct wined3d_context * context)136 static void buffer_bind(struct wined3d_buffer *buffer, struct wined3d_context *context)
137 {
138 context_bind_bo(context, buffer->buffer_type_hint, buffer->buffer_object);
139 }
140
141 /* Context activation is done by the caller. */
buffer_destroy_buffer_object(struct wined3d_buffer * buffer,struct wined3d_context * context)142 static void buffer_destroy_buffer_object(struct wined3d_buffer *buffer, struct wined3d_context *context)
143 {
144 const struct wined3d_gl_info *gl_info = context->gl_info;
145 struct wined3d_resource *resource = &buffer->resource;
146
147 if (!buffer->buffer_object)
148 return;
149
150 /* The stream source state handler might have read the memory of the
151 * vertex buffer already and got the memory in the vbo which is not
152 * valid any longer. Dirtify the stream source to force a reload. This
153 * happens only once per changed vertexbuffer and should occur rather
154 * rarely. */
155 if (resource->bind_count)
156 {
157 if (buffer->bind_flags & WINED3D_BIND_VERTEX_BUFFER)
158 device_invalidate_state(resource->device, STATE_STREAMSRC);
159 if (buffer->bind_flags & WINED3D_BIND_INDEX_BUFFER)
160 device_invalidate_state(resource->device, STATE_INDEXBUFFER);
161 if (buffer->bind_flags & WINED3D_BIND_CONSTANT_BUFFER)
162 {
163 device_invalidate_state(resource->device, STATE_CONSTANT_BUFFER(WINED3D_SHADER_TYPE_VERTEX));
164 device_invalidate_state(resource->device, STATE_CONSTANT_BUFFER(WINED3D_SHADER_TYPE_HULL));
165 device_invalidate_state(resource->device, STATE_CONSTANT_BUFFER(WINED3D_SHADER_TYPE_DOMAIN));
166 device_invalidate_state(resource->device, STATE_CONSTANT_BUFFER(WINED3D_SHADER_TYPE_GEOMETRY));
167 device_invalidate_state(resource->device, STATE_CONSTANT_BUFFER(WINED3D_SHADER_TYPE_PIXEL));
168 device_invalidate_state(resource->device, STATE_CONSTANT_BUFFER(WINED3D_SHADER_TYPE_COMPUTE));
169 }
170 if (buffer->bind_flags & WINED3D_BIND_STREAM_OUTPUT)
171 {
172 device_invalidate_state(resource->device, STATE_STREAM_OUTPUT);
173 if (context->transform_feedback_active)
174 {
175 /* We have to make sure that transform feedback is not active
176 * when deleting a potentially bound transform feedback buffer.
177 * This may happen when the device is being destroyed. */
178 WARN("Deleting buffer object for buffer %p, disabling transform feedback.\n", buffer);
179 context_end_transform_feedback(context);
180 }
181 }
182 }
183
184 GL_EXTCALL(glDeleteBuffers(1, &buffer->buffer_object));
185 checkGLcall("glDeleteBuffers");
186 buffer->buffer_object = 0;
187
188 if (buffer->fence)
189 {
190 wined3d_fence_destroy(buffer->fence);
191 buffer->fence = NULL;
192 }
193 buffer->flags &= ~WINED3D_BUFFER_APPLESYNC;
194 }
195
196 /* Context activation is done by the caller. */
buffer_create_buffer_object(struct wined3d_buffer * buffer,struct wined3d_context * context)197 static BOOL buffer_create_buffer_object(struct wined3d_buffer *buffer, struct wined3d_context *context)
198 {
199 const struct wined3d_gl_info *gl_info = context->gl_info;
200 GLenum gl_usage = GL_STATIC_DRAW;
201 GLenum error;
202
203 TRACE("Creating an OpenGL buffer object for wined3d_buffer %p with usage %s.\n",
204 buffer, debug_d3dusage(buffer->resource.usage));
205
206 /* Make sure that the gl error is cleared. Do not use checkGLcall
207 * here because checkGLcall just prints a fixme and continues. However,
208 * if an error during VBO creation occurs we can fall back to non-VBO operation
209 * with full functionality(but performance loss).
210 */
211 while (gl_info->gl_ops.gl.p_glGetError() != GL_NO_ERROR);
212
213 /* Basically the FVF parameter passed to CreateVertexBuffer is no good.
214 * The vertex declaration from the device determines how the data in the
215 * buffer is interpreted. This means that on each draw call the buffer has
216 * to be verified to check if the rhw and color values are in the correct
217 * format. */
218
219 GL_EXTCALL(glGenBuffers(1, &buffer->buffer_object));
220 error = gl_info->gl_ops.gl.p_glGetError();
221 if (!buffer->buffer_object || error != GL_NO_ERROR)
222 {
223 ERR("Failed to create a BO with error %s (%#x).\n", debug_glerror(error), error);
224 goto fail;
225 }
226
227 buffer_bind(buffer, context);
228 error = gl_info->gl_ops.gl.p_glGetError();
229 if (error != GL_NO_ERROR)
230 {
231 ERR("Failed to bind the BO with error %s (%#x).\n", debug_glerror(error), error);
232 goto fail;
233 }
234
235 if (buffer->resource.usage & WINED3DUSAGE_DYNAMIC)
236 {
237 TRACE("Buffer has WINED3DUSAGE_DYNAMIC set.\n");
238 gl_usage = GL_STREAM_DRAW_ARB;
239
240 if (gl_info->supported[APPLE_FLUSH_BUFFER_RANGE])
241 {
242 GL_EXTCALL(glBufferParameteriAPPLE(buffer->buffer_type_hint, GL_BUFFER_FLUSHING_UNMAP_APPLE, GL_FALSE));
243 GL_EXTCALL(glBufferParameteriAPPLE(buffer->buffer_type_hint, GL_BUFFER_SERIALIZED_MODIFY_APPLE, GL_FALSE));
244 checkGLcall("glBufferParameteriAPPLE");
245 buffer->flags |= WINED3D_BUFFER_APPLESYNC;
246 }
247 /* No setup is needed here for GL_ARB_map_buffer_range. */
248 }
249
250 GL_EXTCALL(glBufferData(buffer->buffer_type_hint, buffer->resource.size, NULL, gl_usage));
251 error = gl_info->gl_ops.gl.p_glGetError();
252 if (error != GL_NO_ERROR)
253 {
254 ERR("glBufferData failed with error %s (%#x).\n", debug_glerror(error), error);
255 goto fail;
256 }
257
258 buffer->buffer_object_usage = gl_usage;
259 buffer_invalidate_bo_range(buffer, 0, 0);
260
261 return TRUE;
262
263 fail:
264 /* Clean up all BO init, but continue because we can work without a BO :-) */
265 ERR("Failed to create a buffer object. Continuing, but performance issues may occur.\n");
266 buffer->flags &= ~WINED3D_BUFFER_USE_BO;
267 buffer_destroy_buffer_object(buffer, context);
268 buffer_clear_dirty_areas(buffer);
269 return FALSE;
270 }
271
buffer_process_converted_attribute(struct wined3d_buffer * buffer,const enum wined3d_buffer_conversion_type conversion_type,const struct wined3d_stream_info_element * attrib,DWORD * stride_this_run)272 static BOOL buffer_process_converted_attribute(struct wined3d_buffer *buffer,
273 const enum wined3d_buffer_conversion_type conversion_type,
274 const struct wined3d_stream_info_element *attrib, DWORD *stride_this_run)
275 {
276 const struct wined3d_format *format = attrib->format;
277 BOOL ret = FALSE;
278 unsigned int i;
279 DWORD_PTR data;
280
281 /* Check for some valid situations which cause us pain. One is if the buffer is used for
282 * constant attributes(stride = 0), the other one is if the buffer is used on two streams
283 * with different strides. In the 2nd case we might have to drop conversion entirely,
284 * it is possible that the same bytes are once read as FLOAT2 and once as UBYTE4N.
285 */
286 if (!attrib->stride)
287 {
288 FIXME("%s used with stride 0, let's hope we get the vertex stride from somewhere else.\n",
289 debug_d3dformat(format->id));
290 }
291 else if (attrib->stride != *stride_this_run && *stride_this_run)
292 {
293 FIXME("Got two concurrent strides, %d and %d.\n", attrib->stride, *stride_this_run);
294 }
295 else
296 {
297 *stride_this_run = attrib->stride;
298 if (buffer->stride != *stride_this_run)
299 {
300 /* We rely that this happens only on the first converted attribute that is found,
301 * if at all. See above check
302 */
303 TRACE("Reconverting because converted attributes occur, and the stride changed.\n");
304 buffer->stride = *stride_this_run;
305 heap_free(buffer->conversion_map);
306 buffer->conversion_map = heap_calloc(buffer->stride, sizeof(*buffer->conversion_map));
307 ret = TRUE;
308 }
309 }
310
311 data = ((DWORD_PTR)attrib->data.addr) % buffer->stride;
312 for (i = 0; i < format->attribute_size; ++i)
313 {
314 DWORD_PTR idx = (data + i) % buffer->stride;
315 if (buffer->conversion_map[idx] != conversion_type)
316 {
317 TRACE("Byte %lu in vertex changed:\n", idx);
318 TRACE(" It was type %#x, is %#x now.\n", buffer->conversion_map[idx], conversion_type);
319 ret = TRUE;
320 buffer->conversion_map[idx] = conversion_type;
321 }
322 }
323
324 return ret;
325 }
326
/* Bits of the fixup_flags argument taken by buffer_check_attribute() and
 * buffer_find_decl(); each one enables detection of one conversion type. */
#define WINED3D_BUFFER_FIXUP_D3DCOLOR   0x01
#define WINED3D_BUFFER_FIXUP_XYZRHW     0x02
329
buffer_check_attribute(struct wined3d_buffer * This,const struct wined3d_stream_info * si,const struct wined3d_state * state,UINT attrib_idx,DWORD fixup_flags,DWORD * stride_this_run)330 static BOOL buffer_check_attribute(struct wined3d_buffer *This, const struct wined3d_stream_info *si,
331 const struct wined3d_state *state, UINT attrib_idx, DWORD fixup_flags, DWORD *stride_this_run)
332 {
333 const struct wined3d_stream_info_element *attrib = &si->elements[attrib_idx];
334 enum wined3d_format_id format;
335 BOOL ret = FALSE;
336
337 /* Ignore attributes that do not have our vbo. After that check we can be sure that the attribute is
338 * there, on nonexistent attribs the vbo is 0.
339 */
340 if (!(si->use_map & (1u << attrib_idx))
341 || state->streams[attrib->stream_idx].buffer != This)
342 return FALSE;
343
344 format = attrib->format->id;
345 /* Look for newly appeared conversion */
346 if (fixup_flags & WINED3D_BUFFER_FIXUP_D3DCOLOR && format == WINED3DFMT_B8G8R8A8_UNORM)
347 {
348 ret = buffer_process_converted_attribute(This, CONV_D3DCOLOR, attrib, stride_this_run);
349 }
350 else if (fixup_flags & WINED3D_BUFFER_FIXUP_XYZRHW && si->position_transformed)
351 {
352 if (format != WINED3DFMT_R32G32B32A32_FLOAT)
353 {
354 FIXME("Unexpected format %s for transformed position.\n", debug_d3dformat(format));
355 return FALSE;
356 }
357
358 ret = buffer_process_converted_attribute(This, CONV_POSITIONT, attrib, stride_this_run);
359 }
360 else if (This->conversion_map)
361 {
362 ret = buffer_process_converted_attribute(This, CONV_NONE, attrib, stride_this_run);
363 }
364
365 return ret;
366 }
367
buffer_find_decl(struct wined3d_buffer * This,const struct wined3d_stream_info * si,const struct wined3d_state * state,DWORD fixup_flags)368 static BOOL buffer_find_decl(struct wined3d_buffer *This, const struct wined3d_stream_info *si,
369 const struct wined3d_state *state, DWORD fixup_flags)
370 {
371 UINT stride_this_run = 0;
372 BOOL ret = FALSE;
373
374 /* In d3d7 the vertex buffer declaration NEVER changes because it is stored in the d3d7 vertex buffer.
375 * Once we have our declaration there is no need to look it up again. Index buffers also never need
376 * conversion, so once the (empty) conversion structure is created don't bother checking again
377 */
378 if (This->flags & WINED3D_BUFFER_HASDESC)
379 {
380 if(This->resource.usage & WINED3DUSAGE_STATICDECL) return FALSE;
381 }
382
383 if (!fixup_flags)
384 {
385 TRACE("No fixup required.\n");
386 if(This->conversion_map)
387 {
388 heap_free(This->conversion_map);
389 This->conversion_map = NULL;
390 This->stride = 0;
391 return TRUE;
392 }
393
394 return FALSE;
395 }
396
397 TRACE("Finding vertex buffer conversion information\n");
398 /* Certain declaration types need some fixups before we can pass them to
399 * opengl. This means D3DCOLOR attributes with fixed function vertex
400 * processing, FLOAT4 POSITIONT with fixed function, and FLOAT16 if
401 * GL_ARB_half_float_vertex is not supported.
402 *
403 * Note for d3d8 and d3d9:
404 * The vertex buffer FVF doesn't help with finding them, we have to use
405 * the decoded vertex declaration and pick the things that concern the
406 * current buffer. A problem with this is that this can change between
407 * draws, so we have to validate the information and reprocess the buffer
408 * if it changes, and avoid false positives for performance reasons.
409 * WineD3D doesn't even know the vertex buffer any more, it is managed
410 * by the client libraries and passed to SetStreamSource and ProcessVertices
411 * as needed.
412 *
413 * We have to distinguish between vertex shaders and fixed function to
414 * pick the way we access the strided vertex information.
415 *
416 * This code sets up a per-byte array with the size of the detected
417 * stride of the arrays in the buffer. For each byte we have a field
418 * that marks the conversion needed on this byte. For example, the
419 * following declaration with fixed function vertex processing:
420 *
421 * POSITIONT, FLOAT4
422 * NORMAL, FLOAT3
423 * DIFFUSE, FLOAT16_4
424 * SPECULAR, D3DCOLOR
425 *
426 * Will result in
427 * { POSITIONT }{ NORMAL }{ DIFFUSE }{SPECULAR }
428 * [P][P][P][P][P][P][P][P][P][P][P][P][P][P][P][P][0][0][0][0][0][0][0][0][0][0][0][0][F][F][F][F][F][F][F][F][C][C][C][C]
429 *
430 * Where in this example map P means 4 component position conversion, 0
431 * means no conversion, F means FLOAT16_2 conversion and C means D3DCOLOR
432 * conversion (red / blue swizzle).
433 *
434 * If we're doing conversion and the stride changes we have to reconvert
435 * the whole buffer. Note that we do not mind if the semantic changes,
436 * we only care for the conversion type. So if the NORMAL is replaced
437 * with a TEXCOORD, nothing has to be done, or if the DIFFUSE is replaced
438 * with a D3DCOLOR BLENDWEIGHT we can happily dismiss the change. Some
439 * conversion types depend on the semantic as well, for example a FLOAT4
440 * texcoord needs no conversion while a FLOAT4 positiont needs one
441 */
442
443 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_POSITION,
444 fixup_flags, &stride_this_run) || ret;
445 fixup_flags &= ~WINED3D_BUFFER_FIXUP_XYZRHW;
446
447 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_BLENDWEIGHT,
448 fixup_flags, &stride_this_run) || ret;
449 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_BLENDINDICES,
450 fixup_flags, &stride_this_run) || ret;
451 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_NORMAL,
452 fixup_flags, &stride_this_run) || ret;
453 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_DIFFUSE,
454 fixup_flags, &stride_this_run) || ret;
455 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_SPECULAR,
456 fixup_flags, &stride_this_run) || ret;
457 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_TEXCOORD0,
458 fixup_flags, &stride_this_run) || ret;
459 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_TEXCOORD1,
460 fixup_flags, &stride_this_run) || ret;
461 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_TEXCOORD2,
462 fixup_flags, &stride_this_run) || ret;
463 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_TEXCOORD3,
464 fixup_flags, &stride_this_run) || ret;
465 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_TEXCOORD4,
466 fixup_flags, &stride_this_run) || ret;
467 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_TEXCOORD5,
468 fixup_flags, &stride_this_run) || ret;
469 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_TEXCOORD6,
470 fixup_flags, &stride_this_run) || ret;
471 ret = buffer_check_attribute(This, si, state, WINED3D_FFP_TEXCOORD7,
472 fixup_flags, &stride_this_run) || ret;
473
474 if (!stride_this_run && This->conversion_map)
475 {
476 /* Sanity test */
477 if (!ret)
478 ERR("no converted attributes found, old conversion map exists, and no declaration change?\n");
479 heap_free(This->conversion_map);
480 This->conversion_map = NULL;
481 This->stride = 0;
482 }
483
484 if (ret) TRACE("Conversion information changed\n");
485
486 return ret;
487 }
488
/* Swap the bytes at bits 0-7 and bits 16-23 of a colour in place, leaving
 * bits 8-15 and bits 24-31 untouched. Returns the number of bytes handled.
 *
 * Color conversion like in draw_primitive_immediate_mode(). Watch out for
 * endianness. If we want this to work on big-endian machines as well we
 * have to consider more things.
 *
 * Layout of the result:
 * 0xff000000: Alpha mask
 * 0x00ff0000: Blue mask
 * 0x0000ff00: Green mask
 * 0x000000ff: Red mask
 */
static inline unsigned int fixup_d3dcolor(DWORD *dst_color)
{
    const DWORD src = *dst_color;
    const DWORD alpha_green = src & 0xff00ff00u;
    const DWORD red = (src & 0x00ff0000u) >> 16;
    const DWORD blue = (src & 0x000000ffu) << 16;

    *dst_color = alpha_green | red | blue;

    return sizeof(*dst_color);
}
509
fixup_transformed_pos(struct wined3d_vec4 * p)510 static inline unsigned int fixup_transformed_pos(struct wined3d_vec4 *p)
511 {
512 /* rhw conversion like in position_float4(). */
513 if (p->w != 1.0f && p->w != 0.0f)
514 {
515 float w = 1.0f / p->w;
516 p->x *= w;
517 p->y *= w;
518 p->z *= w;
519 p->w = w;
520 }
521
522 return sizeof(*p);
523 }
524
wined3d_buffer_incref(struct wined3d_buffer * buffer)525 ULONG CDECL wined3d_buffer_incref(struct wined3d_buffer *buffer)
526 {
527 ULONG refcount = InterlockedIncrement(&buffer->resource.ref);
528
529 TRACE("%p increasing refcount to %u.\n", buffer, refcount);
530
531 return refcount;
532 }
533
534 /* Context activation is done by the caller. */
wined3d_buffer_upload_ranges(struct wined3d_buffer * buffer,struct wined3d_context * context,const void * data,unsigned int data_offset,unsigned int range_count,const struct wined3d_map_range * ranges)535 static void wined3d_buffer_upload_ranges(struct wined3d_buffer *buffer, struct wined3d_context *context,
536 const void *data, unsigned int data_offset, unsigned int range_count, const struct wined3d_map_range *ranges)
537 {
538 const struct wined3d_gl_info *gl_info = context->gl_info;
539 const struct wined3d_map_range *range;
540
541 buffer_bind(buffer, context);
542
543 while (range_count--)
544 {
545 range = &ranges[range_count];
546 GL_EXTCALL(glBufferSubData(buffer->buffer_type_hint,
547 range->offset, range->size, (BYTE *)data + range->offset - data_offset));
548 }
549 checkGLcall("glBufferSubData");
550 }
551
buffer_conversion_upload(struct wined3d_buffer * buffer,struct wined3d_context * context)552 static void buffer_conversion_upload(struct wined3d_buffer *buffer, struct wined3d_context *context)
553 {
554 unsigned int i, j, range_idx, start, end, vertex_count;
555 BYTE *data;
556
557 if (!wined3d_buffer_load_location(buffer, context, WINED3D_LOCATION_SYSMEM))
558 {
559 ERR("Failed to load system memory.\n");
560 return;
561 }
562 buffer->flags |= WINED3D_BUFFER_PIN_SYSMEM;
563
564 /* Now for each vertex in the buffer that needs conversion. */
565 vertex_count = buffer->resource.size / buffer->stride;
566
567 if (!(data = heap_alloc(buffer->resource.size)))
568 {
569 ERR("Out of memory.\n");
570 return;
571 }
572
573 for (range_idx = 0; range_idx < buffer->modified_areas; ++range_idx)
574 {
575 start = buffer->maps[range_idx].offset;
576 end = start + buffer->maps[range_idx].size;
577
578 memcpy(data + start, (BYTE *)buffer->resource.heap_memory + start, end - start);
579 for (i = start / buffer->stride; i < min((end / buffer->stride) + 1, vertex_count); ++i)
580 {
581 for (j = 0; j < buffer->stride;)
582 {
583 switch (buffer->conversion_map[j])
584 {
585 case CONV_NONE:
586 /* Done already */
587 j += sizeof(DWORD);
588 break;
589 case CONV_D3DCOLOR:
590 j += fixup_d3dcolor((DWORD *) (data + i * buffer->stride + j));
591 break;
592 case CONV_POSITIONT:
593 j += fixup_transformed_pos((struct wined3d_vec4 *) (data + i * buffer->stride + j));
594 break;
595 default:
596 FIXME("Unimplemented conversion %d in shifted conversion.\n", buffer->conversion_map[j]);
597 ++j;
598 }
599 }
600 }
601 }
602
603 wined3d_buffer_upload_ranges(buffer, context, data, 0, buffer->modified_areas, buffer->maps);
604
605 heap_free(data);
606 }
607
wined3d_buffer_prepare_location(struct wined3d_buffer * buffer,struct wined3d_context * context,DWORD location)608 static BOOL wined3d_buffer_prepare_location(struct wined3d_buffer *buffer,
609 struct wined3d_context *context, DWORD location)
610 {
611 switch (location)
612 {
613 case WINED3D_LOCATION_SYSMEM:
614 if (buffer->resource.heap_memory)
615 return TRUE;
616
617 if (!wined3d_resource_allocate_sysmem(&buffer->resource))
618 {
619 ERR("Failed to allocate system memory.\n");
620 return FALSE;
621 }
622 return TRUE;
623
624 case WINED3D_LOCATION_BUFFER:
625 if (buffer->buffer_object)
626 return TRUE;
627
628 if (!(buffer->flags & WINED3D_BUFFER_USE_BO))
629 {
630 WARN("Trying to create BO for buffer %p with no WINED3D_BUFFER_USE_BO.\n", buffer);
631 return FALSE;
632 }
633 return buffer_create_buffer_object(buffer, context);
634
635 default:
636 ERR("Invalid location %s.\n", wined3d_debug_location(location));
637 return FALSE;
638 }
639 }
640
wined3d_buffer_load_location(struct wined3d_buffer * buffer,struct wined3d_context * context,DWORD location)641 BOOL wined3d_buffer_load_location(struct wined3d_buffer *buffer,
642 struct wined3d_context *context, DWORD location)
643 {
644 const struct wined3d_gl_info *gl_info = context->gl_info;
645
646 TRACE("buffer %p, context %p, location %s.\n",
647 buffer, context, wined3d_debug_location(location));
648
649 if (buffer->locations & location)
650 {
651 TRACE("Location (%#x) is already up to date.\n", location);
652 return TRUE;
653 }
654
655 if (!buffer->locations)
656 {
657 ERR("Buffer %p does not have any up to date location.\n", buffer);
658 wined3d_buffer_validate_location(buffer, WINED3D_LOCATION_DISCARDED);
659 return wined3d_buffer_load_location(buffer, context, location);
660 }
661
662 TRACE("Current buffer location %s.\n", wined3d_debug_location(buffer->locations));
663
664 if (!wined3d_buffer_prepare_location(buffer, context, location))
665 return FALSE;
666
667 if (buffer->locations & WINED3D_LOCATION_DISCARDED)
668 {
669 TRACE("Buffer previously discarded, nothing to do.\n");
670 wined3d_buffer_validate_location(buffer, location);
671 wined3d_buffer_invalidate_location(buffer, WINED3D_LOCATION_DISCARDED);
672 return TRUE;
673 }
674
675 switch (location)
676 {
677 case WINED3D_LOCATION_SYSMEM:
678 buffer_bind(buffer, context);
679 GL_EXTCALL(glGetBufferSubData(buffer->buffer_type_hint, 0, buffer->resource.size,
680 buffer->resource.heap_memory));
681 checkGLcall("buffer download");
682 break;
683
684 case WINED3D_LOCATION_BUFFER:
685 if (!buffer->conversion_map)
686 wined3d_buffer_upload_ranges(buffer, context, buffer->resource.heap_memory,
687 0, buffer->modified_areas, buffer->maps);
688 else
689 buffer_conversion_upload(buffer, context);
690 break;
691
692 default:
693 ERR("Invalid location %s.\n", wined3d_debug_location(location));
694 return FALSE;
695 }
696
697 wined3d_buffer_validate_location(buffer, location);
698 if (buffer->resource.heap_memory && location == WINED3D_LOCATION_BUFFER
699 && !(buffer->resource.usage & WINED3DUSAGE_DYNAMIC))
700 wined3d_buffer_evict_sysmem(buffer);
701
702 return TRUE;
703 }
704
705 /* Context activation is done by the caller. */
wined3d_buffer_load_sysmem(struct wined3d_buffer * buffer,struct wined3d_context * context)706 BYTE *wined3d_buffer_load_sysmem(struct wined3d_buffer *buffer, struct wined3d_context *context)
707 {
708 if (wined3d_buffer_load_location(buffer, context, WINED3D_LOCATION_SYSMEM))
709 buffer->flags |= WINED3D_BUFFER_PIN_SYSMEM;
710 return buffer->resource.heap_memory;
711 }
712
/* Fill "data" with the address of the buffer's storage in one of the
 * requested locations, preferring the buffer object over system memory.
 *
 * Returns the location that was chosen, or 0 (with "data" zeroed) when
 * neither WINED3D_LOCATION_BUFFER nor WINED3D_LOCATION_SYSMEM was asked for. */
DWORD wined3d_buffer_get_memory(struct wined3d_buffer *buffer,
        struct wined3d_bo_address *data, DWORD locations)
{
    TRACE("buffer %p, data %p, locations %s.\n",
            buffer, data, wined3d_debug_location(locations));

    /* Start from the "nothing available" answer and refine it below. */
    data->buffer_object = 0;
    data->addr = NULL;

    if (locations & WINED3D_LOCATION_BUFFER)
    {
        data->buffer_object = buffer->buffer_object;
        return WINED3D_LOCATION_BUFFER;
    }

    if (locations & WINED3D_LOCATION_SYSMEM)
    {
        data->addr = buffer->resource.heap_memory;
        return WINED3D_LOCATION_SYSMEM;
    }

    ERR("Unexpected locations %s.\n", wined3d_debug_location(locations));
    return 0;
}
737
buffer_unload(struct wined3d_resource * resource)738 static void buffer_unload(struct wined3d_resource *resource)
739 {
740 struct wined3d_buffer *buffer = buffer_from_resource(resource);
741
742 TRACE("buffer %p.\n", buffer);
743
744 if (buffer->buffer_object)
745 {
746 struct wined3d_context *context;
747
748 context = context_acquire(resource->device, NULL, 0);
749
750 wined3d_buffer_load_location(buffer, context, WINED3D_LOCATION_SYSMEM);
751 wined3d_buffer_invalidate_location(buffer, WINED3D_LOCATION_BUFFER);
752 buffer_destroy_buffer_object(buffer, context);
753 buffer_clear_dirty_areas(buffer);
754
755 context_release(context);
756
757 heap_free(buffer->conversion_map);
758 buffer->conversion_map = NULL;
759 buffer->stride = 0;
760 buffer->conversion_stride = 0;
761 buffer->flags &= ~WINED3D_BUFFER_HASDESC;
762 }
763
764 resource_unload(resource);
765 }
766
wined3d_buffer_drop_bo(struct wined3d_buffer * buffer)767 static void wined3d_buffer_drop_bo(struct wined3d_buffer *buffer)
768 {
769 buffer->flags &= ~WINED3D_BUFFER_USE_BO;
770 buffer_unload(&buffer->resource);
771 }
772
wined3d_buffer_destroy_object(void * object)773 static void wined3d_buffer_destroy_object(void *object)
774 {
775 struct wined3d_buffer *buffer = object;
776 struct wined3d_context *context;
777
778 if (buffer->buffer_object)
779 {
780 context = context_acquire(buffer->resource.device, NULL, 0);
781 buffer_destroy_buffer_object(buffer, context);
782 context_release(context);
783
784 heap_free(buffer->conversion_map);
785 }
786
787 heap_free(buffer->maps);
788 heap_free(buffer);
789 }
790
wined3d_buffer_decref(struct wined3d_buffer * buffer)791 ULONG CDECL wined3d_buffer_decref(struct wined3d_buffer *buffer)
792 {
793 ULONG refcount = InterlockedDecrement(&buffer->resource.ref);
794
795 TRACE("%p decreasing refcount to %u.\n", buffer, refcount);
796
797 if (!refcount)
798 {
799 buffer->resource.parent_ops->wined3d_object_destroyed(buffer->resource.parent);
800 resource_cleanup(&buffer->resource);
801 wined3d_cs_destroy_object(buffer->resource.device->cs, wined3d_buffer_destroy_object, buffer);
802 }
803
804 return refcount;
805 }
806
wined3d_buffer_get_parent(const struct wined3d_buffer * buffer)807 void * CDECL wined3d_buffer_get_parent(const struct wined3d_buffer *buffer)
808 {
809 TRACE("buffer %p.\n", buffer);
810
811 return buffer->resource.parent;
812 }
813
814 /* The caller provides a context and binds the buffer */
buffer_sync_apple(struct wined3d_buffer * buffer,DWORD flags,const struct wined3d_gl_info * gl_info)815 static void buffer_sync_apple(struct wined3d_buffer *buffer, DWORD flags, const struct wined3d_gl_info *gl_info)
816 {
817 enum wined3d_fence_result ret;
818 HRESULT hr;
819
820 /* No fencing needs to be done if the app promises not to overwrite
821 * existing data. */
822 if (flags & WINED3D_MAP_NOOVERWRITE)
823 return;
824
825 if (flags & WINED3D_MAP_DISCARD)
826 {
827 GL_EXTCALL(glBufferData(buffer->buffer_type_hint, buffer->resource.size, NULL, buffer->buffer_object_usage));
828 checkGLcall("glBufferData");
829 return;
830 }
831
832 if (!buffer->fence)
833 {
834 TRACE("Creating fence for buffer %p.\n", buffer);
835
836 if (FAILED(hr = wined3d_fence_create(buffer->resource.device, &buffer->fence)))
837 {
838 if (hr == WINED3DERR_NOTAVAILABLE)
839 FIXME("Fences not supported, dropping async buffer locks.\n");
840 else
841 ERR("Failed to create fence, hr %#x.\n", hr);
842 goto drop_fence;
843 }
844
845 /* Since we don't know about old draws a glFinish is needed once */
846 gl_info->gl_ops.gl.p_glFinish();
847 return;
848 }
849
850 TRACE("Synchronizing buffer %p.\n", buffer);
851 ret = wined3d_fence_wait(buffer->fence, buffer->resource.device);
852 switch (ret)
853 {
854 case WINED3D_FENCE_NOT_STARTED:
855 case WINED3D_FENCE_OK:
856 /* All done */
857 return;
858
859 case WINED3D_FENCE_WRONG_THREAD:
860 WARN("Cannot synchronize buffer lock due to a thread conflict.\n");
861 goto drop_fence;
862
863 default:
864 ERR("wined3d_fence_wait() returned %u, dropping async buffer locks.\n", ret);
865 goto drop_fence;
866 }
867
868 drop_fence:
869 if (buffer->fence)
870 {
871 wined3d_fence_destroy(buffer->fence);
872 buffer->fence = NULL;
873 }
874
875 gl_info->gl_ops.gl.p_glFinish();
876 GL_EXTCALL(glBufferParameteriAPPLE(buffer->buffer_type_hint, GL_BUFFER_SERIALIZED_MODIFY_APPLE, GL_TRUE));
877 checkGLcall("glBufferParameteriAPPLE(buffer->buffer_type_hint, GL_BUFFER_SERIALIZED_MODIFY_APPLE, GL_TRUE)");
878 buffer->flags &= ~WINED3D_BUFFER_APPLESYNC;
879 }
880
buffer_mark_used(struct wined3d_buffer * buffer)881 static void buffer_mark_used(struct wined3d_buffer *buffer)
882 {
883 buffer->flags &= ~WINED3D_BUFFER_DISCARD;
884 }
885
886 /* Context activation is done by the caller. */
wined3d_buffer_load(struct wined3d_buffer * buffer,struct wined3d_context * context,const struct wined3d_state * state)887 void wined3d_buffer_load(struct wined3d_buffer *buffer, struct wined3d_context *context,
888 const struct wined3d_state *state)
889 {
890 const struct wined3d_gl_info *gl_info = context->gl_info;
891 BOOL decl_changed = FALSE;
892
893 TRACE("buffer %p.\n", buffer);
894
895 if (buffer->resource.map_count)
896 {
897 WARN("Buffer is mapped, skipping preload.\n");
898 return;
899 }
900
901 buffer_mark_used(buffer);
902
903 /* TODO: Make converting independent from VBOs */
904 if (!(buffer->flags & WINED3D_BUFFER_USE_BO))
905 {
906 /* Not doing any conversion */
907 return;
908 }
909
910 if (!wined3d_buffer_prepare_location(buffer, context, WINED3D_LOCATION_BUFFER))
911 {
912 ERR("Failed to prepare buffer location.\n");
913 return;
914 }
915
916 /* Reading the declaration makes only sense if we have valid state information
917 * (i.e., if this function is called during draws). */
918 if (state)
919 {
920 DWORD fixup_flags = 0;
921
922 if (!use_vs(state))
923 {
924 if (!gl_info->supported[ARB_VERTEX_ARRAY_BGRA] && !context->d3d_info->ffp_generic_attributes)
925 fixup_flags |= WINED3D_BUFFER_FIXUP_D3DCOLOR;
926 if (!context->d3d_info->xyzrhw)
927 fixup_flags |= WINED3D_BUFFER_FIXUP_XYZRHW;
928 }
929
930 decl_changed = buffer_find_decl(buffer, &context->stream_info, state, fixup_flags);
931 buffer->flags |= WINED3D_BUFFER_HASDESC;
932 }
933
934 if (!decl_changed && !(buffer->flags & WINED3D_BUFFER_HASDESC && buffer_is_dirty(buffer)))
935 {
936 ++buffer->draw_count;
937 if (buffer->draw_count > VB_RESETDECLCHANGE)
938 buffer->decl_change_count = 0;
939 if (buffer->draw_count > VB_RESETFULLCONVS)
940 buffer->full_conversion_count = 0;
941 return;
942 }
943
944 /* If applications change the declaration over and over, reconverting all the time is a huge
945 * performance hit. So count the declaration changes and release the VBO if there are too many
946 * of them (and thus stop converting)
947 */
948 if (decl_changed)
949 {
950 ++buffer->decl_change_count;
951 buffer->draw_count = 0;
952
953 if (buffer->decl_change_count > VB_MAXDECLCHANGES
954 || (buffer->conversion_map && (buffer->resource.usage & WINED3DUSAGE_DYNAMIC)))
955 {
956 FIXME("Too many declaration changes or converting dynamic buffer, stopping converting.\n");
957 wined3d_buffer_drop_bo(buffer);
958 return;
959 }
960
961 /* The declaration changed, reload the whole buffer. */
962 WARN("Reloading buffer because of a vertex declaration change.\n");
963 buffer_invalidate_bo_range(buffer, 0, 0);
964 }
965 else
966 {
967 /* However, it is perfectly fine to change the declaration every now and then. We don't want a game that
968 * changes it every minute drop the VBO after VB_MAX_DECL_CHANGES minutes. So count draws without
969 * decl changes and reset the decl change count after a specific number of them
970 */
971 if (buffer->conversion_map && buffer_is_fully_dirty(buffer))
972 {
973 ++buffer->full_conversion_count;
974 if (buffer->full_conversion_count > VB_MAXFULLCONVERSIONS)
975 {
976 FIXME("Too many full buffer conversions, stopping converting.\n");
977 wined3d_buffer_drop_bo(buffer);
978 return;
979 }
980 }
981 else
982 {
983 ++buffer->draw_count;
984 if (buffer->draw_count > VB_RESETDECLCHANGE)
985 buffer->decl_change_count = 0;
986 if (buffer->draw_count > VB_RESETFULLCONVS)
987 buffer->full_conversion_count = 0;
988 }
989 }
990
991 if (!wined3d_buffer_load_location(buffer, context, WINED3D_LOCATION_BUFFER))
992 ERR("Failed to load buffer location.\n");
993 }
994
wined3d_buffer_get_resource(struct wined3d_buffer * buffer)995 struct wined3d_resource * CDECL wined3d_buffer_get_resource(struct wined3d_buffer *buffer)
996 {
997 TRACE("buffer %p.\n", buffer);
998
999 return &buffer->resource;
1000 }
1001
wined3d_buffer_map(struct wined3d_buffer * buffer,UINT offset,UINT size,BYTE ** data,DWORD flags)1002 static HRESULT wined3d_buffer_map(struct wined3d_buffer *buffer, UINT offset, UINT size, BYTE **data, DWORD flags)
1003 {
1004 struct wined3d_device *device = buffer->resource.device;
1005 struct wined3d_context *context;
1006 LONG count;
1007 BYTE *base;
1008
1009 TRACE("buffer %p, offset %u, size %u, data %p, flags %#x.\n", buffer, offset, size, data, flags);
1010
1011 count = ++buffer->resource.map_count;
1012
1013 if (buffer->buffer_object)
1014 {
1015 unsigned int dirty_offset = offset, dirty_size = size;
1016
1017 /* DISCARD invalidates the entire buffer, regardless of the specified
1018 * offset and size. Some applications also depend on the entire buffer
1019 * being uploaded in that case. Two such applications are Port Royale
1020 * and Darkstar One. */
1021 if (flags & WINED3D_MAP_DISCARD)
1022 {
1023 dirty_offset = 0;
1024 dirty_size = 0;
1025 }
1026
1027 if (((flags & WINED3D_MAP_WRITE) && !(flags & (WINED3D_MAP_NOOVERWRITE | WINED3D_MAP_DISCARD)))
1028 || (!(flags & WINED3D_MAP_WRITE) && (buffer->locations & WINED3D_LOCATION_SYSMEM))
1029 || buffer->flags & WINED3D_BUFFER_PIN_SYSMEM)
1030 {
1031 if (!(buffer->locations & WINED3D_LOCATION_SYSMEM))
1032 {
1033 context = context_acquire(device, NULL, 0);
1034 wined3d_buffer_load_location(buffer, context, WINED3D_LOCATION_SYSMEM);
1035 context_release(context);
1036 }
1037
1038 if (flags & WINED3D_MAP_WRITE)
1039 wined3d_buffer_invalidate_range(buffer, WINED3D_LOCATION_BUFFER, dirty_offset, dirty_size);
1040 }
1041 else
1042 {
1043 const struct wined3d_gl_info *gl_info;
1044
1045 context = context_acquire(device, NULL, 0);
1046 gl_info = context->gl_info;
1047
1048 if (flags & WINED3D_MAP_DISCARD)
1049 wined3d_buffer_validate_location(buffer, WINED3D_LOCATION_BUFFER);
1050 else
1051 wined3d_buffer_load_location(buffer, context, WINED3D_LOCATION_BUFFER);
1052
1053 if (flags & WINED3D_MAP_WRITE)
1054 buffer_invalidate_bo_range(buffer, dirty_offset, dirty_size);
1055
1056 if ((flags & WINED3D_MAP_DISCARD) && buffer->resource.heap_memory)
1057 wined3d_buffer_evict_sysmem(buffer);
1058
1059 if (count == 1)
1060 {
1061 buffer_bind(buffer, context);
1062
1063 /* Filter redundant WINED3D_MAP_DISCARD maps. The 3DMark2001
1064 * multitexture fill rate test seems to depend on this. When
1065 * we map a buffer with GL_MAP_INVALIDATE_BUFFER_BIT, the
1066 * driver is free to discard the previous contents of the
1067 * buffer. The r600g driver only does this when the buffer is
1068 * currently in use, while the proprietary NVIDIA driver
1069 * appears to do this unconditionally. */
1070 if (buffer->flags & WINED3D_BUFFER_DISCARD)
1071 flags &= ~WINED3D_MAP_DISCARD;
1072
1073 if (gl_info->supported[ARB_MAP_BUFFER_RANGE])
1074 {
1075 GLbitfield mapflags = wined3d_resource_gl_map_flags(flags);
1076 buffer->map_ptr = GL_EXTCALL(glMapBufferRange(buffer->buffer_type_hint,
1077 0, buffer->resource.size, mapflags));
1078 checkGLcall("glMapBufferRange");
1079 }
1080 else
1081 {
1082 if (buffer->flags & WINED3D_BUFFER_APPLESYNC)
1083 buffer_sync_apple(buffer, flags, gl_info);
1084 buffer->map_ptr = GL_EXTCALL(glMapBuffer(buffer->buffer_type_hint,
1085 GL_READ_WRITE));
1086 checkGLcall("glMapBuffer");
1087 }
1088
1089 if (((DWORD_PTR)buffer->map_ptr) & (RESOURCE_ALIGNMENT - 1))
1090 {
1091 WARN("Pointer %p is not %u byte aligned.\n", buffer->map_ptr, RESOURCE_ALIGNMENT);
1092
1093 GL_EXTCALL(glUnmapBuffer(buffer->buffer_type_hint));
1094 checkGLcall("glUnmapBuffer");
1095 buffer->map_ptr = NULL;
1096
1097 if (buffer->resource.usage & WINED3DUSAGE_DYNAMIC)
1098 {
1099 /* The extra copy is more expensive than not using VBOs at
1100 * all on the Nvidia Linux driver, which is the only driver
1101 * that returns unaligned pointers.
1102 */
1103 TRACE("Dynamic buffer, dropping VBO.\n");
1104 wined3d_buffer_drop_bo(buffer);
1105 }
1106 else
1107 {
1108 TRACE("Falling back to doublebuffered operation.\n");
1109 wined3d_buffer_load_location(buffer, context, WINED3D_LOCATION_SYSMEM);
1110 buffer->flags |= WINED3D_BUFFER_PIN_SYSMEM;
1111 }
1112 TRACE("New pointer is %p.\n", buffer->resource.heap_memory);
1113 }
1114 }
1115
1116 context_release(context);
1117 }
1118
1119 if (flags & WINED3D_MAP_DISCARD)
1120 buffer->flags |= WINED3D_BUFFER_DISCARD;
1121 }
1122
1123 base = buffer->map_ptr ? buffer->map_ptr : buffer->resource.heap_memory;
1124 *data = base + offset;
1125
1126 TRACE("Returning memory at %p (base %p, offset %u).\n", *data, base, offset);
1127 /* TODO: check Flags compatibility with buffer->currentDesc.Usage (see MSDN) */
1128
1129 return WINED3D_OK;
1130 }
1131
wined3d_buffer_unmap(struct wined3d_buffer * buffer)1132 static void wined3d_buffer_unmap(struct wined3d_buffer *buffer)
1133 {
1134 ULONG i;
1135
1136 TRACE("buffer %p.\n", buffer);
1137
1138 /* In the case that the number of Unmap calls > the
1139 * number of Map calls, d3d returns always D3D_OK.
1140 * This is also needed to prevent Map from returning garbage on
1141 * the next call (this will happen if the lock_count is < 0). */
1142 if (!buffer->resource.map_count)
1143 {
1144 WARN("Unmap called without a previous map call.\n");
1145 return;
1146 }
1147
1148 if (--buffer->resource.map_count)
1149 {
1150 /* Delay loading the buffer until everything is unlocked */
1151 TRACE("Ignoring unmap.\n");
1152 return;
1153 }
1154
1155 if (buffer->map_ptr)
1156 {
1157 struct wined3d_device *device = buffer->resource.device;
1158 const struct wined3d_gl_info *gl_info;
1159 struct wined3d_context *context;
1160
1161 context = context_acquire(device, NULL, 0);
1162 gl_info = context->gl_info;
1163
1164 buffer_bind(buffer, context);
1165
1166 if (gl_info->supported[ARB_MAP_BUFFER_RANGE])
1167 {
1168 for (i = 0; i < buffer->modified_areas; ++i)
1169 {
1170 GL_EXTCALL(glFlushMappedBufferRange(buffer->buffer_type_hint,
1171 buffer->maps[i].offset, buffer->maps[i].size));
1172 checkGLcall("glFlushMappedBufferRange");
1173 }
1174 }
1175 else if (buffer->flags & WINED3D_BUFFER_APPLESYNC)
1176 {
1177 for (i = 0; i < buffer->modified_areas; ++i)
1178 {
1179 GL_EXTCALL(glFlushMappedBufferRangeAPPLE(buffer->buffer_type_hint,
1180 buffer->maps[i].offset, buffer->maps[i].size));
1181 checkGLcall("glFlushMappedBufferRangeAPPLE");
1182 }
1183 }
1184
1185 GL_EXTCALL(glUnmapBuffer(buffer->buffer_type_hint));
1186 if (wined3d_settings.strict_draw_ordering)
1187 gl_info->gl_ops.gl.p_glFlush(); /* Flush to ensure ordering across contexts. */
1188 context_release(context);
1189
1190 buffer_clear_dirty_areas(buffer);
1191 buffer->map_ptr = NULL;
1192 }
1193 }
1194
wined3d_buffer_copy(struct wined3d_buffer * dst_buffer,unsigned int dst_offset,struct wined3d_buffer * src_buffer,unsigned int src_offset,unsigned int size)1195 void wined3d_buffer_copy(struct wined3d_buffer *dst_buffer, unsigned int dst_offset,
1196 struct wined3d_buffer *src_buffer, unsigned int src_offset, unsigned int size)
1197 {
1198 struct wined3d_bo_address dst, src;
1199 struct wined3d_context *context;
1200 DWORD dst_location;
1201
1202 buffer_mark_used(dst_buffer);
1203 buffer_mark_used(src_buffer);
1204
1205 dst_location = wined3d_buffer_get_memory(dst_buffer, &dst, dst_buffer->locations);
1206 dst.addr += dst_offset;
1207
1208 wined3d_buffer_get_memory(src_buffer, &src, src_buffer->locations);
1209 src.addr += src_offset;
1210
1211 context = context_acquire(dst_buffer->resource.device, NULL, 0);
1212 context_copy_bo_address(context, &dst, dst_buffer->buffer_type_hint,
1213 &src, src_buffer->buffer_type_hint, size);
1214 context_release(context);
1215
1216 wined3d_buffer_invalidate_range(dst_buffer, ~dst_location, dst_offset, size);
1217 }
1218
wined3d_buffer_upload_data(struct wined3d_buffer * buffer,struct wined3d_context * context,const struct wined3d_box * box,const void * data)1219 void wined3d_buffer_upload_data(struct wined3d_buffer *buffer, struct wined3d_context *context,
1220 const struct wined3d_box *box, const void *data)
1221 {
1222 struct wined3d_map_range range;
1223
1224 if (box)
1225 {
1226 range.offset = box->left;
1227 range.size = box->right - box->left;
1228 }
1229 else
1230 {
1231 range.offset = 0;
1232 range.size = buffer->resource.size;
1233 }
1234
1235 wined3d_buffer_upload_ranges(buffer, context, data, range.offset, 1, &range);
1236 }
1237
buffer_resource_incref(struct wined3d_resource * resource)1238 static ULONG buffer_resource_incref(struct wined3d_resource *resource)
1239 {
1240 return wined3d_buffer_incref(buffer_from_resource(resource));
1241 }
1242
buffer_resource_decref(struct wined3d_resource * resource)1243 static ULONG buffer_resource_decref(struct wined3d_resource *resource)
1244 {
1245 return wined3d_buffer_decref(buffer_from_resource(resource));
1246 }
1247
buffer_resource_preload(struct wined3d_resource * resource)1248 static void buffer_resource_preload(struct wined3d_resource *resource)
1249 {
1250 struct wined3d_context *context;
1251
1252 context = context_acquire(resource->device, NULL, 0);
1253 wined3d_buffer_load(buffer_from_resource(resource), context, NULL);
1254 context_release(context);
1255 }
1256
buffer_resource_sub_resource_map(struct wined3d_resource * resource,unsigned int sub_resource_idx,struct wined3d_map_desc * map_desc,const struct wined3d_box * box,DWORD flags)1257 static HRESULT buffer_resource_sub_resource_map(struct wined3d_resource *resource, unsigned int sub_resource_idx,
1258 struct wined3d_map_desc *map_desc, const struct wined3d_box *box, DWORD flags)
1259 {
1260 struct wined3d_buffer *buffer = buffer_from_resource(resource);
1261 UINT offset, size;
1262
1263 if (sub_resource_idx)
1264 {
1265 WARN("Invalid sub_resource_idx %u.\n", sub_resource_idx);
1266 return E_INVALIDARG;
1267 }
1268
1269 if (box)
1270 {
1271 offset = box->left;
1272 size = box->right - box->left;
1273 }
1274 else
1275 {
1276 offset = size = 0;
1277 }
1278
1279 map_desc->row_pitch = map_desc->slice_pitch = buffer->desc.byte_width;
1280 return wined3d_buffer_map(buffer, offset, size, (BYTE **)&map_desc->data, flags);
1281 }
1282
buffer_resource_sub_resource_map_info(struct wined3d_resource * resource,unsigned int sub_resource_idx,struct wined3d_map_info * info,DWORD flags)1283 static HRESULT buffer_resource_sub_resource_map_info(struct wined3d_resource *resource, unsigned int sub_resource_idx,
1284 struct wined3d_map_info *info, DWORD flags)
1285 {
1286 struct wined3d_buffer *buffer = buffer_from_resource(resource);
1287
1288 if (sub_resource_idx)
1289 {
1290 WARN("Invalid sub_resource_idx %u.\n", sub_resource_idx);
1291 return E_INVALIDARG;
1292 }
1293
1294 info->row_pitch = buffer->desc.byte_width;
1295 info->slice_pitch = buffer->desc.byte_width;
1296 info->size = buffer->resource.size;
1297
1298 return WINED3D_OK;
1299 }
1300
buffer_resource_sub_resource_unmap(struct wined3d_resource * resource,unsigned int sub_resource_idx)1301 static HRESULT buffer_resource_sub_resource_unmap(struct wined3d_resource *resource, unsigned int sub_resource_idx)
1302 {
1303 if (sub_resource_idx)
1304 {
1305 WARN("Invalid sub_resource_idx %u.\n", sub_resource_idx);
1306 return E_INVALIDARG;
1307 }
1308
1309 wined3d_buffer_unmap(buffer_from_resource(resource));
1310 return WINED3D_OK;
1311 }
1312
/* Resource operations for buffers; buffer_init() passes this table to
 * resource_init(). The initializers are positional, so their order has to
 * match the member order of struct wined3d_resource_ops. */
static const struct wined3d_resource_ops buffer_resource_ops =
{
    buffer_resource_incref,                 /* add a reference */
    buffer_resource_decref,                 /* release a reference */
    buffer_resource_preload,                /* load outside of a draw */
    buffer_unload,                          /* unload the resource */
    buffer_resource_sub_resource_map,       /* map sub-resource 0 */
    buffer_resource_sub_resource_map_info,  /* query pitches and size */
    buffer_resource_sub_resource_unmap,     /* unmap sub-resource 0 */
};
1323
buffer_type_hint_from_bind_flags(const struct wined3d_gl_info * gl_info,unsigned int bind_flags)1324 static GLenum buffer_type_hint_from_bind_flags(const struct wined3d_gl_info *gl_info,
1325 unsigned int bind_flags)
1326 {
1327 if (bind_flags == WINED3D_BIND_INDEX_BUFFER)
1328 return GL_ELEMENT_ARRAY_BUFFER;
1329
1330 if (bind_flags & (WINED3D_BIND_SHADER_RESOURCE | WINED3D_BIND_UNORDERED_ACCESS)
1331 && gl_info->supported[ARB_TEXTURE_BUFFER_OBJECT])
1332 return GL_TEXTURE_BUFFER;
1333
1334 if (bind_flags & WINED3D_BIND_CONSTANT_BUFFER)
1335 return GL_UNIFORM_BUFFER;
1336
1337 if (bind_flags & WINED3D_BIND_STREAM_OUTPUT)
1338 return GL_TRANSFORM_FEEDBACK_BUFFER;
1339
1340 if (bind_flags & ~(WINED3D_BIND_VERTEX_BUFFER | WINED3D_BIND_INDEX_BUFFER))
1341 FIXME("Unhandled bind flags %#x.\n", bind_flags);
1342
1343 return GL_ARRAY_BUFFER;
1344 }
1345
buffer_init(struct wined3d_buffer * buffer,struct wined3d_device * device,UINT size,DWORD usage,enum wined3d_format_id format_id,unsigned int access,unsigned int bind_flags,const struct wined3d_sub_resource_data * data,void * parent,const struct wined3d_parent_ops * parent_ops)1346 static HRESULT buffer_init(struct wined3d_buffer *buffer, struct wined3d_device *device,
1347 UINT size, DWORD usage, enum wined3d_format_id format_id, unsigned int access, unsigned int bind_flags,
1348 const struct wined3d_sub_resource_data *data, void *parent, const struct wined3d_parent_ops *parent_ops)
1349 {
1350 const struct wined3d_gl_info *gl_info = &device->adapter->gl_info;
1351 const struct wined3d_format *format = wined3d_get_format(gl_info, format_id, usage);
1352 BOOL dynamic_buffer_ok;
1353 HRESULT hr;
1354
1355 if (!size)
1356 {
1357 WARN("Size 0 requested, returning E_INVALIDARG.\n");
1358 return E_INVALIDARG;
1359 }
1360
1361 if (bind_flags & WINED3D_BIND_CONSTANT_BUFFER && size & (WINED3D_CONSTANT_BUFFER_ALIGNMENT - 1))
1362 {
1363 WARN("Size %#x is not suitably aligned for constant buffers.\n", size);
1364 return E_INVALIDARG;
1365 }
1366
1367 if (data && !data->data)
1368 {
1369 WARN("Invalid sub-resource data specified.\n");
1370 return E_INVALIDARG;
1371 }
1372
1373 if (FAILED(hr = resource_init(&buffer->resource, device, WINED3D_RTYPE_BUFFER, format, WINED3D_MULTISAMPLE_NONE,
1374 0, usage, access, size, 1, 1, size, parent, parent_ops, &buffer_resource_ops)))
1375 {
1376 WARN("Failed to initialize resource, hr %#x.\n", hr);
1377 return hr;
1378 }
1379 buffer->buffer_type_hint = buffer_type_hint_from_bind_flags(gl_info, bind_flags);
1380 buffer->bind_flags = bind_flags;
1381 buffer->locations = WINED3D_LOCATION_SYSMEM;
1382
1383 TRACE("buffer %p, size %#x, usage %#x, format %s, memory @ %p.\n",
1384 buffer, buffer->resource.size, buffer->resource.usage,
1385 debug_d3dformat(buffer->resource.format->id), buffer->resource.heap_memory);
1386
1387 if (device->create_parms.flags & WINED3DCREATE_SOFTWARE_VERTEXPROCESSING
1388 || wined3d_resource_access_is_managed(access))
1389 {
1390 /* SWvp and managed buffers always return the same pointer in buffer
1391 * maps and retain data in DISCARD maps. Keep a system memory copy of
1392 * the buffer to provide the same behavior to the application. */
1393 TRACE("Using doublebuffer mode.\n");
1394 buffer->flags |= WINED3D_BUFFER_PIN_SYSMEM;
1395 }
1396
1397 /* Observations show that draw_primitive_immediate_mode() is faster on
1398 * dynamic vertex buffers than converting + draw_primitive_arrays().
1399 * (Half-Life 2 and others.) */
1400 dynamic_buffer_ok = gl_info->supported[APPLE_FLUSH_BUFFER_RANGE] || gl_info->supported[ARB_MAP_BUFFER_RANGE];
1401
1402 if (!gl_info->supported[ARB_VERTEX_BUFFER_OBJECT])
1403 {
1404 TRACE("Not creating a BO because GL_ARB_vertex_buffer is not supported.\n");
1405 }
1406 else if (!(access & WINED3D_RESOURCE_ACCESS_GPU))
1407 {
1408 TRACE("Not creating a BO because the buffer is not GPU accessible.\n");
1409 }
1410 else if (!dynamic_buffer_ok && (buffer->resource.usage & WINED3DUSAGE_DYNAMIC))
1411 {
1412 TRACE("Not creating a BO because the buffer has dynamic usage and no GL support.\n");
1413 }
1414 else
1415 {
1416 buffer->flags |= WINED3D_BUFFER_USE_BO;
1417 }
1418
1419 if (!(buffer->maps = heap_alloc(sizeof(*buffer->maps))))
1420 {
1421 ERR("Out of memory.\n");
1422 buffer_unload(&buffer->resource);
1423 resource_cleanup(&buffer->resource);
1424 wined3d_resource_wait_idle(&buffer->resource);
1425 return E_OUTOFMEMORY;
1426 }
1427 buffer->maps_size = 1;
1428
1429 if (data)
1430 wined3d_device_update_sub_resource(device, &buffer->resource,
1431 0, NULL, data->data, data->row_pitch, data->slice_pitch);
1432
1433 return WINED3D_OK;
1434 }
1435
wined3d_buffer_create(struct wined3d_device * device,const struct wined3d_buffer_desc * desc,const struct wined3d_sub_resource_data * data,void * parent,const struct wined3d_parent_ops * parent_ops,struct wined3d_buffer ** buffer)1436 HRESULT CDECL wined3d_buffer_create(struct wined3d_device *device, const struct wined3d_buffer_desc *desc,
1437 const struct wined3d_sub_resource_data *data, void *parent, const struct wined3d_parent_ops *parent_ops,
1438 struct wined3d_buffer **buffer)
1439 {
1440 struct wined3d_buffer *object;
1441 HRESULT hr;
1442
1443 TRACE("device %p, desc %p, data %p, parent %p, parent_ops %p, buffer %p.\n",
1444 device, desc, data, parent, parent_ops, buffer);
1445
1446 if (!(object = heap_alloc_zero(sizeof(*object))))
1447 return E_OUTOFMEMORY;
1448
1449 if (FAILED(hr = buffer_init(object, device, desc->byte_width, desc->usage, WINED3DFMT_UNKNOWN,
1450 desc->access, desc->bind_flags, data, parent, parent_ops)))
1451 {
1452 WARN("Failed to initialize buffer, hr %#x.\n", hr);
1453 heap_free(object);
1454 return hr;
1455 }
1456 object->desc = *desc;
1457
1458 TRACE("Created buffer %p.\n", object);
1459
1460 *buffer = object;
1461
1462 return WINED3D_OK;
1463 }
1464