1 /*
2  * Copyright © 2021 Raspberry Pi
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  */
23 
24 #include "v3dv_private.h"
25 #include "broadcom/common/v3d_macros.h"
26 #include "broadcom/cle/v3dx_pack.h"
27 
28 #include "util/format/u_format.h"
29 
/* Expands to a brace-enclosed list of four PIPE_SWIZZLE_* values.  Every
 * argument is token-pasted onto the PIPE_SWIZZLE_ prefix, so callers pass a
 * bare suffix (X, Y, Z, W, 0 and 1 are the ones used in this file).
 */
#define SWIZ(c0, c1, c2, c3) \
   { PIPE_SWIZZLE_##c0, PIPE_SWIZZLE_##c1, PIPE_SWIZZLE_##c2, PIPE_SWIZZLE_##c3 }

/* Emits one designated-initializer entry for the slot VK_FORMAT_<vk_fmt>.
 *
 * The members are initialized positionally: a constant `true` first
 * (presumably the `supported` flag that get_format tests -- confirm against
 * struct v3dv_format), then V3D_OUTPUT_IMAGE_FORMAT_<rt_fmt>,
 * TEXTURE_DATA_FORMAT_<tex_fmt>, the swizzle initializer, the return size
 * and the filtering flag.
 */
#define FORMAT(vk_fmt, rt_fmt, tex_fmt, swizzle, ret_size, filterable)   \
   [VK_FORMAT_##vk_fmt] = { true,                                        \
                            V3D_OUTPUT_IMAGE_FORMAT_##rt_fmt,            \
                            TEXTURE_DATA_FORMAT_##tex_fmt,               \
                            swizzle,                                     \
                            ret_size,                                    \
                            filterable, }

/* Channels taken in order, with missing ones filled by constants. */
#define SWIZ_X001 SWIZ(X, 0, 0, 1)
#define SWIZ_XY01 SWIZ(X, Y, 0, 1)
#define SWIZ_XYZ1 SWIZ(X, Y, Z, 1)
#define SWIZ_XYZW SWIZ(X, Y, Z, W)

/* Channels reordered. */
#define SWIZ_YZWX SWIZ(Y, Z, W, X)
#define SWIZ_YZW1 SWIZ(Y, Z, W, 1)
#define SWIZ_ZYXW SWIZ(Z, Y, X, W)
#define SWIZ_ZYX1 SWIZ(Z, Y, X, 1)
#define SWIZ_WXYZ SWIZ(W, X, Y, Z)

/* A single source channel replicated or moved. */
#define SWIZ_XXXY SWIZ(X, X, X, Y)
#define SWIZ_XXX1 SWIZ(X, X, X, 1)
#define SWIZ_XXXX SWIZ(X, X, X, X)
#define SWIZ_000X SWIZ(0, 0, 0, X)
60 
/* Per-format hardware description, indexed directly by the VkFormat value.
 *
 * Each FORMAT() row lists, in order: the VK_FORMAT_ suffix, the
 * V3D_OUTPUT_IMAGE_FORMAT_ suffix, the TEXTURE_DATA_FORMAT_ suffix, the
 * channel swizzle, the return size and the filtering flag.
 *
 * Array slots that have no FORMAT() row are zero-initialized, so their
 * `supported` member reads as false when get_format tests it.
 *
 * FIXME: expand format table to describe whether the format is supported
 * for buffer surfaces (texel buffers, vertex buffers, etc).
 */
static const struct v3dv_format format_table[] = {
   /* Color, 4 channels */
   FORMAT(B8G8R8A8_SRGB,           SRGB8_ALPHA8, RGBA8,         SWIZ_ZYXW, 16, true),
   FORMAT(B8G8R8A8_UNORM,          RGBA8,        RGBA8,         SWIZ_ZYXW, 16, true),

   FORMAT(R8G8B8A8_SRGB,           SRGB8_ALPHA8, RGBA8,         SWIZ_XYZW, 16, true),
   FORMAT(R8G8B8A8_UNORM,          RGBA8,        RGBA8,         SWIZ_XYZW, 16, true),
   FORMAT(R8G8B8A8_SNORM,          NO,           RGBA8_SNORM,   SWIZ_XYZW, 16, true),
   FORMAT(R8G8B8A8_SINT,           RGBA8I,       RGBA8I,        SWIZ_XYZW, 16, false),
   FORMAT(R8G8B8A8_UINT,           RGBA8UI,      RGBA8UI,       SWIZ_XYZW, 16, false),

   FORMAT(R16G16B16A16_SFLOAT,     RGBA16F,      RGBA16F,       SWIZ_XYZW, 16, true),
   FORMAT(R16G16B16A16_UNORM,      NO,           RGBA16,        SWIZ_XYZW, 32, true),
   FORMAT(R16G16B16A16_SNORM,      NO,           RGBA16_SNORM,  SWIZ_XYZW, 32, true),
   FORMAT(R16G16B16A16_SINT,       RGBA16I,      RGBA16I,       SWIZ_XYZW, 16, false),
   FORMAT(R16G16B16A16_UINT,       RGBA16UI,     RGBA16UI,      SWIZ_XYZW, 16, false),

   FORMAT(R32G32B32A32_SFLOAT,     RGBA32F,      RGBA32F,       SWIZ_XYZW, 32, false),
   FORMAT(R32G32B32A32_SINT,       RGBA32I,      RGBA32I,       SWIZ_XYZW, 32, false),
   FORMAT(R32G32B32A32_UINT,       RGBA32UI,     RGBA32UI,      SWIZ_XYZW, 32, false),

   /* Color, 3 channels */
   FORMAT(R32G32B32_SFLOAT,        NO,           NO,            SWIZ_XYZ1,  0, false),
   FORMAT(R32G32B32_UINT,          NO,           NO,            SWIZ_XYZ1,  0, false),
   FORMAT(R32G32B32_SINT,          NO,           NO,            SWIZ_XYZ1,  0, false),

   /* Color, 2 channels */
   FORMAT(R8G8_UNORM,              RG8,          RG8,           SWIZ_XY01, 16, true),
   FORMAT(R8G8_SNORM,              NO,           RG8_SNORM,     SWIZ_XY01, 16, true),
   FORMAT(R8G8_SINT,               RG8I,         RG8I,          SWIZ_XY01, 16, false),
   FORMAT(R8G8_UINT,               RG8UI,        RG8UI,         SWIZ_XY01, 16, false),

   FORMAT(R16G16_UNORM,            NO,           RG16,          SWIZ_XY01, 32, true),
   FORMAT(R16G16_SNORM,            NO,           RG16_SNORM,    SWIZ_XY01, 32, true),
   FORMAT(R16G16_SFLOAT,           RG16F,        RG16F,         SWIZ_XY01, 16, true),
   FORMAT(R16G16_SINT,             RG16I,        RG16I,         SWIZ_XY01, 16, false),
   FORMAT(R16G16_UINT,             RG16UI,       RG16UI,        SWIZ_XY01, 16, false),

   FORMAT(R32G32_SFLOAT,           RG32F,        RG32F,         SWIZ_XY01, 32, false),
   FORMAT(R32G32_SINT,             RG32I,        RG32I,         SWIZ_XY01, 32, false),
   FORMAT(R32G32_UINT,             RG32UI,       RG32UI,        SWIZ_XY01, 32, false),

   /* Color, 1 channel */
   FORMAT(R8_UNORM,                R8,           R8,            SWIZ_X001, 16, true),
   FORMAT(R8_SNORM,                NO,           R8_SNORM,      SWIZ_X001, 16, true),
   FORMAT(R8_SINT,                 R8I,          R8I,           SWIZ_X001, 16, false),
   FORMAT(R8_UINT,                 R8UI,         R8UI,          SWIZ_X001, 16, false),

   FORMAT(R16_UNORM,               NO,           R16,           SWIZ_X001, 32, true),
   FORMAT(R16_SNORM,               NO,           R16_SNORM,     SWIZ_X001, 32, true),
   FORMAT(R16_SFLOAT,              R16F,         R16F,          SWIZ_X001, 16, true),
   FORMAT(R16_SINT,                R16I,         R16I,          SWIZ_X001, 16, false),
   FORMAT(R16_UINT,                R16UI,        R16UI,         SWIZ_X001, 16, false),

   FORMAT(R32_SFLOAT,              R32F,         R32F,          SWIZ_X001, 32, false),
   FORMAT(R32_SINT,                R32I,         R32I,          SWIZ_X001, 32, false),
   FORMAT(R32_UINT,                R32UI,        R32UI,         SWIZ_X001, 32, false),

   /* Color, packed */
   FORMAT(R4G4B4A4_UNORM_PACK16,   ABGR4444,     RGBA4,         SWIZ_XYZW, 16, true),
   FORMAT(B4G4R4A4_UNORM_PACK16,   ABGR4444,     RGBA4,         SWIZ_ZYXW, 16, true), /* Swap RB */
   FORMAT(R5G6B5_UNORM_PACK16,     BGR565,       RGB565,        SWIZ_XYZ1, 16, true),
   FORMAT(R5G5B5A1_UNORM_PACK16,   ABGR1555,     RGB5_A1,       SWIZ_XYZW, 16, true),
   FORMAT(A1R5G5B5_UNORM_PACK16,   RGBA5551,     A1_RGB5,       SWIZ_ZYXW, 16, true), /* Swap RB */
   FORMAT(A8B8G8R8_UNORM_PACK32,   RGBA8,        RGBA8,         SWIZ_XYZW, 16, true), /* RGBA8 UNORM */
   FORMAT(A8B8G8R8_SNORM_PACK32,   NO,           RGBA8_SNORM,   SWIZ_XYZW, 16, true), /* RGBA8 SNORM */
   FORMAT(A8B8G8R8_UINT_PACK32,    RGBA8UI,      RGBA8UI,       SWIZ_XYZW, 16, false), /* RGBA8 UINT */
   FORMAT(A8B8G8R8_SINT_PACK32,    RGBA8I,       RGBA8I,        SWIZ_XYZW, 16, false), /* RGBA8 SINT */
   FORMAT(A8B8G8R8_SRGB_PACK32,    SRGB8_ALPHA8, RGBA8,         SWIZ_XYZW, 16, true), /* RGBA8 sRGB */
   FORMAT(A2B10G10R10_UNORM_PACK32,RGB10_A2,     RGB10_A2,      SWIZ_XYZW, 16, true),
   FORMAT(A2B10G10R10_UINT_PACK32, RGB10_A2UI,   RGB10_A2UI,    SWIZ_XYZW, 16, false),
   FORMAT(E5B9G9R9_UFLOAT_PACK32,  NO,           RGB9_E5,       SWIZ_XYZ1, 16, true),
   FORMAT(B10G11R11_UFLOAT_PACK32, R11F_G11F_B10F,R11F_G11F_B10F, SWIZ_XYZ1, 16, true),

   /* Depth */
   FORMAT(D16_UNORM,               D16,          DEPTH_COMP16,  SWIZ_X001, 32, false),
   FORMAT(D32_SFLOAT,              D32F,         DEPTH_COMP32F, SWIZ_X001, 32, false),
   FORMAT(X8_D24_UNORM_PACK32,     D24S8,        DEPTH24_X8,    SWIZ_X001, 32, false),

   /* Depth + Stencil */
   FORMAT(D24_UNORM_S8_UINT,       D24S8,        DEPTH24_X8,    SWIZ_X001, 32, false),

   /* Compressed: ETC2 / EAC */
   FORMAT(ETC2_R8G8B8_UNORM_BLOCK,    NO,  RGB8_ETC2,                SWIZ_XYZ1, 16, true),
   FORMAT(ETC2_R8G8B8_SRGB_BLOCK,     NO,  RGB8_ETC2,                SWIZ_XYZ1, 16, true),
   FORMAT(ETC2_R8G8B8A1_UNORM_BLOCK,  NO,  RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, true),
   FORMAT(ETC2_R8G8B8A1_SRGB_BLOCK,   NO,  RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, true),
   FORMAT(ETC2_R8G8B8A8_UNORM_BLOCK,  NO,  RGBA8_ETC2_EAC,           SWIZ_XYZW, 16, true),
   FORMAT(ETC2_R8G8B8A8_SRGB_BLOCK,   NO,  RGBA8_ETC2_EAC,           SWIZ_XYZW, 16, true),
   FORMAT(EAC_R11_UNORM_BLOCK,        NO,  R11_EAC,                  SWIZ_X001, 16, true),
   FORMAT(EAC_R11_SNORM_BLOCK,        NO,  SIGNED_R11_EAC,           SWIZ_X001, 16, true),
   FORMAT(EAC_R11G11_UNORM_BLOCK,     NO,  RG11_EAC,                 SWIZ_XY01, 16, true),
   FORMAT(EAC_R11G11_SNORM_BLOCK,     NO,  SIGNED_RG11_EAC,          SWIZ_XY01, 16, true),

   /* Compressed: BC1-3 */
   FORMAT(BC1_RGB_UNORM_BLOCK,        NO,  BC1,                      SWIZ_XYZ1, 16, true),
   FORMAT(BC1_RGB_SRGB_BLOCK,         NO,  BC1,                      SWIZ_XYZ1, 16, true),
   FORMAT(BC1_RGBA_UNORM_BLOCK,       NO,  BC1,                      SWIZ_XYZW, 16, true),
   FORMAT(BC1_RGBA_SRGB_BLOCK,        NO,  BC1,                      SWIZ_XYZW, 16, true),
   FORMAT(BC2_UNORM_BLOCK,            NO,  BC2,                      SWIZ_XYZW, 16, true),
   FORMAT(BC2_SRGB_BLOCK,             NO,  BC2,                      SWIZ_XYZW, 16, true),
   FORMAT(BC3_UNORM_BLOCK,            NO,  BC3,                      SWIZ_XYZW, 16, true),
   FORMAT(BC3_SRGB_BLOCK,             NO,  BC3,                      SWIZ_XYZW, 16, true),

   /* Compressed: ASTC */
   FORMAT(ASTC_4x4_UNORM_BLOCK,       NO,  ASTC_4X4,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_4x4_SRGB_BLOCK,        NO,  ASTC_4X4,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_5x4_UNORM_BLOCK,       NO,  ASTC_5X4,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_5x4_SRGB_BLOCK,        NO,  ASTC_5X4,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_5x5_UNORM_BLOCK,       NO,  ASTC_5X5,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_5x5_SRGB_BLOCK,        NO,  ASTC_5X5,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_6x5_UNORM_BLOCK,       NO,  ASTC_6X5,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_6x5_SRGB_BLOCK,        NO,  ASTC_6X5,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_6x6_UNORM_BLOCK,       NO,  ASTC_6X6,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_6x6_SRGB_BLOCK,        NO,  ASTC_6X6,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_8x5_UNORM_BLOCK,       NO,  ASTC_8X5,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_8x5_SRGB_BLOCK,        NO,  ASTC_8X5,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_8x6_UNORM_BLOCK,       NO,  ASTC_8X6,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_8x6_SRGB_BLOCK,        NO,  ASTC_8X6,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_8x8_UNORM_BLOCK,       NO,  ASTC_8X8,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_8x8_SRGB_BLOCK,        NO,  ASTC_8X8,                 SWIZ_XYZW, 16, true),
   FORMAT(ASTC_10x5_UNORM_BLOCK,      NO,  ASTC_10X5,                SWIZ_XYZW, 16, true),
   FORMAT(ASTC_10x5_SRGB_BLOCK,       NO,  ASTC_10X5,                SWIZ_XYZW, 16, true),
   FORMAT(ASTC_10x6_UNORM_BLOCK,      NO,  ASTC_10X6,                SWIZ_XYZW, 16, true),
   FORMAT(ASTC_10x6_SRGB_BLOCK,       NO,  ASTC_10X6,                SWIZ_XYZW, 16, true),
   FORMAT(ASTC_10x8_UNORM_BLOCK,      NO,  ASTC_10X8,                SWIZ_XYZW, 16, true),
   FORMAT(ASTC_10x8_SRGB_BLOCK,       NO,  ASTC_10X8,                SWIZ_XYZW, 16, true),
   FORMAT(ASTC_10x10_UNORM_BLOCK,     NO,  ASTC_10X10,               SWIZ_XYZW, 16, true),
   FORMAT(ASTC_10x10_SRGB_BLOCK,      NO,  ASTC_10X10,               SWIZ_XYZW, 16, true),
   FORMAT(ASTC_12x10_UNORM_BLOCK,     NO,  ASTC_12X10,               SWIZ_XYZW, 16, true),
   FORMAT(ASTC_12x10_SRGB_BLOCK,      NO,  ASTC_12X10,               SWIZ_XYZW, 16, true),
   FORMAT(ASTC_12x12_UNORM_BLOCK,     NO,  ASTC_12X12,               SWIZ_XYZW, 16, true),
   FORMAT(ASTC_12x12_SRGB_BLOCK,      NO,  ASTC_12X12,               SWIZ_XYZW, 16, true),
};
198 
199 const struct v3dv_format *
v3dX(get_format)200 v3dX(get_format)(VkFormat format)
201 {
202    if (format < ARRAY_SIZE(format_table) && format_table[format].supported)
203       return &format_table[format];
204    else
205       return NULL;
206 }
207 
208 void
v3dX(get_internal_type_bpp_for_output_format)209 v3dX(get_internal_type_bpp_for_output_format)(uint32_t format,
210                                               uint32_t *type,
211                                               uint32_t *bpp)
212 {
213    switch (format) {
214    case V3D_OUTPUT_IMAGE_FORMAT_RGBA8:
215    case V3D_OUTPUT_IMAGE_FORMAT_RGB8:
216    case V3D_OUTPUT_IMAGE_FORMAT_RG8:
217    case V3D_OUTPUT_IMAGE_FORMAT_R8:
218    case V3D_OUTPUT_IMAGE_FORMAT_ABGR4444:
219    case V3D_OUTPUT_IMAGE_FORMAT_BGR565:
220    case V3D_OUTPUT_IMAGE_FORMAT_ABGR1555:
221       *type = V3D_INTERNAL_TYPE_8;
222       *bpp = V3D_INTERNAL_BPP_32;
223       break;
224 
225    case V3D_OUTPUT_IMAGE_FORMAT_RGBA8I:
226    case V3D_OUTPUT_IMAGE_FORMAT_RG8I:
227    case V3D_OUTPUT_IMAGE_FORMAT_R8I:
228       *type = V3D_INTERNAL_TYPE_8I;
229       *bpp = V3D_INTERNAL_BPP_32;
230       break;
231 
232    case V3D_OUTPUT_IMAGE_FORMAT_RGBA8UI:
233    case V3D_OUTPUT_IMAGE_FORMAT_RG8UI:
234    case V3D_OUTPUT_IMAGE_FORMAT_R8UI:
235       *type = V3D_INTERNAL_TYPE_8UI;
236       *bpp = V3D_INTERNAL_BPP_32;
237       break;
238 
239    case V3D_OUTPUT_IMAGE_FORMAT_SRGB8_ALPHA8:
240    case V3D_OUTPUT_IMAGE_FORMAT_SRGB:
241    case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2:
242    case V3D_OUTPUT_IMAGE_FORMAT_R11F_G11F_B10F:
243    case V3D_OUTPUT_IMAGE_FORMAT_RGBA16F:
244       /* Note that sRGB RTs are stored in the tile buffer at 16F,
245        * and the conversion to sRGB happens at tilebuffer load/store.
246        */
247       *type = V3D_INTERNAL_TYPE_16F;
248       *bpp = V3D_INTERNAL_BPP_64;
249       break;
250 
251    case V3D_OUTPUT_IMAGE_FORMAT_RG16F:
252    case V3D_OUTPUT_IMAGE_FORMAT_R16F:
253       *type = V3D_INTERNAL_TYPE_16F;
254       /* Use 64bpp to make sure the TLB doesn't throw away the alpha
255        * channel before alpha test happens.
256        */
257       *bpp = V3D_INTERNAL_BPP_64;
258       break;
259 
260    case V3D_OUTPUT_IMAGE_FORMAT_RGBA16I:
261       *type = V3D_INTERNAL_TYPE_16I;
262       *bpp = V3D_INTERNAL_BPP_64;
263       break;
264 
265    case V3D_OUTPUT_IMAGE_FORMAT_RG16I:
266    case V3D_OUTPUT_IMAGE_FORMAT_R16I:
267       *type = V3D_INTERNAL_TYPE_16I;
268       *bpp = V3D_INTERNAL_BPP_32;
269       break;
270 
271    case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2UI:
272    case V3D_OUTPUT_IMAGE_FORMAT_RGBA16UI:
273       *type = V3D_INTERNAL_TYPE_16UI;
274       *bpp = V3D_INTERNAL_BPP_64;
275       break;
276 
277    case V3D_OUTPUT_IMAGE_FORMAT_RG16UI:
278    case V3D_OUTPUT_IMAGE_FORMAT_R16UI:
279       *type = V3D_INTERNAL_TYPE_16UI;
280       *bpp = V3D_INTERNAL_BPP_32;
281       break;
282 
283    case V3D_OUTPUT_IMAGE_FORMAT_RGBA32I:
284       *type = V3D_INTERNAL_TYPE_32I;
285       *bpp = V3D_INTERNAL_BPP_128;
286       break;
287 
288    case V3D_OUTPUT_IMAGE_FORMAT_RG32I:
289       *type = V3D_INTERNAL_TYPE_32I;
290       *bpp = V3D_INTERNAL_BPP_64;
291       break;
292 
293    case V3D_OUTPUT_IMAGE_FORMAT_R32I:
294       *type = V3D_INTERNAL_TYPE_32I;
295       *bpp = V3D_INTERNAL_BPP_32;
296       break;
297 
298    case V3D_OUTPUT_IMAGE_FORMAT_RGBA32UI:
299       *type = V3D_INTERNAL_TYPE_32UI;
300       *bpp = V3D_INTERNAL_BPP_128;
301       break;
302 
303    case V3D_OUTPUT_IMAGE_FORMAT_RG32UI:
304       *type = V3D_INTERNAL_TYPE_32UI;
305       *bpp = V3D_INTERNAL_BPP_64;
306       break;
307 
308    case V3D_OUTPUT_IMAGE_FORMAT_R32UI:
309       *type = V3D_INTERNAL_TYPE_32UI;
310       *bpp = V3D_INTERNAL_BPP_32;
311       break;
312 
313    case V3D_OUTPUT_IMAGE_FORMAT_RGBA32F:
314       *type = V3D_INTERNAL_TYPE_32F;
315       *bpp = V3D_INTERNAL_BPP_128;
316       break;
317 
318    case V3D_OUTPUT_IMAGE_FORMAT_RG32F:
319       *type = V3D_INTERNAL_TYPE_32F;
320       *bpp = V3D_INTERNAL_BPP_64;
321       break;
322 
323    case V3D_OUTPUT_IMAGE_FORMAT_R32F:
324       *type = V3D_INTERNAL_TYPE_32F;
325       *bpp = V3D_INTERNAL_BPP_32;
326       break;
327 
328    default:
329       /* Provide some default values, as we'll be called at RB
330        * creation time, even if an RB with this format isn't supported.
331        */
332       *type = V3D_INTERNAL_TYPE_8;
333       *bpp = V3D_INTERNAL_BPP_32;
334       break;
335    }
336 }
337 
338 bool
v3dX(format_supports_tlb_resolve)339 v3dX(format_supports_tlb_resolve)(const struct v3dv_format *format)
340 {
341    uint32_t type, bpp;
342    v3dX(get_internal_type_bpp_for_output_format)(format->rt_type, &type, &bpp);
343    return type == V3D_INTERNAL_TYPE_8 || type == V3D_INTERNAL_TYPE_16F;
344 }
345 
346 bool
v3dX(format_supports_blending)347 v3dX(format_supports_blending)(const struct v3dv_format *format)
348 {
349    /* Hardware blending is only supported on render targets that are configured
350     * 4x8-bit unorm, 2x16-bit float or 4x16-bit float.
351     */
352    uint32_t type, bpp;
353    v3dX(get_internal_type_bpp_for_output_format)(format->rt_type, &type, &bpp);
354    switch (type) {
355    case V3D_INTERNAL_TYPE_8:
356       return bpp == V3D_INTERNAL_BPP_32;
357    case V3D_INTERNAL_TYPE_16F:
358       return bpp == V3D_INTERNAL_BPP_32 || V3D_INTERNAL_BPP_64;
359    default:
360       return false;
361    }
362 }
363 
364 bool
v3dX(tfu_supports_tex_format)365 v3dX(tfu_supports_tex_format)(uint32_t tex_format)
366 {
367    switch (tex_format) {
368    case TEXTURE_DATA_FORMAT_R8:
369    case TEXTURE_DATA_FORMAT_R8_SNORM:
370    case TEXTURE_DATA_FORMAT_RG8:
371    case TEXTURE_DATA_FORMAT_RG8_SNORM:
372    case TEXTURE_DATA_FORMAT_RGBA8:
373    case TEXTURE_DATA_FORMAT_RGBA8_SNORM:
374    case TEXTURE_DATA_FORMAT_RGB565:
375    case TEXTURE_DATA_FORMAT_RGBA4:
376    case TEXTURE_DATA_FORMAT_RGB5_A1:
377    case TEXTURE_DATA_FORMAT_RGB10_A2:
378    case TEXTURE_DATA_FORMAT_R16:
379    case TEXTURE_DATA_FORMAT_R16_SNORM:
380    case TEXTURE_DATA_FORMAT_RG16:
381    case TEXTURE_DATA_FORMAT_RG16_SNORM:
382    case TEXTURE_DATA_FORMAT_RGBA16:
383    case TEXTURE_DATA_FORMAT_RGBA16_SNORM:
384    case TEXTURE_DATA_FORMAT_R16F:
385    case TEXTURE_DATA_FORMAT_RG16F:
386    case TEXTURE_DATA_FORMAT_RGBA16F:
387    case TEXTURE_DATA_FORMAT_R11F_G11F_B10F:
388    case TEXTURE_DATA_FORMAT_R4:
389    case TEXTURE_DATA_FORMAT_RGB9_E5:
390    case TEXTURE_DATA_FORMAT_R32F:
391    case TEXTURE_DATA_FORMAT_RG32F:
392    case TEXTURE_DATA_FORMAT_RGBA32F:
393    case TEXTURE_DATA_FORMAT_RGB8_ETC2:
394    case TEXTURE_DATA_FORMAT_RGB8_PUNCHTHROUGH_ALPHA1:
395    case TEXTURE_DATA_FORMAT_RGBA8_ETC2_EAC:
396    case TEXTURE_DATA_FORMAT_R11_EAC:
397    case TEXTURE_DATA_FORMAT_SIGNED_R11_EAC:
398    case TEXTURE_DATA_FORMAT_RG11_EAC:
399    case TEXTURE_DATA_FORMAT_SIGNED_RG11_EAC:
400       return true;
401    default:
402       return false;
403    }
404 }
405 
406 uint8_t
v3dX(get_internal_depth_type)407 v3dX(get_internal_depth_type)(VkFormat format)
408 {
409    switch (format) {
410    case VK_FORMAT_D16_UNORM:
411       return V3D_INTERNAL_TYPE_DEPTH_16;
412    case VK_FORMAT_D32_SFLOAT:
413       return V3D_INTERNAL_TYPE_DEPTH_32F;
414    case VK_FORMAT_X8_D24_UNORM_PACK32:
415    case VK_FORMAT_D24_UNORM_S8_UINT:
416       return V3D_INTERNAL_TYPE_DEPTH_24;
417    default:
418       unreachable("Invalid depth format");
419       break;
420    }
421 }
422 
423 void
v3dX(get_internal_type_bpp_for_image_aspects)424 v3dX(get_internal_type_bpp_for_image_aspects)(VkFormat vk_format,
425                                               VkImageAspectFlags aspect_mask,
426                                               uint32_t *internal_type,
427                                               uint32_t *internal_bpp)
428 {
429    const VkImageAspectFlags ds_aspects = VK_IMAGE_ASPECT_DEPTH_BIT |
430                                          VK_IMAGE_ASPECT_STENCIL_BIT;
431 
432    /* We can't store depth/stencil pixel formats to a raster format, so
433     * so instead we load our depth/stencil aspects to a compatible color
434     * format.
435     */
436    /* FIXME: pre-compute this at image creation time? */
437    if (aspect_mask & ds_aspects) {
438       switch (vk_format) {
439       case VK_FORMAT_D16_UNORM:
440          *internal_type = V3D_INTERNAL_TYPE_16UI;
441          *internal_bpp = V3D_INTERNAL_BPP_64;
442          break;
443       case VK_FORMAT_D32_SFLOAT:
444          *internal_type = V3D_INTERNAL_TYPE_32F;
445          *internal_bpp = V3D_INTERNAL_BPP_128;
446          break;
447       case VK_FORMAT_X8_D24_UNORM_PACK32:
448       case VK_FORMAT_D24_UNORM_S8_UINT:
449          /* Use RGBA8 format so we can relocate the X/S bits in the appropriate
450           * place to match Vulkan expectations. See the comment on the tile
451           * load command for more details.
452           */
453          *internal_type = V3D_INTERNAL_TYPE_8UI;
454          *internal_bpp = V3D_INTERNAL_BPP_32;
455          break;
456       default:
457          assert(!"unsupported format");
458          break;
459       }
460    } else {
461       const struct v3dv_format *format = v3dX(get_format)(vk_format);
462       v3dX(get_internal_type_bpp_for_output_format)(format->rt_type,
463                                                     internal_type, internal_bpp);
464    }
465 }
466