1 /*
2  * Copyright © 2021 Raspberry Pi Ltd
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  */
23 
24 #include "v3dv_private.h"
25 #include "broadcom/common/v3d_macros.h"
26 #include "broadcom/cle/v3dx_pack.h"
27 
28 #include "util/format/u_format.h"
29 #include "vulkan/util/vk_util.h"
30 
/* Builds the brace-enclosed initializer for a four-component swizzle. Each
 * argument is pasted onto PIPE_SWIZZLE_ to name the selector used for the
 * corresponding output component.
 */
#define SWIZ(c0, c1, c2, c3) \
   { PIPE_SWIZZLE_##c0, PIPE_SWIZZLE_##c1, PIPE_SWIZZLE_##c2, PIPE_SWIZZLE_##c3 }

/* Emits one designated entry of a v3dv_format table, stored at index
 * VK_ENUM_OFFSET(VK_FORMAT_<vk_name>). The positional initializers are, in
 * order: a constant true (presumably the `supported` flag that the lookup
 * code tests -- confirm against the struct declaration), the
 * V3D_OUTPUT_IMAGE_FORMAT_<rt_name> value, the TEXTURE_DATA_FORMAT_<tex_name>
 * value, the swizzle initializer, the return size and the filtering flag.
 */
#define FORMAT(vk_name, rt_name, tex_name, swizzle, ret_size, filterable) \
   [VK_ENUM_OFFSET(VK_FORMAT_##vk_name)] = {                              \
      true,                                                               \
      V3D_OUTPUT_IMAGE_FORMAT_##rt_name,                                  \
      TEXTURE_DATA_FORMAT_##tex_name,                                     \
      swizzle,                                                            \
      ret_size,                                                           \
      filterable,                                                         \
   }

/* Swizzle presets: in-order selections with constant fill. */
#define SWIZ_XYZW SWIZ(X, Y, Z, W)
#define SWIZ_XYZ1 SWIZ(X, Y, Z, 1)
#define SWIZ_XY01 SWIZ(X, Y, 0, 1)
#define SWIZ_X001 SWIZ(X, 0, 0, 1)

/* Swizzle presets: first and third components exchanged. */
#define SWIZ_ZYXW SWIZ(Z, Y, X, W)
#define SWIZ_ZYX1 SWIZ(Z, Y, X, 1)

/* Swizzle presets: rotations and full reversal. */
#define SWIZ_YZWX SWIZ(Y, Z, W, X)
#define SWIZ_YZW1 SWIZ(Y, Z, W, 1)
#define SWIZ_WXYZ SWIZ(W, X, Y, Z)
#define SWIZ_WZYX SWIZ(W, Z, Y, X)

/* Swizzle presets: replication of the first component. */
#define SWIZ_XXXY SWIZ(X, X, X, Y)
#define SWIZ_XXX1 SWIZ(X, X, X, 1)
#define SWIZ_XXXX SWIZ(X, X, X, X)
#define SWIZ_000X SWIZ(0, 0, 0, X)
62 
63 /* FIXME: expand format table to describe whether the format is supported
64  * for buffer surfaces (texel buffers, vertex buffers, etc).
65  */
66 static const struct v3dv_format format_table[] = {
67    /* Color, 4 channels */
68    FORMAT(B8G8R8A8_SRGB,           SRGB8_ALPHA8, RGBA8,         SWIZ_ZYXW, 16, true),
69    FORMAT(B8G8R8A8_UNORM,          RGBA8,        RGBA8,         SWIZ_ZYXW, 16, true),
70 
71    FORMAT(R8G8B8A8_SRGB,           SRGB8_ALPHA8, RGBA8,         SWIZ_XYZW, 16, true),
72    FORMAT(R8G8B8A8_UNORM,          RGBA8,        RGBA8,         SWIZ_XYZW, 16, true),
73    FORMAT(R8G8B8A8_SNORM,          NO,           RGBA8_SNORM,   SWIZ_XYZW, 16, true),
74    FORMAT(R8G8B8A8_SINT,           RGBA8I,       RGBA8I,        SWIZ_XYZW, 16, false),
75    FORMAT(R8G8B8A8_UINT,           RGBA8UI,      RGBA8UI,       SWIZ_XYZW, 16, false),
76 
77    FORMAT(R16G16B16A16_SFLOAT,     RGBA16F,      RGBA16F,       SWIZ_XYZW, 16, true),
78    FORMAT(R16G16B16A16_UNORM,      NO,           RGBA16,        SWIZ_XYZW, 32, true),
79    FORMAT(R16G16B16A16_SNORM,      NO,           RGBA16_SNORM,  SWIZ_XYZW, 32, true),
80    FORMAT(R16G16B16A16_SINT,       RGBA16I,      RGBA16I,       SWIZ_XYZW, 16, false),
81    FORMAT(R16G16B16A16_UINT,       RGBA16UI,     RGBA16UI,      SWIZ_XYZW, 16, false),
82 
83    FORMAT(R32G32B32A32_SFLOAT,     RGBA32F,      RGBA32F,       SWIZ_XYZW, 32, false),
84    FORMAT(R32G32B32A32_SINT,       RGBA32I,      RGBA32I,       SWIZ_XYZW, 32, false),
85    FORMAT(R32G32B32A32_UINT,       RGBA32UI,     RGBA32UI,      SWIZ_XYZW, 32, false),
86 
87    /* Color, 3 channels */
88    FORMAT(R32G32B32_SFLOAT,        NO,           NO,            SWIZ_XYZ1,  0, false),
89    FORMAT(R32G32B32_UINT,          NO,           NO,            SWIZ_XYZ1,  0, false),
90    FORMAT(R32G32B32_SINT,          NO,           NO,            SWIZ_XYZ1,  0, false),
91 
92    /* Color, 2 channels */
93    FORMAT(R8G8_UNORM,              RG8,          RG8,           SWIZ_XY01, 16, true),
94    FORMAT(R8G8_SNORM,              NO,           RG8_SNORM,     SWIZ_XY01, 16, true),
95    FORMAT(R8G8_SINT,               RG8I,         RG8I,          SWIZ_XY01, 16, false),
96    FORMAT(R8G8_UINT,               RG8UI,        RG8UI,         SWIZ_XY01, 16, false),
97 
98    FORMAT(R16G16_UNORM,            NO,           RG16,          SWIZ_XY01, 32, true),
99    FORMAT(R16G16_SNORM,            NO,           RG16_SNORM,    SWIZ_XY01, 32, true),
100    FORMAT(R16G16_SFLOAT,           RG16F,        RG16F,         SWIZ_XY01, 16, true),
101    FORMAT(R16G16_SINT,             RG16I,        RG16I,         SWIZ_XY01, 16, false),
102    FORMAT(R16G16_UINT,             RG16UI,       RG16UI,        SWIZ_XY01, 16, false),
103 
104    FORMAT(R32G32_SFLOAT,           RG32F,        RG32F,         SWIZ_XY01, 32, false),
105    FORMAT(R32G32_SINT,             RG32I,        RG32I,         SWIZ_XY01, 32, false),
106    FORMAT(R32G32_UINT,             RG32UI,       RG32UI,        SWIZ_XY01, 32, false),
107 
108    /* Color, 1 channel */
109    FORMAT(R8_UNORM,                R8,           R8,            SWIZ_X001, 16, true),
110    FORMAT(R8_SNORM,                NO,           R8_SNORM,      SWIZ_X001, 16, true),
111    FORMAT(R8_SINT,                 R8I,          R8I,           SWIZ_X001, 16, false),
112    FORMAT(R8_UINT,                 R8UI,         R8UI,          SWIZ_X001, 16, false),
113 
114    FORMAT(R16_UNORM,               NO,           R16,           SWIZ_X001, 32, true),
115    FORMAT(R16_SNORM,               NO,           R16_SNORM,     SWIZ_X001, 32, true),
116    FORMAT(R16_SFLOAT,              R16F,         R16F,          SWIZ_X001, 16, true),
117    FORMAT(R16_SINT,                R16I,         R16I,          SWIZ_X001, 16, false),
118    FORMAT(R16_UINT,                R16UI,        R16UI,         SWIZ_X001, 16, false),
119 
120    FORMAT(R32_SFLOAT,              R32F,         R32F,          SWIZ_X001, 32, false),
121    FORMAT(R32_SINT,                R32I,         R32I,          SWIZ_X001, 32, false),
122    FORMAT(R32_UINT,                R32UI,        R32UI,         SWIZ_X001, 32, false),
123 
124    /* Color, packed */
125    FORMAT(R4G4B4A4_UNORM_PACK16,   ABGR4444,     RGBA4,         SWIZ_XYZW, 16, true),
126    FORMAT(B4G4R4A4_UNORM_PACK16,   ABGR4444,     RGBA4,         SWIZ_ZYXW, 16, true), /* Swap RB */
127    FORMAT(R5G6B5_UNORM_PACK16,     BGR565,       RGB565,        SWIZ_XYZ1, 16, true),
128    FORMAT(R5G5B5A1_UNORM_PACK16,   ABGR1555,     RGB5_A1,       SWIZ_XYZW, 16, true),
129    FORMAT(A1R5G5B5_UNORM_PACK16,   RGBA5551,     A1_RGB5,       SWIZ_ZYXW, 16, true), /* Swap RB */
130    FORMAT(A8B8G8R8_UNORM_PACK32,   RGBA8,        RGBA8,         SWIZ_XYZW, 16, true), /* RGBA8 UNORM */
131    FORMAT(A8B8G8R8_SNORM_PACK32,   NO,           RGBA8_SNORM,   SWIZ_XYZW, 16, true), /* RGBA8 SNORM */
132    FORMAT(A8B8G8R8_UINT_PACK32,    RGBA8UI,      RGBA8UI,       SWIZ_XYZW, 16, false), /* RGBA8 UINT */
133    FORMAT(A8B8G8R8_SINT_PACK32,    RGBA8I,       RGBA8I,        SWIZ_XYZW, 16, false), /* RGBA8 SINT */
134    FORMAT(A8B8G8R8_SRGB_PACK32,    SRGB8_ALPHA8, RGBA8,         SWIZ_XYZW, 16, true), /* RGBA8 sRGB */
135    FORMAT(A2B10G10R10_UNORM_PACK32,RGB10_A2,     RGB10_A2,      SWIZ_XYZW, 16, true),
136    FORMAT(A2B10G10R10_UINT_PACK32, RGB10_A2UI,   RGB10_A2UI,    SWIZ_XYZW, 16, false),
137    FORMAT(E5B9G9R9_UFLOAT_PACK32,  NO,           RGB9_E5,       SWIZ_XYZ1, 16, true),
138    FORMAT(B10G11R11_UFLOAT_PACK32, R11F_G11F_B10F,R11F_G11F_B10F, SWIZ_XYZ1, 16, true),
139 
140    /* Depth */
141    FORMAT(D16_UNORM,               D16,          DEPTH_COMP16,  SWIZ_X001, 32, false),
142    FORMAT(D32_SFLOAT,              D32F,         DEPTH_COMP32F, SWIZ_X001, 32, false),
143    FORMAT(X8_D24_UNORM_PACK32,     D24S8,        DEPTH24_X8,    SWIZ_X001, 32, false),
144 
145    /* Depth + Stencil */
146    FORMAT(D24_UNORM_S8_UINT,       D24S8,        DEPTH24_X8,    SWIZ_X001, 32, false),
147 
148    /* Compressed: ETC2 / EAC */
149    FORMAT(ETC2_R8G8B8_UNORM_BLOCK,    NO,  RGB8_ETC2,                SWIZ_XYZ1, 16, true),
150    FORMAT(ETC2_R8G8B8_SRGB_BLOCK,     NO,  RGB8_ETC2,                SWIZ_XYZ1, 16, true),
151    FORMAT(ETC2_R8G8B8A1_UNORM_BLOCK,  NO,  RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, true),
152    FORMAT(ETC2_R8G8B8A1_SRGB_BLOCK,   NO,  RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, true),
153    FORMAT(ETC2_R8G8B8A8_UNORM_BLOCK,  NO,  RGBA8_ETC2_EAC,           SWIZ_XYZW, 16, true),
154    FORMAT(ETC2_R8G8B8A8_SRGB_BLOCK,   NO,  RGBA8_ETC2_EAC,           SWIZ_XYZW, 16, true),
155    FORMAT(EAC_R11_UNORM_BLOCK,        NO,  R11_EAC,                  SWIZ_X001, 16, true),
156    FORMAT(EAC_R11_SNORM_BLOCK,        NO,  SIGNED_R11_EAC,           SWIZ_X001, 16, true),
157    FORMAT(EAC_R11G11_UNORM_BLOCK,     NO,  RG11_EAC,                 SWIZ_XY01, 16, true),
158    FORMAT(EAC_R11G11_SNORM_BLOCK,     NO,  SIGNED_RG11_EAC,          SWIZ_XY01, 16, true),
159 
160    /* Compressed: BC1-3 */
161    FORMAT(BC1_RGB_UNORM_BLOCK,        NO,  BC1,                      SWIZ_XYZ1, 16, true),
162    FORMAT(BC1_RGB_SRGB_BLOCK,         NO,  BC1,                      SWIZ_XYZ1, 16, true),
163    FORMAT(BC1_RGBA_UNORM_BLOCK,       NO,  BC1,                      SWIZ_XYZW, 16, true),
164    FORMAT(BC1_RGBA_SRGB_BLOCK,        NO,  BC1,                      SWIZ_XYZW, 16, true),
165    FORMAT(BC2_UNORM_BLOCK,            NO,  BC2,                      SWIZ_XYZW, 16, true),
166    FORMAT(BC2_SRGB_BLOCK,             NO,  BC2,                      SWIZ_XYZW, 16, true),
167    FORMAT(BC3_UNORM_BLOCK,            NO,  BC3,                      SWIZ_XYZW, 16, true),
168    FORMAT(BC3_SRGB_BLOCK,             NO,  BC3,                      SWIZ_XYZW, 16, true),
169 
170    /* Compressed: ASTC */
171    FORMAT(ASTC_4x4_UNORM_BLOCK,       NO,  ASTC_4X4,                 SWIZ_XYZW, 16, true),
172    FORMAT(ASTC_4x4_SRGB_BLOCK,        NO,  ASTC_4X4,                 SWIZ_XYZW, 16, true),
173    FORMAT(ASTC_5x4_UNORM_BLOCK,       NO,  ASTC_5X4,                 SWIZ_XYZW, 16, true),
174    FORMAT(ASTC_5x4_SRGB_BLOCK,        NO,  ASTC_5X4,                 SWIZ_XYZW, 16, true),
175    FORMAT(ASTC_5x5_UNORM_BLOCK,       NO,  ASTC_5X5,                 SWIZ_XYZW, 16, true),
176    FORMAT(ASTC_5x5_SRGB_BLOCK,        NO,  ASTC_5X5,                 SWIZ_XYZW, 16, true),
177    FORMAT(ASTC_6x5_UNORM_BLOCK,       NO,  ASTC_6X5,                 SWIZ_XYZW, 16, true),
178    FORMAT(ASTC_6x5_SRGB_BLOCK,        NO,  ASTC_6X5,                 SWIZ_XYZW, 16, true),
179    FORMAT(ASTC_6x6_UNORM_BLOCK,       NO,  ASTC_6X6,                 SWIZ_XYZW, 16, true),
180    FORMAT(ASTC_6x6_SRGB_BLOCK,        NO,  ASTC_6X6,                 SWIZ_XYZW, 16, true),
181    FORMAT(ASTC_8x5_UNORM_BLOCK,       NO,  ASTC_8X5,                 SWIZ_XYZW, 16, true),
182    FORMAT(ASTC_8x5_SRGB_BLOCK,        NO,  ASTC_8X5,                 SWIZ_XYZW, 16, true),
183    FORMAT(ASTC_8x6_UNORM_BLOCK,       NO,  ASTC_8X6,                 SWIZ_XYZW, 16, true),
184    FORMAT(ASTC_8x6_SRGB_BLOCK,        NO,  ASTC_8X6,                 SWIZ_XYZW, 16, true),
185    FORMAT(ASTC_8x8_UNORM_BLOCK,       NO,  ASTC_8X8,                 SWIZ_XYZW, 16, true),
186    FORMAT(ASTC_8x8_SRGB_BLOCK,        NO,  ASTC_8X8,                 SWIZ_XYZW, 16, true),
187    FORMAT(ASTC_10x5_UNORM_BLOCK,      NO,  ASTC_10X5,                SWIZ_XYZW, 16, true),
188    FORMAT(ASTC_10x5_SRGB_BLOCK,       NO,  ASTC_10X5,                SWIZ_XYZW, 16, true),
189    FORMAT(ASTC_10x6_UNORM_BLOCK,      NO,  ASTC_10X6,                SWIZ_XYZW, 16, true),
190    FORMAT(ASTC_10x6_SRGB_BLOCK,       NO,  ASTC_10X6,                SWIZ_XYZW, 16, true),
191    FORMAT(ASTC_10x8_UNORM_BLOCK,      NO,  ASTC_10X8,                SWIZ_XYZW, 16, true),
192    FORMAT(ASTC_10x8_SRGB_BLOCK,       NO,  ASTC_10X8,                SWIZ_XYZW, 16, true),
193    FORMAT(ASTC_10x10_UNORM_BLOCK,     NO,  ASTC_10X10,               SWIZ_XYZW, 16, true),
194    FORMAT(ASTC_10x10_SRGB_BLOCK,      NO,  ASTC_10X10,               SWIZ_XYZW, 16, true),
195    FORMAT(ASTC_12x10_UNORM_BLOCK,     NO,  ASTC_12X10,               SWIZ_XYZW, 16, true),
196    FORMAT(ASTC_12x10_SRGB_BLOCK,      NO,  ASTC_12X10,               SWIZ_XYZW, 16, true),
197    FORMAT(ASTC_12x12_UNORM_BLOCK,     NO,  ASTC_12X12,               SWIZ_XYZW, 16, true),
198    FORMAT(ASTC_12x12_SRGB_BLOCK,      NO,  ASTC_12X12,               SWIZ_XYZW, 16, true),
199 };
200 
201 /**
202  * Vulkan layout for 4444 formats is defined like this:
203  *
204  * Vulkan ABGR4: (LSB) R | G | B | A (MSB)
205  * Vulkan ARGB4: (LSB) B | G | R | A (MSB)
206  *
207  * We map this to the V3D RGB4 texture format, which really, is ABGR4 with
208  * R in the MSB, so:
209  *
210  * V3D ABGR4   : (LSB) A | B | G | R (MSB)
211  *
212  * Which is reversed from Vulkan's ABGR4 layout. So in order to match Vulkan
213  * semantics we need to apply the following swizzles:
214  *
215  * ABGR4: WZYX (reverse)
216  * ARGB4: YZWX (reverse + swap R/B)
217  */
218 static const struct v3dv_format format_table_4444[] = {
219    FORMAT(A4B4G4R4_UNORM_PACK16_EXT, ABGR4444, RGBA4, SWIZ_WZYX, 16, true), /* Reverse */
220    FORMAT(A4R4G4B4_UNORM_PACK16_EXT, ABGR4444, RGBA4, SWIZ_YZWX, 16, true), /* Reverse + RB swap */
221 };
222 
223 const struct v3dv_format *
get_format(VkFormat format)224 v3dX(get_format)(VkFormat format)
225 {
226    /* Core formats */
227    if (format < ARRAY_SIZE(format_table) && format_table[format].supported)
228       return &format_table[format];
229 
230    switch (format) {
231    /* VK_EXT_4444_formats */
232    case VK_FORMAT_A4R4G4B4_UNORM_PACK16:
233    case VK_FORMAT_A4B4G4R4_UNORM_PACK16:
234       return &format_table_4444[VK_ENUM_OFFSET(format)];
235 
236    default:
237       return NULL;
238    }
239 }
240 
241 void
get_internal_type_bpp_for_output_format(uint32_t format, uint32_t *type, uint32_t *bpp)242 v3dX(get_internal_type_bpp_for_output_format)(uint32_t format,
243                                               uint32_t *type,
244                                               uint32_t *bpp)
245 {
246    switch (format) {
247    case V3D_OUTPUT_IMAGE_FORMAT_RGBA8:
248    case V3D_OUTPUT_IMAGE_FORMAT_RGB8:
249    case V3D_OUTPUT_IMAGE_FORMAT_RG8:
250    case V3D_OUTPUT_IMAGE_FORMAT_R8:
251    case V3D_OUTPUT_IMAGE_FORMAT_ABGR4444:
252    case V3D_OUTPUT_IMAGE_FORMAT_BGR565:
253    case V3D_OUTPUT_IMAGE_FORMAT_ABGR1555:
254       *type = V3D_INTERNAL_TYPE_8;
255       *bpp = V3D_INTERNAL_BPP_32;
256       break;
257 
258    case V3D_OUTPUT_IMAGE_FORMAT_RGBA8I:
259    case V3D_OUTPUT_IMAGE_FORMAT_RG8I:
260    case V3D_OUTPUT_IMAGE_FORMAT_R8I:
261       *type = V3D_INTERNAL_TYPE_8I;
262       *bpp = V3D_INTERNAL_BPP_32;
263       break;
264 
265    case V3D_OUTPUT_IMAGE_FORMAT_RGBA8UI:
266    case V3D_OUTPUT_IMAGE_FORMAT_RG8UI:
267    case V3D_OUTPUT_IMAGE_FORMAT_R8UI:
268       *type = V3D_INTERNAL_TYPE_8UI;
269       *bpp = V3D_INTERNAL_BPP_32;
270       break;
271 
272    case V3D_OUTPUT_IMAGE_FORMAT_SRGB8_ALPHA8:
273    case V3D_OUTPUT_IMAGE_FORMAT_SRGB:
274    case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2:
275    case V3D_OUTPUT_IMAGE_FORMAT_R11F_G11F_B10F:
276    case V3D_OUTPUT_IMAGE_FORMAT_RGBA16F:
277       /* Note that sRGB RTs are stored in the tile buffer at 16F,
278        * and the conversion to sRGB happens at tilebuffer load/store.
279        */
280       *type = V3D_INTERNAL_TYPE_16F;
281       *bpp = V3D_INTERNAL_BPP_64;
282       break;
283 
284    case V3D_OUTPUT_IMAGE_FORMAT_RG16F:
285    case V3D_OUTPUT_IMAGE_FORMAT_R16F:
286       *type = V3D_INTERNAL_TYPE_16F;
287       /* Use 64bpp to make sure the TLB doesn't throw away the alpha
288        * channel before alpha test happens.
289        */
290       *bpp = V3D_INTERNAL_BPP_64;
291       break;
292 
293    case V3D_OUTPUT_IMAGE_FORMAT_RGBA16I:
294       *type = V3D_INTERNAL_TYPE_16I;
295       *bpp = V3D_INTERNAL_BPP_64;
296       break;
297 
298    case V3D_OUTPUT_IMAGE_FORMAT_RG16I:
299    case V3D_OUTPUT_IMAGE_FORMAT_R16I:
300       *type = V3D_INTERNAL_TYPE_16I;
301       *bpp = V3D_INTERNAL_BPP_32;
302       break;
303 
304    case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2UI:
305    case V3D_OUTPUT_IMAGE_FORMAT_RGBA16UI:
306       *type = V3D_INTERNAL_TYPE_16UI;
307       *bpp = V3D_INTERNAL_BPP_64;
308       break;
309 
310    case V3D_OUTPUT_IMAGE_FORMAT_RG16UI:
311    case V3D_OUTPUT_IMAGE_FORMAT_R16UI:
312       *type = V3D_INTERNAL_TYPE_16UI;
313       *bpp = V3D_INTERNAL_BPP_32;
314       break;
315 
316    case V3D_OUTPUT_IMAGE_FORMAT_RGBA32I:
317       *type = V3D_INTERNAL_TYPE_32I;
318       *bpp = V3D_INTERNAL_BPP_128;
319       break;
320 
321    case V3D_OUTPUT_IMAGE_FORMAT_RG32I:
322       *type = V3D_INTERNAL_TYPE_32I;
323       *bpp = V3D_INTERNAL_BPP_64;
324       break;
325 
326    case V3D_OUTPUT_IMAGE_FORMAT_R32I:
327       *type = V3D_INTERNAL_TYPE_32I;
328       *bpp = V3D_INTERNAL_BPP_32;
329       break;
330 
331    case V3D_OUTPUT_IMAGE_FORMAT_RGBA32UI:
332       *type = V3D_INTERNAL_TYPE_32UI;
333       *bpp = V3D_INTERNAL_BPP_128;
334       break;
335 
336    case V3D_OUTPUT_IMAGE_FORMAT_RG32UI:
337       *type = V3D_INTERNAL_TYPE_32UI;
338       *bpp = V3D_INTERNAL_BPP_64;
339       break;
340 
341    case V3D_OUTPUT_IMAGE_FORMAT_R32UI:
342       *type = V3D_INTERNAL_TYPE_32UI;
343       *bpp = V3D_INTERNAL_BPP_32;
344       break;
345 
346    case V3D_OUTPUT_IMAGE_FORMAT_RGBA32F:
347       *type = V3D_INTERNAL_TYPE_32F;
348       *bpp = V3D_INTERNAL_BPP_128;
349       break;
350 
351    case V3D_OUTPUT_IMAGE_FORMAT_RG32F:
352       *type = V3D_INTERNAL_TYPE_32F;
353       *bpp = V3D_INTERNAL_BPP_64;
354       break;
355 
356    case V3D_OUTPUT_IMAGE_FORMAT_R32F:
357       *type = V3D_INTERNAL_TYPE_32F;
358       *bpp = V3D_INTERNAL_BPP_32;
359       break;
360 
361    default:
362       /* Provide some default values, as we'll be called at RB
363        * creation time, even if an RB with this format isn't supported.
364        */
365       *type = V3D_INTERNAL_TYPE_8;
366       *bpp = V3D_INTERNAL_BPP_32;
367       break;
368    }
369 }
370 
371 bool
format_supports_tlb_resolve(const struct v3dv_format *format)372 v3dX(format_supports_tlb_resolve)(const struct v3dv_format *format)
373 {
374    uint32_t type, bpp;
375    v3dX(get_internal_type_bpp_for_output_format)(format->rt_type, &type, &bpp);
376    return type == V3D_INTERNAL_TYPE_8 || type == V3D_INTERNAL_TYPE_16F;
377 }
378 
379 bool
format_supports_blending(const struct v3dv_format *format)380 v3dX(format_supports_blending)(const struct v3dv_format *format)
381 {
382    /* Hardware blending is only supported on render targets that are configured
383     * 4x8-bit unorm, 2x16-bit float or 4x16-bit float.
384     */
385    uint32_t type, bpp;
386    v3dX(get_internal_type_bpp_for_output_format)(format->rt_type, &type, &bpp);
387    switch (type) {
388    case V3D_INTERNAL_TYPE_8:
389       return bpp == V3D_INTERNAL_BPP_32;
390    case V3D_INTERNAL_TYPE_16F:
391       return bpp == V3D_INTERNAL_BPP_32 || V3D_INTERNAL_BPP_64;
392    default:
393       return false;
394    }
395 }
396 
397 bool
tfu_supports_tex_format(uint32_t tex_format)398 v3dX(tfu_supports_tex_format)(uint32_t tex_format)
399 {
400    switch (tex_format) {
401    case TEXTURE_DATA_FORMAT_R8:
402    case TEXTURE_DATA_FORMAT_R8_SNORM:
403    case TEXTURE_DATA_FORMAT_RG8:
404    case TEXTURE_DATA_FORMAT_RG8_SNORM:
405    case TEXTURE_DATA_FORMAT_RGBA8:
406    case TEXTURE_DATA_FORMAT_RGBA8_SNORM:
407    case TEXTURE_DATA_FORMAT_RGB565:
408    case TEXTURE_DATA_FORMAT_RGBA4:
409    case TEXTURE_DATA_FORMAT_RGB5_A1:
410    case TEXTURE_DATA_FORMAT_RGB10_A2:
411    case TEXTURE_DATA_FORMAT_R16:
412    case TEXTURE_DATA_FORMAT_R16_SNORM:
413    case TEXTURE_DATA_FORMAT_RG16:
414    case TEXTURE_DATA_FORMAT_RG16_SNORM:
415    case TEXTURE_DATA_FORMAT_RGBA16:
416    case TEXTURE_DATA_FORMAT_RGBA16_SNORM:
417    case TEXTURE_DATA_FORMAT_R16F:
418    case TEXTURE_DATA_FORMAT_RG16F:
419    case TEXTURE_DATA_FORMAT_RGBA16F:
420    case TEXTURE_DATA_FORMAT_R11F_G11F_B10F:
421    case TEXTURE_DATA_FORMAT_R4:
422    case TEXTURE_DATA_FORMAT_RGB9_E5:
423    case TEXTURE_DATA_FORMAT_R32F:
424    case TEXTURE_DATA_FORMAT_RG32F:
425    case TEXTURE_DATA_FORMAT_RGBA32F:
426    case TEXTURE_DATA_FORMAT_RGB8_ETC2:
427    case TEXTURE_DATA_FORMAT_RGB8_PUNCHTHROUGH_ALPHA1:
428    case TEXTURE_DATA_FORMAT_RGBA8_ETC2_EAC:
429    case TEXTURE_DATA_FORMAT_R11_EAC:
430    case TEXTURE_DATA_FORMAT_SIGNED_R11_EAC:
431    case TEXTURE_DATA_FORMAT_RG11_EAC:
432    case TEXTURE_DATA_FORMAT_SIGNED_RG11_EAC:
433       return true;
434    default:
435       return false;
436    }
437 }
438 
439 uint8_t
get_internal_depth_type(VkFormat format)440 v3dX(get_internal_depth_type)(VkFormat format)
441 {
442    switch (format) {
443    case VK_FORMAT_D16_UNORM:
444       return V3D_INTERNAL_TYPE_DEPTH_16;
445    case VK_FORMAT_D32_SFLOAT:
446       return V3D_INTERNAL_TYPE_DEPTH_32F;
447    case VK_FORMAT_X8_D24_UNORM_PACK32:
448    case VK_FORMAT_D24_UNORM_S8_UINT:
449       return V3D_INTERNAL_TYPE_DEPTH_24;
450    default:
451       unreachable("Invalid depth format");
452       break;
453    }
454 }
455 
456 void
get_internal_type_bpp_for_image_aspects(VkFormat vk_format, VkImageAspectFlags aspect_mask, uint32_t *internal_type, uint32_t *internal_bpp)457 v3dX(get_internal_type_bpp_for_image_aspects)(VkFormat vk_format,
458                                               VkImageAspectFlags aspect_mask,
459                                               uint32_t *internal_type,
460                                               uint32_t *internal_bpp)
461 {
462    /* We can't store depth/stencil pixel formats to a raster format, so
463     * instead we load our depth/stencil aspects to a compatible color format.
464     */
465    if (aspect_mask & (VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT)) {
466       *internal_bpp = V3D_INTERNAL_BPP_32;
467       switch (vk_format) {
468       case VK_FORMAT_D16_UNORM:
469          *internal_type = V3D_INTERNAL_TYPE_16UI;
470          break;
471       case VK_FORMAT_D32_SFLOAT:
472          *internal_type = V3D_INTERNAL_TYPE_32F;
473          break;
474       case VK_FORMAT_X8_D24_UNORM_PACK32:
475       case VK_FORMAT_D24_UNORM_S8_UINT:
476          /* Use RGBA8 format so we can relocate the X/S bits in the appropriate
477           * place to match Vulkan expectations. See the comment on the tile
478           * load command for more details.
479           */
480          *internal_type = V3D_INTERNAL_TYPE_8UI;
481          break;
482       default:
483          assert(!"unsupported format");
484          break;
485       }
486    } else {
487       const struct v3dv_format *format = v3dX(get_format)(vk_format);
488       v3dX(get_internal_type_bpp_for_output_format)(format->rt_type,
489                                                     internal_type, internal_bpp);
490    }
491 }
492