1 /*
2 * Copyright © 2021 Raspberry Pi Ltd
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include "v3dv_private.h"
25 #include "broadcom/common/v3d_macros.h"
26 #include "broadcom/cle/v3dx_pack.h"
27
28 #include "util/format/u_format.h"
29 #include "vulkan/util/vk_util.h"
30
/* Expands to a four-entry swizzle initializer, pasting each argument onto
 * the PIPE_SWIZZLE_ prefix.
 */
#define SWIZ(x,y,z,w) { PIPE_SWIZZLE_##x, PIPE_SWIZZLE_##y, \
                        PIPE_SWIZZLE_##z, PIPE_SWIZZLE_##w }

/* Expands to one designated array element, indexed by the VK_ENUM_OFFSET()
 * of VK_FORMAT_<vk>. The members are initialized positionally, so the order
 * used here has to follow the member order of the table's element type. The
 * leading `true` is presumably the `supported` flag that get_format() tests
 * (NOTE(review): confirm against the struct v3dv_format declaration).
 */
#define FORMAT(vk, rt, tex, swiz, return_size, supports_filtering)   \
   [VK_ENUM_OFFSET(VK_FORMAT_##vk)] = {                              \
      true,                                                          \
      V3D_OUTPUT_IMAGE_FORMAT_##rt, TEXTURE_DATA_FORMAT_##tex,       \
      swiz, return_size, supports_filtering,                         \
   }

/* Named shorthands for the swizzles used by the format tables. */
#define SWIZ_X001   SWIZ(X, 0, 0, 1)
#define SWIZ_XY01   SWIZ(X, Y, 0, 1)
#define SWIZ_XYZ1   SWIZ(X, Y, Z, 1)
#define SWIZ_XYZW   SWIZ(X, Y, Z, W)
#define SWIZ_YZWX   SWIZ(Y, Z, W, X)
#define SWIZ_YZW1   SWIZ(Y, Z, W, 1)
#define SWIZ_ZYXW   SWIZ(Z, Y, X, W)
#define SWIZ_ZYX1   SWIZ(Z, Y, X, 1)
#define SWIZ_XXXY   SWIZ(X, X, X, Y)
#define SWIZ_XXX1   SWIZ(X, X, X, 1)
#define SWIZ_XXXX   SWIZ(X, X, X, X)
#define SWIZ_000X   SWIZ(0, 0, 0, X)
#define SWIZ_WXYZ   SWIZ(W, X, Y, Z)
#define SWIZ_WZYX   SWIZ(W, Z, Y, X)
62
63 /* FIXME: expand format table to describe whether the format is supported
64 * for buffer surfaces (texel buffers, vertex buffers, etc).
65 */
66 static const struct v3dv_format format_table[] = {
67 /* Color, 4 channels */
68 FORMAT(B8G8R8A8_SRGB, SRGB8_ALPHA8, RGBA8, SWIZ_ZYXW, 16, true),
69 FORMAT(B8G8R8A8_UNORM, RGBA8, RGBA8, SWIZ_ZYXW, 16, true),
70
71 FORMAT(R8G8B8A8_SRGB, SRGB8_ALPHA8, RGBA8, SWIZ_XYZW, 16, true),
72 FORMAT(R8G8B8A8_UNORM, RGBA8, RGBA8, SWIZ_XYZW, 16, true),
73 FORMAT(R8G8B8A8_SNORM, NO, RGBA8_SNORM, SWIZ_XYZW, 16, true),
74 FORMAT(R8G8B8A8_SINT, RGBA8I, RGBA8I, SWIZ_XYZW, 16, false),
75 FORMAT(R8G8B8A8_UINT, RGBA8UI, RGBA8UI, SWIZ_XYZW, 16, false),
76
77 FORMAT(R16G16B16A16_SFLOAT, RGBA16F, RGBA16F, SWIZ_XYZW, 16, true),
78 FORMAT(R16G16B16A16_UNORM, NO, RGBA16, SWIZ_XYZW, 32, true),
79 FORMAT(R16G16B16A16_SNORM, NO, RGBA16_SNORM, SWIZ_XYZW, 32, true),
80 FORMAT(R16G16B16A16_SINT, RGBA16I, RGBA16I, SWIZ_XYZW, 16, false),
81 FORMAT(R16G16B16A16_UINT, RGBA16UI, RGBA16UI, SWIZ_XYZW, 16, false),
82
83 FORMAT(R32G32B32A32_SFLOAT, RGBA32F, RGBA32F, SWIZ_XYZW, 32, false),
84 FORMAT(R32G32B32A32_SINT, RGBA32I, RGBA32I, SWIZ_XYZW, 32, false),
85 FORMAT(R32G32B32A32_UINT, RGBA32UI, RGBA32UI, SWIZ_XYZW, 32, false),
86
87 /* Color, 3 channels */
88 FORMAT(R32G32B32_SFLOAT, NO, NO, SWIZ_XYZ1, 0, false),
89 FORMAT(R32G32B32_UINT, NO, NO, SWIZ_XYZ1, 0, false),
90 FORMAT(R32G32B32_SINT, NO, NO, SWIZ_XYZ1, 0, false),
91
92 /* Color, 2 channels */
93 FORMAT(R8G8_UNORM, RG8, RG8, SWIZ_XY01, 16, true),
94 FORMAT(R8G8_SNORM, NO, RG8_SNORM, SWIZ_XY01, 16, true),
95 FORMAT(R8G8_SINT, RG8I, RG8I, SWIZ_XY01, 16, false),
96 FORMAT(R8G8_UINT, RG8UI, RG8UI, SWIZ_XY01, 16, false),
97
98 FORMAT(R16G16_UNORM, NO, RG16, SWIZ_XY01, 32, true),
99 FORMAT(R16G16_SNORM, NO, RG16_SNORM, SWIZ_XY01, 32, true),
100 FORMAT(R16G16_SFLOAT, RG16F, RG16F, SWIZ_XY01, 16, true),
101 FORMAT(R16G16_SINT, RG16I, RG16I, SWIZ_XY01, 16, false),
102 FORMAT(R16G16_UINT, RG16UI, RG16UI, SWIZ_XY01, 16, false),
103
104 FORMAT(R32G32_SFLOAT, RG32F, RG32F, SWIZ_XY01, 32, false),
105 FORMAT(R32G32_SINT, RG32I, RG32I, SWIZ_XY01, 32, false),
106 FORMAT(R32G32_UINT, RG32UI, RG32UI, SWIZ_XY01, 32, false),
107
108 /* Color, 1 channel */
109 FORMAT(R8_UNORM, R8, R8, SWIZ_X001, 16, true),
110 FORMAT(R8_SNORM, NO, R8_SNORM, SWIZ_X001, 16, true),
111 FORMAT(R8_SINT, R8I, R8I, SWIZ_X001, 16, false),
112 FORMAT(R8_UINT, R8UI, R8UI, SWIZ_X001, 16, false),
113
114 FORMAT(R16_UNORM, NO, R16, SWIZ_X001, 32, true),
115 FORMAT(R16_SNORM, NO, R16_SNORM, SWIZ_X001, 32, true),
116 FORMAT(R16_SFLOAT, R16F, R16F, SWIZ_X001, 16, true),
117 FORMAT(R16_SINT, R16I, R16I, SWIZ_X001, 16, false),
118 FORMAT(R16_UINT, R16UI, R16UI, SWIZ_X001, 16, false),
119
120 FORMAT(R32_SFLOAT, R32F, R32F, SWIZ_X001, 32, false),
121 FORMAT(R32_SINT, R32I, R32I, SWIZ_X001, 32, false),
122 FORMAT(R32_UINT, R32UI, R32UI, SWIZ_X001, 32, false),
123
124 /* Color, packed */
125 FORMAT(R4G4B4A4_UNORM_PACK16, ABGR4444, RGBA4, SWIZ_XYZW, 16, true),
126 FORMAT(B4G4R4A4_UNORM_PACK16, ABGR4444, RGBA4, SWIZ_ZYXW, 16, true), /* Swap RB */
127 FORMAT(R5G6B5_UNORM_PACK16, BGR565, RGB565, SWIZ_XYZ1, 16, true),
128 FORMAT(R5G5B5A1_UNORM_PACK16, ABGR1555, RGB5_A1, SWIZ_XYZW, 16, true),
129 FORMAT(A1R5G5B5_UNORM_PACK16, RGBA5551, A1_RGB5, SWIZ_ZYXW, 16, true), /* Swap RB */
130 FORMAT(A8B8G8R8_UNORM_PACK32, RGBA8, RGBA8, SWIZ_XYZW, 16, true), /* RGBA8 UNORM */
131 FORMAT(A8B8G8R8_SNORM_PACK32, NO, RGBA8_SNORM, SWIZ_XYZW, 16, true), /* RGBA8 SNORM */
132 FORMAT(A8B8G8R8_UINT_PACK32, RGBA8UI, RGBA8UI, SWIZ_XYZW, 16, false), /* RGBA8 UINT */
133 FORMAT(A8B8G8R8_SINT_PACK32, RGBA8I, RGBA8I, SWIZ_XYZW, 16, false), /* RGBA8 SINT */
134 FORMAT(A8B8G8R8_SRGB_PACK32, SRGB8_ALPHA8, RGBA8, SWIZ_XYZW, 16, true), /* RGBA8 sRGB */
135 FORMAT(A2B10G10R10_UNORM_PACK32,RGB10_A2, RGB10_A2, SWIZ_XYZW, 16, true),
136 FORMAT(A2B10G10R10_UINT_PACK32, RGB10_A2UI, RGB10_A2UI, SWIZ_XYZW, 16, false),
137 FORMAT(E5B9G9R9_UFLOAT_PACK32, NO, RGB9_E5, SWIZ_XYZ1, 16, true),
138 FORMAT(B10G11R11_UFLOAT_PACK32, R11F_G11F_B10F,R11F_G11F_B10F, SWIZ_XYZ1, 16, true),
139
140 /* Depth */
141 FORMAT(D16_UNORM, D16, DEPTH_COMP16, SWIZ_X001, 32, false),
142 FORMAT(D32_SFLOAT, D32F, DEPTH_COMP32F, SWIZ_X001, 32, false),
143 FORMAT(X8_D24_UNORM_PACK32, D24S8, DEPTH24_X8, SWIZ_X001, 32, false),
144
145 /* Depth + Stencil */
146 FORMAT(D24_UNORM_S8_UINT, D24S8, DEPTH24_X8, SWIZ_X001, 32, false),
147
148 /* Compressed: ETC2 / EAC */
149 FORMAT(ETC2_R8G8B8_UNORM_BLOCK, NO, RGB8_ETC2, SWIZ_XYZ1, 16, true),
150 FORMAT(ETC2_R8G8B8_SRGB_BLOCK, NO, RGB8_ETC2, SWIZ_XYZ1, 16, true),
151 FORMAT(ETC2_R8G8B8A1_UNORM_BLOCK, NO, RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, true),
152 FORMAT(ETC2_R8G8B8A1_SRGB_BLOCK, NO, RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, true),
153 FORMAT(ETC2_R8G8B8A8_UNORM_BLOCK, NO, RGBA8_ETC2_EAC, SWIZ_XYZW, 16, true),
154 FORMAT(ETC2_R8G8B8A8_SRGB_BLOCK, NO, RGBA8_ETC2_EAC, SWIZ_XYZW, 16, true),
155 FORMAT(EAC_R11_UNORM_BLOCK, NO, R11_EAC, SWIZ_X001, 16, true),
156 FORMAT(EAC_R11_SNORM_BLOCK, NO, SIGNED_R11_EAC, SWIZ_X001, 16, true),
157 FORMAT(EAC_R11G11_UNORM_BLOCK, NO, RG11_EAC, SWIZ_XY01, 16, true),
158 FORMAT(EAC_R11G11_SNORM_BLOCK, NO, SIGNED_RG11_EAC, SWIZ_XY01, 16, true),
159
160 /* Compressed: BC1-3 */
161 FORMAT(BC1_RGB_UNORM_BLOCK, NO, BC1, SWIZ_XYZ1, 16, true),
162 FORMAT(BC1_RGB_SRGB_BLOCK, NO, BC1, SWIZ_XYZ1, 16, true),
163 FORMAT(BC1_RGBA_UNORM_BLOCK, NO, BC1, SWIZ_XYZW, 16, true),
164 FORMAT(BC1_RGBA_SRGB_BLOCK, NO, BC1, SWIZ_XYZW, 16, true),
165 FORMAT(BC2_UNORM_BLOCK, NO, BC2, SWIZ_XYZW, 16, true),
166 FORMAT(BC2_SRGB_BLOCK, NO, BC2, SWIZ_XYZW, 16, true),
167 FORMAT(BC3_UNORM_BLOCK, NO, BC3, SWIZ_XYZW, 16, true),
168 FORMAT(BC3_SRGB_BLOCK, NO, BC3, SWIZ_XYZW, 16, true),
169
170 /* Compressed: ASTC */
171 FORMAT(ASTC_4x4_UNORM_BLOCK, NO, ASTC_4X4, SWIZ_XYZW, 16, true),
172 FORMAT(ASTC_4x4_SRGB_BLOCK, NO, ASTC_4X4, SWIZ_XYZW, 16, true),
173 FORMAT(ASTC_5x4_UNORM_BLOCK, NO, ASTC_5X4, SWIZ_XYZW, 16, true),
174 FORMAT(ASTC_5x4_SRGB_BLOCK, NO, ASTC_5X4, SWIZ_XYZW, 16, true),
175 FORMAT(ASTC_5x5_UNORM_BLOCK, NO, ASTC_5X5, SWIZ_XYZW, 16, true),
176 FORMAT(ASTC_5x5_SRGB_BLOCK, NO, ASTC_5X5, SWIZ_XYZW, 16, true),
177 FORMAT(ASTC_6x5_UNORM_BLOCK, NO, ASTC_6X5, SWIZ_XYZW, 16, true),
178 FORMAT(ASTC_6x5_SRGB_BLOCK, NO, ASTC_6X5, SWIZ_XYZW, 16, true),
179 FORMAT(ASTC_6x6_UNORM_BLOCK, NO, ASTC_6X6, SWIZ_XYZW, 16, true),
180 FORMAT(ASTC_6x6_SRGB_BLOCK, NO, ASTC_6X6, SWIZ_XYZW, 16, true),
181 FORMAT(ASTC_8x5_UNORM_BLOCK, NO, ASTC_8X5, SWIZ_XYZW, 16, true),
182 FORMAT(ASTC_8x5_SRGB_BLOCK, NO, ASTC_8X5, SWIZ_XYZW, 16, true),
183 FORMAT(ASTC_8x6_UNORM_BLOCK, NO, ASTC_8X6, SWIZ_XYZW, 16, true),
184 FORMAT(ASTC_8x6_SRGB_BLOCK, NO, ASTC_8X6, SWIZ_XYZW, 16, true),
185 FORMAT(ASTC_8x8_UNORM_BLOCK, NO, ASTC_8X8, SWIZ_XYZW, 16, true),
186 FORMAT(ASTC_8x8_SRGB_BLOCK, NO, ASTC_8X8, SWIZ_XYZW, 16, true),
187 FORMAT(ASTC_10x5_UNORM_BLOCK, NO, ASTC_10X5, SWIZ_XYZW, 16, true),
188 FORMAT(ASTC_10x5_SRGB_BLOCK, NO, ASTC_10X5, SWIZ_XYZW, 16, true),
189 FORMAT(ASTC_10x6_UNORM_BLOCK, NO, ASTC_10X6, SWIZ_XYZW, 16, true),
190 FORMAT(ASTC_10x6_SRGB_BLOCK, NO, ASTC_10X6, SWIZ_XYZW, 16, true),
191 FORMAT(ASTC_10x8_UNORM_BLOCK, NO, ASTC_10X8, SWIZ_XYZW, 16, true),
192 FORMAT(ASTC_10x8_SRGB_BLOCK, NO, ASTC_10X8, SWIZ_XYZW, 16, true),
193 FORMAT(ASTC_10x10_UNORM_BLOCK, NO, ASTC_10X10, SWIZ_XYZW, 16, true),
194 FORMAT(ASTC_10x10_SRGB_BLOCK, NO, ASTC_10X10, SWIZ_XYZW, 16, true),
195 FORMAT(ASTC_12x10_UNORM_BLOCK, NO, ASTC_12X10, SWIZ_XYZW, 16, true),
196 FORMAT(ASTC_12x10_SRGB_BLOCK, NO, ASTC_12X10, SWIZ_XYZW, 16, true),
197 FORMAT(ASTC_12x12_UNORM_BLOCK, NO, ASTC_12X12, SWIZ_XYZW, 16, true),
198 FORMAT(ASTC_12x12_SRGB_BLOCK, NO, ASTC_12X12, SWIZ_XYZW, 16, true),
199 };
200
201 /**
202 * Vulkan layout for 4444 formats is defined like this:
203 *
204 * Vulkan ABGR4: (LSB) R | G | B | A (MSB)
205 * Vulkan ARGB4: (LSB) B | G | R | A (MSB)
206 *
207 * We map this to the V3D RGB4 texture format, which really, is ABGR4 with
208 * R in the MSB, so:
209 *
210 * V3D ABGR4 : (LSB) A | B | G | R (MSB)
211 *
212 * Which is reversed from Vulkan's ABGR4 layout. So in order to match Vulkan
213 * semantics we need to apply the following swizzles:
214 *
215 * ABGR4: WZYX (reverse)
216 * ARGB4: YZWX (reverse + swap R/B)
217 */
218 static const struct v3dv_format format_table_4444[] = {
219 FORMAT(A4B4G4R4_UNORM_PACK16_EXT, ABGR4444, RGBA4, SWIZ_WZYX, 16, true), /* Reverse */
220 FORMAT(A4R4G4B4_UNORM_PACK16_EXT, ABGR4444, RGBA4, SWIZ_YZWX, 16, true), /* Reverse + RB swap */
221 };
222
223 const struct v3dv_format *
get_format(VkFormat format)224 v3dX(get_format)(VkFormat format)
225 {
226 /* Core formats */
227 if (format < ARRAY_SIZE(format_table) && format_table[format].supported)
228 return &format_table[format];
229
230 switch (format) {
231 /* VK_EXT_4444_formats */
232 case VK_FORMAT_A4R4G4B4_UNORM_PACK16:
233 case VK_FORMAT_A4B4G4R4_UNORM_PACK16:
234 return &format_table_4444[VK_ENUM_OFFSET(format)];
235
236 default:
237 return NULL;
238 }
239 }
240
241 void
get_internal_type_bpp_for_output_format(uint32_t format, uint32_t *type, uint32_t *bpp)242 v3dX(get_internal_type_bpp_for_output_format)(uint32_t format,
243 uint32_t *type,
244 uint32_t *bpp)
245 {
246 switch (format) {
247 case V3D_OUTPUT_IMAGE_FORMAT_RGBA8:
248 case V3D_OUTPUT_IMAGE_FORMAT_RGB8:
249 case V3D_OUTPUT_IMAGE_FORMAT_RG8:
250 case V3D_OUTPUT_IMAGE_FORMAT_R8:
251 case V3D_OUTPUT_IMAGE_FORMAT_ABGR4444:
252 case V3D_OUTPUT_IMAGE_FORMAT_BGR565:
253 case V3D_OUTPUT_IMAGE_FORMAT_ABGR1555:
254 *type = V3D_INTERNAL_TYPE_8;
255 *bpp = V3D_INTERNAL_BPP_32;
256 break;
257
258 case V3D_OUTPUT_IMAGE_FORMAT_RGBA8I:
259 case V3D_OUTPUT_IMAGE_FORMAT_RG8I:
260 case V3D_OUTPUT_IMAGE_FORMAT_R8I:
261 *type = V3D_INTERNAL_TYPE_8I;
262 *bpp = V3D_INTERNAL_BPP_32;
263 break;
264
265 case V3D_OUTPUT_IMAGE_FORMAT_RGBA8UI:
266 case V3D_OUTPUT_IMAGE_FORMAT_RG8UI:
267 case V3D_OUTPUT_IMAGE_FORMAT_R8UI:
268 *type = V3D_INTERNAL_TYPE_8UI;
269 *bpp = V3D_INTERNAL_BPP_32;
270 break;
271
272 case V3D_OUTPUT_IMAGE_FORMAT_SRGB8_ALPHA8:
273 case V3D_OUTPUT_IMAGE_FORMAT_SRGB:
274 case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2:
275 case V3D_OUTPUT_IMAGE_FORMAT_R11F_G11F_B10F:
276 case V3D_OUTPUT_IMAGE_FORMAT_RGBA16F:
277 /* Note that sRGB RTs are stored in the tile buffer at 16F,
278 * and the conversion to sRGB happens at tilebuffer load/store.
279 */
280 *type = V3D_INTERNAL_TYPE_16F;
281 *bpp = V3D_INTERNAL_BPP_64;
282 break;
283
284 case V3D_OUTPUT_IMAGE_FORMAT_RG16F:
285 case V3D_OUTPUT_IMAGE_FORMAT_R16F:
286 *type = V3D_INTERNAL_TYPE_16F;
287 /* Use 64bpp to make sure the TLB doesn't throw away the alpha
288 * channel before alpha test happens.
289 */
290 *bpp = V3D_INTERNAL_BPP_64;
291 break;
292
293 case V3D_OUTPUT_IMAGE_FORMAT_RGBA16I:
294 *type = V3D_INTERNAL_TYPE_16I;
295 *bpp = V3D_INTERNAL_BPP_64;
296 break;
297
298 case V3D_OUTPUT_IMAGE_FORMAT_RG16I:
299 case V3D_OUTPUT_IMAGE_FORMAT_R16I:
300 *type = V3D_INTERNAL_TYPE_16I;
301 *bpp = V3D_INTERNAL_BPP_32;
302 break;
303
304 case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2UI:
305 case V3D_OUTPUT_IMAGE_FORMAT_RGBA16UI:
306 *type = V3D_INTERNAL_TYPE_16UI;
307 *bpp = V3D_INTERNAL_BPP_64;
308 break;
309
310 case V3D_OUTPUT_IMAGE_FORMAT_RG16UI:
311 case V3D_OUTPUT_IMAGE_FORMAT_R16UI:
312 *type = V3D_INTERNAL_TYPE_16UI;
313 *bpp = V3D_INTERNAL_BPP_32;
314 break;
315
316 case V3D_OUTPUT_IMAGE_FORMAT_RGBA32I:
317 *type = V3D_INTERNAL_TYPE_32I;
318 *bpp = V3D_INTERNAL_BPP_128;
319 break;
320
321 case V3D_OUTPUT_IMAGE_FORMAT_RG32I:
322 *type = V3D_INTERNAL_TYPE_32I;
323 *bpp = V3D_INTERNAL_BPP_64;
324 break;
325
326 case V3D_OUTPUT_IMAGE_FORMAT_R32I:
327 *type = V3D_INTERNAL_TYPE_32I;
328 *bpp = V3D_INTERNAL_BPP_32;
329 break;
330
331 case V3D_OUTPUT_IMAGE_FORMAT_RGBA32UI:
332 *type = V3D_INTERNAL_TYPE_32UI;
333 *bpp = V3D_INTERNAL_BPP_128;
334 break;
335
336 case V3D_OUTPUT_IMAGE_FORMAT_RG32UI:
337 *type = V3D_INTERNAL_TYPE_32UI;
338 *bpp = V3D_INTERNAL_BPP_64;
339 break;
340
341 case V3D_OUTPUT_IMAGE_FORMAT_R32UI:
342 *type = V3D_INTERNAL_TYPE_32UI;
343 *bpp = V3D_INTERNAL_BPP_32;
344 break;
345
346 case V3D_OUTPUT_IMAGE_FORMAT_RGBA32F:
347 *type = V3D_INTERNAL_TYPE_32F;
348 *bpp = V3D_INTERNAL_BPP_128;
349 break;
350
351 case V3D_OUTPUT_IMAGE_FORMAT_RG32F:
352 *type = V3D_INTERNAL_TYPE_32F;
353 *bpp = V3D_INTERNAL_BPP_64;
354 break;
355
356 case V3D_OUTPUT_IMAGE_FORMAT_R32F:
357 *type = V3D_INTERNAL_TYPE_32F;
358 *bpp = V3D_INTERNAL_BPP_32;
359 break;
360
361 default:
362 /* Provide some default values, as we'll be called at RB
363 * creation time, even if an RB with this format isn't supported.
364 */
365 *type = V3D_INTERNAL_TYPE_8;
366 *bpp = V3D_INTERNAL_BPP_32;
367 break;
368 }
369 }
370
371 bool
format_supports_tlb_resolve(const struct v3dv_format *format)372 v3dX(format_supports_tlb_resolve)(const struct v3dv_format *format)
373 {
374 uint32_t type, bpp;
375 v3dX(get_internal_type_bpp_for_output_format)(format->rt_type, &type, &bpp);
376 return type == V3D_INTERNAL_TYPE_8 || type == V3D_INTERNAL_TYPE_16F;
377 }
378
379 bool
format_supports_blending(const struct v3dv_format *format)380 v3dX(format_supports_blending)(const struct v3dv_format *format)
381 {
382 /* Hardware blending is only supported on render targets that are configured
383 * 4x8-bit unorm, 2x16-bit float or 4x16-bit float.
384 */
385 uint32_t type, bpp;
386 v3dX(get_internal_type_bpp_for_output_format)(format->rt_type, &type, &bpp);
387 switch (type) {
388 case V3D_INTERNAL_TYPE_8:
389 return bpp == V3D_INTERNAL_BPP_32;
390 case V3D_INTERNAL_TYPE_16F:
391 return bpp == V3D_INTERNAL_BPP_32 || V3D_INTERNAL_BPP_64;
392 default:
393 return false;
394 }
395 }
396
397 bool
tfu_supports_tex_format(uint32_t tex_format)398 v3dX(tfu_supports_tex_format)(uint32_t tex_format)
399 {
400 switch (tex_format) {
401 case TEXTURE_DATA_FORMAT_R8:
402 case TEXTURE_DATA_FORMAT_R8_SNORM:
403 case TEXTURE_DATA_FORMAT_RG8:
404 case TEXTURE_DATA_FORMAT_RG8_SNORM:
405 case TEXTURE_DATA_FORMAT_RGBA8:
406 case TEXTURE_DATA_FORMAT_RGBA8_SNORM:
407 case TEXTURE_DATA_FORMAT_RGB565:
408 case TEXTURE_DATA_FORMAT_RGBA4:
409 case TEXTURE_DATA_FORMAT_RGB5_A1:
410 case TEXTURE_DATA_FORMAT_RGB10_A2:
411 case TEXTURE_DATA_FORMAT_R16:
412 case TEXTURE_DATA_FORMAT_R16_SNORM:
413 case TEXTURE_DATA_FORMAT_RG16:
414 case TEXTURE_DATA_FORMAT_RG16_SNORM:
415 case TEXTURE_DATA_FORMAT_RGBA16:
416 case TEXTURE_DATA_FORMAT_RGBA16_SNORM:
417 case TEXTURE_DATA_FORMAT_R16F:
418 case TEXTURE_DATA_FORMAT_RG16F:
419 case TEXTURE_DATA_FORMAT_RGBA16F:
420 case TEXTURE_DATA_FORMAT_R11F_G11F_B10F:
421 case TEXTURE_DATA_FORMAT_R4:
422 case TEXTURE_DATA_FORMAT_RGB9_E5:
423 case TEXTURE_DATA_FORMAT_R32F:
424 case TEXTURE_DATA_FORMAT_RG32F:
425 case TEXTURE_DATA_FORMAT_RGBA32F:
426 case TEXTURE_DATA_FORMAT_RGB8_ETC2:
427 case TEXTURE_DATA_FORMAT_RGB8_PUNCHTHROUGH_ALPHA1:
428 case TEXTURE_DATA_FORMAT_RGBA8_ETC2_EAC:
429 case TEXTURE_DATA_FORMAT_R11_EAC:
430 case TEXTURE_DATA_FORMAT_SIGNED_R11_EAC:
431 case TEXTURE_DATA_FORMAT_RG11_EAC:
432 case TEXTURE_DATA_FORMAT_SIGNED_RG11_EAC:
433 return true;
434 default:
435 return false;
436 }
437 }
438
439 uint8_t
get_internal_depth_type(VkFormat format)440 v3dX(get_internal_depth_type)(VkFormat format)
441 {
442 switch (format) {
443 case VK_FORMAT_D16_UNORM:
444 return V3D_INTERNAL_TYPE_DEPTH_16;
445 case VK_FORMAT_D32_SFLOAT:
446 return V3D_INTERNAL_TYPE_DEPTH_32F;
447 case VK_FORMAT_X8_D24_UNORM_PACK32:
448 case VK_FORMAT_D24_UNORM_S8_UINT:
449 return V3D_INTERNAL_TYPE_DEPTH_24;
450 default:
451 unreachable("Invalid depth format");
452 break;
453 }
454 }
455
456 void
get_internal_type_bpp_for_image_aspects(VkFormat vk_format, VkImageAspectFlags aspect_mask, uint32_t *internal_type, uint32_t *internal_bpp)457 v3dX(get_internal_type_bpp_for_image_aspects)(VkFormat vk_format,
458 VkImageAspectFlags aspect_mask,
459 uint32_t *internal_type,
460 uint32_t *internal_bpp)
461 {
462 /* We can't store depth/stencil pixel formats to a raster format, so
463 * instead we load our depth/stencil aspects to a compatible color format.
464 */
465 if (aspect_mask & (VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT)) {
466 *internal_bpp = V3D_INTERNAL_BPP_32;
467 switch (vk_format) {
468 case VK_FORMAT_D16_UNORM:
469 *internal_type = V3D_INTERNAL_TYPE_16UI;
470 break;
471 case VK_FORMAT_D32_SFLOAT:
472 *internal_type = V3D_INTERNAL_TYPE_32F;
473 break;
474 case VK_FORMAT_X8_D24_UNORM_PACK32:
475 case VK_FORMAT_D24_UNORM_S8_UINT:
476 /* Use RGBA8 format so we can relocate the X/S bits in the appropriate
477 * place to match Vulkan expectations. See the comment on the tile
478 * load command for more details.
479 */
480 *internal_type = V3D_INTERNAL_TYPE_8UI;
481 break;
482 default:
483 assert(!"unsupported format");
484 break;
485 }
486 } else {
487 const struct v3dv_format *format = v3dX(get_format)(vk_format);
488 v3dX(get_internal_type_bpp_for_output_format)(format->rt_type,
489 internal_type, internal_bpp);
490 }
491 }
492