162306a36Sopenharmony_ci/* 262306a36Sopenharmony_ci * Copyright © 2014-2015 Broadcom 362306a36Sopenharmony_ci * 462306a36Sopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a 562306a36Sopenharmony_ci * copy of this software and associated documentation files (the "Software"), 662306a36Sopenharmony_ci * to deal in the Software without restriction, including without limitation 762306a36Sopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense, 862306a36Sopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the 962306a36Sopenharmony_ci * Software is furnished to do so, subject to the following conditions: 1062306a36Sopenharmony_ci * 1162306a36Sopenharmony_ci * The above copyright notice and this permission notice (including the next 1262306a36Sopenharmony_ci * paragraph) shall be included in all copies or substantial portions of the 1362306a36Sopenharmony_ci * Software. 1462306a36Sopenharmony_ci * 1562306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 1662306a36Sopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 1762306a36Sopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 1862306a36Sopenharmony_ci * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 1962306a36Sopenharmony_ci * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 2062306a36Sopenharmony_ci * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS 2162306a36Sopenharmony_ci * IN THE SOFTWARE. 2262306a36Sopenharmony_ci */ 2362306a36Sopenharmony_ci 2462306a36Sopenharmony_ci/** 2562306a36Sopenharmony_ci * DOC: Render command list generation 2662306a36Sopenharmony_ci * 2762306a36Sopenharmony_ci * In the V3D hardware, render command lists are what load and store 2862306a36Sopenharmony_ci * tiles of a framebuffer and optionally call out to binner-generated 2962306a36Sopenharmony_ci * command lists to do the 3D drawing for that tile. 3062306a36Sopenharmony_ci * 3162306a36Sopenharmony_ci * In the VC4 driver, render command list generation is performed by the 3262306a36Sopenharmony_ci * kernel instead of userspace. We do this because validating a 3362306a36Sopenharmony_ci * user-submitted command list is hard to get right and has high CPU overhead, 3462306a36Sopenharmony_ci * while the number of valid configurations for render command lists is 3562306a36Sopenharmony_ci * actually fairly low. 3662306a36Sopenharmony_ci */ 3762306a36Sopenharmony_ci 3862306a36Sopenharmony_ci#include "uapi/drm/vc4_drm.h" 3962306a36Sopenharmony_ci#include "vc4_drv.h" 4062306a36Sopenharmony_ci#include "vc4_packet.h" 4162306a36Sopenharmony_ci 4262306a36Sopenharmony_cistruct vc4_rcl_setup { 4362306a36Sopenharmony_ci struct drm_gem_dma_object *color_read; 4462306a36Sopenharmony_ci struct drm_gem_dma_object *color_write; 4562306a36Sopenharmony_ci struct drm_gem_dma_object *zs_read; 4662306a36Sopenharmony_ci struct drm_gem_dma_object *zs_write; 4762306a36Sopenharmony_ci struct drm_gem_dma_object *msaa_color_write; 4862306a36Sopenharmony_ci struct drm_gem_dma_object *msaa_zs_write; 4962306a36Sopenharmony_ci 5062306a36Sopenharmony_ci struct drm_gem_dma_object *rcl; 5162306a36Sopenharmony_ci u32 next_offset; 5262306a36Sopenharmony_ci 5362306a36Sopenharmony_ci u32 next_write_bo_index; 5462306a36Sopenharmony_ci}; 5562306a36Sopenharmony_ci 5662306a36Sopenharmony_cistatic inline void rcl_u8(struct vc4_rcl_setup *setup, u8 val) 5762306a36Sopenharmony_ci{ 5862306a36Sopenharmony_ci *(u8 *)(setup->rcl->vaddr + setup->next_offset) = val; 5962306a36Sopenharmony_ci setup->next_offset += 1; 6062306a36Sopenharmony_ci} 6162306a36Sopenharmony_ci 6262306a36Sopenharmony_cistatic inline void rcl_u16(struct vc4_rcl_setup *setup, u16 val) 6362306a36Sopenharmony_ci{ 6462306a36Sopenharmony_ci *(u16 *)(setup->rcl->vaddr + setup->next_offset) = val; 6562306a36Sopenharmony_ci setup->next_offset += 2; 6662306a36Sopenharmony_ci} 6762306a36Sopenharmony_ci 6862306a36Sopenharmony_cistatic inline void rcl_u32(struct vc4_rcl_setup *setup, u32 val) 6962306a36Sopenharmony_ci{ 7062306a36Sopenharmony_ci *(u32 *)(setup->rcl->vaddr + setup->next_offset) = val; 7162306a36Sopenharmony_ci setup->next_offset += 4; 7262306a36Sopenharmony_ci} 7362306a36Sopenharmony_ci 7462306a36Sopenharmony_ci/* 7562306a36Sopenharmony_ci * Emits a no-op STORE_TILE_BUFFER_GENERAL. 7662306a36Sopenharmony_ci * 7762306a36Sopenharmony_ci * If we emit a PACKET_TILE_COORDINATES, it must be followed by a store of 7862306a36Sopenharmony_ci * some sort before another load is triggered. 7962306a36Sopenharmony_ci */ 8062306a36Sopenharmony_cistatic void vc4_store_before_load(struct vc4_rcl_setup *setup) 8162306a36Sopenharmony_ci{ 8262306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_STORE_TILE_BUFFER_GENERAL); 8362306a36Sopenharmony_ci rcl_u16(setup, 8462306a36Sopenharmony_ci VC4_SET_FIELD(VC4_LOADSTORE_TILE_BUFFER_NONE, 8562306a36Sopenharmony_ci VC4_LOADSTORE_TILE_BUFFER_BUFFER) | 8662306a36Sopenharmony_ci VC4_STORE_TILE_BUFFER_DISABLE_COLOR_CLEAR | 8762306a36Sopenharmony_ci VC4_STORE_TILE_BUFFER_DISABLE_ZS_CLEAR | 8862306a36Sopenharmony_ci VC4_STORE_TILE_BUFFER_DISABLE_VG_MASK_CLEAR); 8962306a36Sopenharmony_ci rcl_u32(setup, 0); /* no address, since we're in None mode */ 9062306a36Sopenharmony_ci} 9162306a36Sopenharmony_ci 9262306a36Sopenharmony_ci/* 9362306a36Sopenharmony_ci * Calculates the physical address of the start of a tile in a RCL surface. 9462306a36Sopenharmony_ci * 9562306a36Sopenharmony_ci * Unlike the other load/store packets, 9662306a36Sopenharmony_ci * VC4_PACKET_LOAD/STORE_FULL_RES_TILE_BUFFER don't look at the tile 9762306a36Sopenharmony_ci * coordinates packet, and instead just store to the address given. 9862306a36Sopenharmony_ci */ 9962306a36Sopenharmony_cistatic uint32_t vc4_full_res_offset(struct vc4_exec_info *exec, 10062306a36Sopenharmony_ci struct drm_gem_dma_object *bo, 10162306a36Sopenharmony_ci struct drm_vc4_submit_rcl_surface *surf, 10262306a36Sopenharmony_ci uint8_t x, uint8_t y) 10362306a36Sopenharmony_ci{ 10462306a36Sopenharmony_ci return bo->dma_addr + surf->offset + VC4_TILE_BUFFER_SIZE * 10562306a36Sopenharmony_ci (DIV_ROUND_UP(exec->args->width, 32) * y + x); 10662306a36Sopenharmony_ci} 10762306a36Sopenharmony_ci 10862306a36Sopenharmony_ci/* 10962306a36Sopenharmony_ci * Emits a PACKET_TILE_COORDINATES if one isn't already pending. 11062306a36Sopenharmony_ci * 11162306a36Sopenharmony_ci * The tile coordinates packet triggers a pending load if there is one, are 11262306a36Sopenharmony_ci * used for clipping during rendering, and determine where loads/stores happen 11362306a36Sopenharmony_ci * relative to their base address. 11462306a36Sopenharmony_ci */ 11562306a36Sopenharmony_cistatic void vc4_tile_coordinates(struct vc4_rcl_setup *setup, 11662306a36Sopenharmony_ci uint32_t x, uint32_t y) 11762306a36Sopenharmony_ci{ 11862306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_TILE_COORDINATES); 11962306a36Sopenharmony_ci rcl_u8(setup, x); 12062306a36Sopenharmony_ci rcl_u8(setup, y); 12162306a36Sopenharmony_ci} 12262306a36Sopenharmony_ci 12362306a36Sopenharmony_cistatic void emit_tile(struct vc4_exec_info *exec, 12462306a36Sopenharmony_ci struct vc4_rcl_setup *setup, 12562306a36Sopenharmony_ci uint8_t x, uint8_t y, bool first, bool last) 12662306a36Sopenharmony_ci{ 12762306a36Sopenharmony_ci struct drm_vc4_submit_cl *args = exec->args; 12862306a36Sopenharmony_ci bool has_bin = args->bin_cl_size != 0; 12962306a36Sopenharmony_ci 13062306a36Sopenharmony_ci /* Note that the load doesn't actually occur until the 13162306a36Sopenharmony_ci * tile coords packet is processed, and only one load 13262306a36Sopenharmony_ci * may be outstanding at a time. 13362306a36Sopenharmony_ci */ 13462306a36Sopenharmony_ci if (setup->color_read) { 13562306a36Sopenharmony_ci if (args->color_read.flags & 13662306a36Sopenharmony_ci VC4_SUBMIT_RCL_SURFACE_READ_IS_FULL_RES) { 13762306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_LOAD_FULL_RES_TILE_BUFFER); 13862306a36Sopenharmony_ci rcl_u32(setup, 13962306a36Sopenharmony_ci vc4_full_res_offset(exec, setup->color_read, 14062306a36Sopenharmony_ci &args->color_read, x, y) | 14162306a36Sopenharmony_ci VC4_LOADSTORE_FULL_RES_DISABLE_ZS); 14262306a36Sopenharmony_ci } else { 14362306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_LOAD_TILE_BUFFER_GENERAL); 14462306a36Sopenharmony_ci rcl_u16(setup, args->color_read.bits); 14562306a36Sopenharmony_ci rcl_u32(setup, setup->color_read->dma_addr + 14662306a36Sopenharmony_ci args->color_read.offset); 14762306a36Sopenharmony_ci } 14862306a36Sopenharmony_ci } 14962306a36Sopenharmony_ci 15062306a36Sopenharmony_ci if (setup->zs_read) { 15162306a36Sopenharmony_ci if (setup->color_read) { 15262306a36Sopenharmony_ci /* Exec previous load. */ 15362306a36Sopenharmony_ci vc4_tile_coordinates(setup, x, y); 15462306a36Sopenharmony_ci vc4_store_before_load(setup); 15562306a36Sopenharmony_ci } 15662306a36Sopenharmony_ci 15762306a36Sopenharmony_ci if (args->zs_read.flags & 15862306a36Sopenharmony_ci VC4_SUBMIT_RCL_SURFACE_READ_IS_FULL_RES) { 15962306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_LOAD_FULL_RES_TILE_BUFFER); 16062306a36Sopenharmony_ci rcl_u32(setup, 16162306a36Sopenharmony_ci vc4_full_res_offset(exec, setup->zs_read, 16262306a36Sopenharmony_ci &args->zs_read, x, y) | 16362306a36Sopenharmony_ci VC4_LOADSTORE_FULL_RES_DISABLE_COLOR); 16462306a36Sopenharmony_ci } else { 16562306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_LOAD_TILE_BUFFER_GENERAL); 16662306a36Sopenharmony_ci rcl_u16(setup, args->zs_read.bits); 16762306a36Sopenharmony_ci rcl_u32(setup, setup->zs_read->dma_addr + 16862306a36Sopenharmony_ci args->zs_read.offset); 16962306a36Sopenharmony_ci } 17062306a36Sopenharmony_ci } 17162306a36Sopenharmony_ci 17262306a36Sopenharmony_ci /* Clipping depends on tile coordinates having been 17362306a36Sopenharmony_ci * emitted, so we always need one here. 17462306a36Sopenharmony_ci */ 17562306a36Sopenharmony_ci vc4_tile_coordinates(setup, x, y); 17662306a36Sopenharmony_ci 17762306a36Sopenharmony_ci /* Wait for the binner before jumping to the first 17862306a36Sopenharmony_ci * tile's lists. 17962306a36Sopenharmony_ci */ 18062306a36Sopenharmony_ci if (first && has_bin) 18162306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_WAIT_ON_SEMAPHORE); 18262306a36Sopenharmony_ci 18362306a36Sopenharmony_ci if (has_bin) { 18462306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_BRANCH_TO_SUB_LIST); 18562306a36Sopenharmony_ci rcl_u32(setup, (exec->tile_alloc_offset + 18662306a36Sopenharmony_ci (y * exec->bin_tiles_x + x) * 32)); 18762306a36Sopenharmony_ci } 18862306a36Sopenharmony_ci 18962306a36Sopenharmony_ci if (setup->msaa_color_write) { 19062306a36Sopenharmony_ci bool last_tile_write = (!setup->msaa_zs_write && 19162306a36Sopenharmony_ci !setup->zs_write && 19262306a36Sopenharmony_ci !setup->color_write); 19362306a36Sopenharmony_ci uint32_t bits = VC4_LOADSTORE_FULL_RES_DISABLE_ZS; 19462306a36Sopenharmony_ci 19562306a36Sopenharmony_ci if (!last_tile_write) 19662306a36Sopenharmony_ci bits |= VC4_LOADSTORE_FULL_RES_DISABLE_CLEAR_ALL; 19762306a36Sopenharmony_ci else if (last) 19862306a36Sopenharmony_ci bits |= VC4_LOADSTORE_FULL_RES_EOF; 19962306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_STORE_FULL_RES_TILE_BUFFER); 20062306a36Sopenharmony_ci rcl_u32(setup, 20162306a36Sopenharmony_ci vc4_full_res_offset(exec, setup->msaa_color_write, 20262306a36Sopenharmony_ci &args->msaa_color_write, x, y) | 20362306a36Sopenharmony_ci bits); 20462306a36Sopenharmony_ci } 20562306a36Sopenharmony_ci 20662306a36Sopenharmony_ci if (setup->msaa_zs_write) { 20762306a36Sopenharmony_ci bool last_tile_write = (!setup->zs_write && 20862306a36Sopenharmony_ci !setup->color_write); 20962306a36Sopenharmony_ci uint32_t bits = VC4_LOADSTORE_FULL_RES_DISABLE_COLOR; 21062306a36Sopenharmony_ci 21162306a36Sopenharmony_ci if (setup->msaa_color_write) 21262306a36Sopenharmony_ci vc4_tile_coordinates(setup, x, y); 21362306a36Sopenharmony_ci if (!last_tile_write) 21462306a36Sopenharmony_ci bits |= VC4_LOADSTORE_FULL_RES_DISABLE_CLEAR_ALL; 21562306a36Sopenharmony_ci else if (last) 21662306a36Sopenharmony_ci bits |= VC4_LOADSTORE_FULL_RES_EOF; 21762306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_STORE_FULL_RES_TILE_BUFFER); 21862306a36Sopenharmony_ci rcl_u32(setup, 21962306a36Sopenharmony_ci vc4_full_res_offset(exec, setup->msaa_zs_write, 22062306a36Sopenharmony_ci &args->msaa_zs_write, x, y) | 22162306a36Sopenharmony_ci bits); 22262306a36Sopenharmony_ci } 22362306a36Sopenharmony_ci 22462306a36Sopenharmony_ci if (setup->zs_write) { 22562306a36Sopenharmony_ci bool last_tile_write = !setup->color_write; 22662306a36Sopenharmony_ci 22762306a36Sopenharmony_ci if (setup->msaa_color_write || setup->msaa_zs_write) 22862306a36Sopenharmony_ci vc4_tile_coordinates(setup, x, y); 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_STORE_TILE_BUFFER_GENERAL); 23162306a36Sopenharmony_ci rcl_u16(setup, args->zs_write.bits | 23262306a36Sopenharmony_ci (last_tile_write ? 23362306a36Sopenharmony_ci 0 : VC4_STORE_TILE_BUFFER_DISABLE_COLOR_CLEAR)); 23462306a36Sopenharmony_ci rcl_u32(setup, 23562306a36Sopenharmony_ci (setup->zs_write->dma_addr + args->zs_write.offset) | 23662306a36Sopenharmony_ci ((last && last_tile_write) ? 23762306a36Sopenharmony_ci VC4_LOADSTORE_TILE_BUFFER_EOF : 0)); 23862306a36Sopenharmony_ci } 23962306a36Sopenharmony_ci 24062306a36Sopenharmony_ci if (setup->color_write) { 24162306a36Sopenharmony_ci if (setup->msaa_color_write || setup->msaa_zs_write || 24262306a36Sopenharmony_ci setup->zs_write) { 24362306a36Sopenharmony_ci vc4_tile_coordinates(setup, x, y); 24462306a36Sopenharmony_ci } 24562306a36Sopenharmony_ci 24662306a36Sopenharmony_ci if (last) 24762306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_STORE_MS_TILE_BUFFER_AND_EOF); 24862306a36Sopenharmony_ci else 24962306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_STORE_MS_TILE_BUFFER); 25062306a36Sopenharmony_ci } 25162306a36Sopenharmony_ci} 25262306a36Sopenharmony_ci 25362306a36Sopenharmony_cistatic int vc4_create_rcl_bo(struct drm_device *dev, struct vc4_exec_info *exec, 25462306a36Sopenharmony_ci struct vc4_rcl_setup *setup) 25562306a36Sopenharmony_ci{ 25662306a36Sopenharmony_ci struct drm_vc4_submit_cl *args = exec->args; 25762306a36Sopenharmony_ci bool has_bin = args->bin_cl_size != 0; 25862306a36Sopenharmony_ci uint8_t min_x_tile = args->min_x_tile; 25962306a36Sopenharmony_ci uint8_t min_y_tile = args->min_y_tile; 26062306a36Sopenharmony_ci uint8_t max_x_tile = args->max_x_tile; 26162306a36Sopenharmony_ci uint8_t max_y_tile = args->max_y_tile; 26262306a36Sopenharmony_ci uint8_t xtiles = max_x_tile - min_x_tile + 1; 26362306a36Sopenharmony_ci uint8_t ytiles = max_y_tile - min_y_tile + 1; 26462306a36Sopenharmony_ci uint8_t xi, yi; 26562306a36Sopenharmony_ci uint32_t size, loop_body_size; 26662306a36Sopenharmony_ci bool positive_x = true; 26762306a36Sopenharmony_ci bool positive_y = true; 26862306a36Sopenharmony_ci 26962306a36Sopenharmony_ci if (args->flags & VC4_SUBMIT_CL_FIXED_RCL_ORDER) { 27062306a36Sopenharmony_ci if (!(args->flags & VC4_SUBMIT_CL_RCL_ORDER_INCREASING_X)) 27162306a36Sopenharmony_ci positive_x = false; 27262306a36Sopenharmony_ci if (!(args->flags & VC4_SUBMIT_CL_RCL_ORDER_INCREASING_Y)) 27362306a36Sopenharmony_ci positive_y = false; 27462306a36Sopenharmony_ci } 27562306a36Sopenharmony_ci 27662306a36Sopenharmony_ci size = VC4_PACKET_TILE_RENDERING_MODE_CONFIG_SIZE; 27762306a36Sopenharmony_ci loop_body_size = VC4_PACKET_TILE_COORDINATES_SIZE; 27862306a36Sopenharmony_ci 27962306a36Sopenharmony_ci if (args->flags & VC4_SUBMIT_CL_USE_CLEAR_COLOR) { 28062306a36Sopenharmony_ci size += VC4_PACKET_CLEAR_COLORS_SIZE + 28162306a36Sopenharmony_ci VC4_PACKET_TILE_COORDINATES_SIZE + 28262306a36Sopenharmony_ci VC4_PACKET_STORE_TILE_BUFFER_GENERAL_SIZE; 28362306a36Sopenharmony_ci } 28462306a36Sopenharmony_ci 28562306a36Sopenharmony_ci if (setup->color_read) { 28662306a36Sopenharmony_ci if (args->color_read.flags & 28762306a36Sopenharmony_ci VC4_SUBMIT_RCL_SURFACE_READ_IS_FULL_RES) { 28862306a36Sopenharmony_ci loop_body_size += VC4_PACKET_LOAD_FULL_RES_TILE_BUFFER_SIZE; 28962306a36Sopenharmony_ci } else { 29062306a36Sopenharmony_ci loop_body_size += VC4_PACKET_LOAD_TILE_BUFFER_GENERAL_SIZE; 29162306a36Sopenharmony_ci } 29262306a36Sopenharmony_ci } 29362306a36Sopenharmony_ci if (setup->zs_read) { 29462306a36Sopenharmony_ci if (setup->color_read) { 29562306a36Sopenharmony_ci loop_body_size += VC4_PACKET_TILE_COORDINATES_SIZE; 29662306a36Sopenharmony_ci loop_body_size += VC4_PACKET_STORE_TILE_BUFFER_GENERAL_SIZE; 29762306a36Sopenharmony_ci } 29862306a36Sopenharmony_ci 29962306a36Sopenharmony_ci if (args->zs_read.flags & 30062306a36Sopenharmony_ci VC4_SUBMIT_RCL_SURFACE_READ_IS_FULL_RES) { 30162306a36Sopenharmony_ci loop_body_size += VC4_PACKET_LOAD_FULL_RES_TILE_BUFFER_SIZE; 30262306a36Sopenharmony_ci } else { 30362306a36Sopenharmony_ci loop_body_size += VC4_PACKET_LOAD_TILE_BUFFER_GENERAL_SIZE; 30462306a36Sopenharmony_ci } 30562306a36Sopenharmony_ci } 30662306a36Sopenharmony_ci 30762306a36Sopenharmony_ci if (has_bin) { 30862306a36Sopenharmony_ci size += VC4_PACKET_WAIT_ON_SEMAPHORE_SIZE; 30962306a36Sopenharmony_ci loop_body_size += VC4_PACKET_BRANCH_TO_SUB_LIST_SIZE; 31062306a36Sopenharmony_ci } 31162306a36Sopenharmony_ci 31262306a36Sopenharmony_ci if (setup->msaa_color_write) 31362306a36Sopenharmony_ci loop_body_size += VC4_PACKET_STORE_FULL_RES_TILE_BUFFER_SIZE; 31462306a36Sopenharmony_ci if (setup->msaa_zs_write) 31562306a36Sopenharmony_ci loop_body_size += VC4_PACKET_STORE_FULL_RES_TILE_BUFFER_SIZE; 31662306a36Sopenharmony_ci 31762306a36Sopenharmony_ci if (setup->zs_write) 31862306a36Sopenharmony_ci loop_body_size += VC4_PACKET_STORE_TILE_BUFFER_GENERAL_SIZE; 31962306a36Sopenharmony_ci if (setup->color_write) 32062306a36Sopenharmony_ci loop_body_size += VC4_PACKET_STORE_MS_TILE_BUFFER_SIZE; 32162306a36Sopenharmony_ci 32262306a36Sopenharmony_ci /* We need a VC4_PACKET_TILE_COORDINATES in between each store. */ 32362306a36Sopenharmony_ci loop_body_size += VC4_PACKET_TILE_COORDINATES_SIZE * 32462306a36Sopenharmony_ci ((setup->msaa_color_write != NULL) + 32562306a36Sopenharmony_ci (setup->msaa_zs_write != NULL) + 32662306a36Sopenharmony_ci (setup->color_write != NULL) + 32762306a36Sopenharmony_ci (setup->zs_write != NULL) - 1); 32862306a36Sopenharmony_ci 32962306a36Sopenharmony_ci size += xtiles * ytiles * loop_body_size; 33062306a36Sopenharmony_ci 33162306a36Sopenharmony_ci setup->rcl = &vc4_bo_create(dev, size, true, VC4_BO_TYPE_RCL)->base; 33262306a36Sopenharmony_ci if (IS_ERR(setup->rcl)) 33362306a36Sopenharmony_ci return PTR_ERR(setup->rcl); 33462306a36Sopenharmony_ci list_add_tail(&to_vc4_bo(&setup->rcl->base)->unref_head, 33562306a36Sopenharmony_ci &exec->unref_list); 33662306a36Sopenharmony_ci 33762306a36Sopenharmony_ci /* The tile buffer gets cleared when the previous tile is stored. If 33862306a36Sopenharmony_ci * the clear values changed between frames, then the tile buffer has 33962306a36Sopenharmony_ci * stale clear values in it, so we have to do a store in None mode (no 34062306a36Sopenharmony_ci * writes) so that we trigger the tile buffer clear. 34162306a36Sopenharmony_ci */ 34262306a36Sopenharmony_ci if (args->flags & VC4_SUBMIT_CL_USE_CLEAR_COLOR) { 34362306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_CLEAR_COLORS); 34462306a36Sopenharmony_ci rcl_u32(setup, args->clear_color[0]); 34562306a36Sopenharmony_ci rcl_u32(setup, args->clear_color[1]); 34662306a36Sopenharmony_ci rcl_u32(setup, args->clear_z); 34762306a36Sopenharmony_ci rcl_u8(setup, args->clear_s); 34862306a36Sopenharmony_ci 34962306a36Sopenharmony_ci vc4_tile_coordinates(setup, 0, 0); 35062306a36Sopenharmony_ci 35162306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_STORE_TILE_BUFFER_GENERAL); 35262306a36Sopenharmony_ci rcl_u16(setup, VC4_LOADSTORE_TILE_BUFFER_NONE); 35362306a36Sopenharmony_ci rcl_u32(setup, 0); /* no address, since we're in None mode */ 35462306a36Sopenharmony_ci } 35562306a36Sopenharmony_ci 35662306a36Sopenharmony_ci rcl_u8(setup, VC4_PACKET_TILE_RENDERING_MODE_CONFIG); 35762306a36Sopenharmony_ci rcl_u32(setup, 35862306a36Sopenharmony_ci (setup->color_write ? (setup->color_write->dma_addr + 35962306a36Sopenharmony_ci args->color_write.offset) : 36062306a36Sopenharmony_ci 0)); 36162306a36Sopenharmony_ci rcl_u16(setup, args->width); 36262306a36Sopenharmony_ci rcl_u16(setup, args->height); 36362306a36Sopenharmony_ci rcl_u16(setup, args->color_write.bits); 36462306a36Sopenharmony_ci 36562306a36Sopenharmony_ci for (yi = 0; yi < ytiles; yi++) { 36662306a36Sopenharmony_ci int y = positive_y ? min_y_tile + yi : max_y_tile - yi; 36762306a36Sopenharmony_ci for (xi = 0; xi < xtiles; xi++) { 36862306a36Sopenharmony_ci int x = positive_x ? min_x_tile + xi : max_x_tile - xi; 36962306a36Sopenharmony_ci bool first = (xi == 0 && yi == 0); 37062306a36Sopenharmony_ci bool last = (xi == xtiles - 1 && yi == ytiles - 1); 37162306a36Sopenharmony_ci 37262306a36Sopenharmony_ci emit_tile(exec, setup, x, y, first, last); 37362306a36Sopenharmony_ci } 37462306a36Sopenharmony_ci } 37562306a36Sopenharmony_ci 37662306a36Sopenharmony_ci BUG_ON(setup->next_offset != size); 37762306a36Sopenharmony_ci exec->ct1ca = setup->rcl->dma_addr; 37862306a36Sopenharmony_ci exec->ct1ea = setup->rcl->dma_addr + setup->next_offset; 37962306a36Sopenharmony_ci 38062306a36Sopenharmony_ci return 0; 38162306a36Sopenharmony_ci} 38262306a36Sopenharmony_ci 38362306a36Sopenharmony_cistatic int vc4_full_res_bounds_check(struct vc4_exec_info *exec, 38462306a36Sopenharmony_ci struct drm_gem_dma_object *obj, 38562306a36Sopenharmony_ci struct drm_vc4_submit_rcl_surface *surf) 38662306a36Sopenharmony_ci{ 38762306a36Sopenharmony_ci struct drm_vc4_submit_cl *args = exec->args; 38862306a36Sopenharmony_ci u32 render_tiles_stride = DIV_ROUND_UP(exec->args->width, 32); 38962306a36Sopenharmony_ci 39062306a36Sopenharmony_ci if (surf->offset > obj->base.size) { 39162306a36Sopenharmony_ci DRM_DEBUG("surface offset %d > BO size %zd\n", 39262306a36Sopenharmony_ci surf->offset, obj->base.size); 39362306a36Sopenharmony_ci return -EINVAL; 39462306a36Sopenharmony_ci } 39562306a36Sopenharmony_ci 39662306a36Sopenharmony_ci if ((obj->base.size - surf->offset) / VC4_TILE_BUFFER_SIZE < 39762306a36Sopenharmony_ci render_tiles_stride * args->max_y_tile + args->max_x_tile) { 39862306a36Sopenharmony_ci DRM_DEBUG("MSAA tile %d, %d out of bounds " 39962306a36Sopenharmony_ci "(bo size %zd, offset %d).\n", 40062306a36Sopenharmony_ci args->max_x_tile, args->max_y_tile, 40162306a36Sopenharmony_ci obj->base.size, 40262306a36Sopenharmony_ci surf->offset); 40362306a36Sopenharmony_ci return -EINVAL; 40462306a36Sopenharmony_ci } 40562306a36Sopenharmony_ci 40662306a36Sopenharmony_ci return 0; 40762306a36Sopenharmony_ci} 40862306a36Sopenharmony_ci 40962306a36Sopenharmony_cistatic int vc4_rcl_msaa_surface_setup(struct vc4_exec_info *exec, 41062306a36Sopenharmony_ci struct drm_gem_dma_object **obj, 41162306a36Sopenharmony_ci struct drm_vc4_submit_rcl_surface *surf) 41262306a36Sopenharmony_ci{ 41362306a36Sopenharmony_ci if (surf->flags != 0 || surf->bits != 0) { 41462306a36Sopenharmony_ci DRM_DEBUG("MSAA surface had nonzero flags/bits\n"); 41562306a36Sopenharmony_ci return -EINVAL; 41662306a36Sopenharmony_ci } 41762306a36Sopenharmony_ci 41862306a36Sopenharmony_ci if (surf->hindex == ~0) 41962306a36Sopenharmony_ci return 0; 42062306a36Sopenharmony_ci 42162306a36Sopenharmony_ci *obj = vc4_use_bo(exec, surf->hindex); 42262306a36Sopenharmony_ci if (!*obj) 42362306a36Sopenharmony_ci return -EINVAL; 42462306a36Sopenharmony_ci 42562306a36Sopenharmony_ci exec->rcl_write_bo[exec->rcl_write_bo_count++] = *obj; 42662306a36Sopenharmony_ci 42762306a36Sopenharmony_ci if (surf->offset & 0xf) { 42862306a36Sopenharmony_ci DRM_DEBUG("MSAA write must be 16b aligned.\n"); 42962306a36Sopenharmony_ci return -EINVAL; 43062306a36Sopenharmony_ci } 43162306a36Sopenharmony_ci 43262306a36Sopenharmony_ci return vc4_full_res_bounds_check(exec, *obj, surf); 43362306a36Sopenharmony_ci} 43462306a36Sopenharmony_ci 43562306a36Sopenharmony_cistatic int vc4_rcl_surface_setup(struct vc4_exec_info *exec, 43662306a36Sopenharmony_ci struct drm_gem_dma_object **obj, 43762306a36Sopenharmony_ci struct drm_vc4_submit_rcl_surface *surf, 43862306a36Sopenharmony_ci bool is_write) 43962306a36Sopenharmony_ci{ 44062306a36Sopenharmony_ci uint8_t tiling = VC4_GET_FIELD(surf->bits, 44162306a36Sopenharmony_ci VC4_LOADSTORE_TILE_BUFFER_TILING); 44262306a36Sopenharmony_ci uint8_t buffer = VC4_GET_FIELD(surf->bits, 44362306a36Sopenharmony_ci VC4_LOADSTORE_TILE_BUFFER_BUFFER); 44462306a36Sopenharmony_ci uint8_t format = VC4_GET_FIELD(surf->bits, 44562306a36Sopenharmony_ci VC4_LOADSTORE_TILE_BUFFER_FORMAT); 44662306a36Sopenharmony_ci int cpp; 44762306a36Sopenharmony_ci int ret; 44862306a36Sopenharmony_ci 44962306a36Sopenharmony_ci if (surf->flags & ~VC4_SUBMIT_RCL_SURFACE_READ_IS_FULL_RES) { 45062306a36Sopenharmony_ci DRM_DEBUG("Extra flags set\n"); 45162306a36Sopenharmony_ci return -EINVAL; 45262306a36Sopenharmony_ci } 45362306a36Sopenharmony_ci 45462306a36Sopenharmony_ci if (surf->hindex == ~0) 45562306a36Sopenharmony_ci return 0; 45662306a36Sopenharmony_ci 45762306a36Sopenharmony_ci *obj = vc4_use_bo(exec, surf->hindex); 45862306a36Sopenharmony_ci if (!*obj) 45962306a36Sopenharmony_ci return -EINVAL; 46062306a36Sopenharmony_ci 46162306a36Sopenharmony_ci if (is_write) 46262306a36Sopenharmony_ci exec->rcl_write_bo[exec->rcl_write_bo_count++] = *obj; 46362306a36Sopenharmony_ci 46462306a36Sopenharmony_ci if (surf->flags & VC4_SUBMIT_RCL_SURFACE_READ_IS_FULL_RES) { 46562306a36Sopenharmony_ci if (surf == &exec->args->zs_write) { 46662306a36Sopenharmony_ci DRM_DEBUG("general zs write may not be a full-res.\n"); 46762306a36Sopenharmony_ci return -EINVAL; 46862306a36Sopenharmony_ci } 46962306a36Sopenharmony_ci 47062306a36Sopenharmony_ci if (surf->bits != 0) { 47162306a36Sopenharmony_ci DRM_DEBUG("load/store general bits set with " 47262306a36Sopenharmony_ci "full res load/store.\n"); 47362306a36Sopenharmony_ci return -EINVAL; 47462306a36Sopenharmony_ci } 47562306a36Sopenharmony_ci 47662306a36Sopenharmony_ci ret = vc4_full_res_bounds_check(exec, *obj, surf); 47762306a36Sopenharmony_ci if (ret) 47862306a36Sopenharmony_ci return ret; 47962306a36Sopenharmony_ci 48062306a36Sopenharmony_ci return 0; 48162306a36Sopenharmony_ci } 48262306a36Sopenharmony_ci 48362306a36Sopenharmony_ci if (surf->bits & ~(VC4_LOADSTORE_TILE_BUFFER_TILING_MASK | 48462306a36Sopenharmony_ci VC4_LOADSTORE_TILE_BUFFER_BUFFER_MASK | 48562306a36Sopenharmony_ci VC4_LOADSTORE_TILE_BUFFER_FORMAT_MASK)) { 48662306a36Sopenharmony_ci DRM_DEBUG("Unknown bits in load/store: 0x%04x\n", 48762306a36Sopenharmony_ci surf->bits); 48862306a36Sopenharmony_ci return -EINVAL; 48962306a36Sopenharmony_ci } 49062306a36Sopenharmony_ci 49162306a36Sopenharmony_ci if (tiling > VC4_TILING_FORMAT_LT) { 49262306a36Sopenharmony_ci DRM_DEBUG("Bad tiling format\n"); 49362306a36Sopenharmony_ci return -EINVAL; 49462306a36Sopenharmony_ci } 49562306a36Sopenharmony_ci 49662306a36Sopenharmony_ci if (buffer == VC4_LOADSTORE_TILE_BUFFER_ZS) { 49762306a36Sopenharmony_ci if (format != 0) { 49862306a36Sopenharmony_ci DRM_DEBUG("No color format should be set for ZS\n"); 49962306a36Sopenharmony_ci return -EINVAL; 50062306a36Sopenharmony_ci } 50162306a36Sopenharmony_ci cpp = 4; 50262306a36Sopenharmony_ci } else if (buffer == VC4_LOADSTORE_TILE_BUFFER_COLOR) { 50362306a36Sopenharmony_ci switch (format) { 50462306a36Sopenharmony_ci case VC4_LOADSTORE_TILE_BUFFER_BGR565: 50562306a36Sopenharmony_ci case VC4_LOADSTORE_TILE_BUFFER_BGR565_DITHER: 50662306a36Sopenharmony_ci cpp = 2; 50762306a36Sopenharmony_ci break; 50862306a36Sopenharmony_ci case VC4_LOADSTORE_TILE_BUFFER_RGBA8888: 50962306a36Sopenharmony_ci cpp = 4; 51062306a36Sopenharmony_ci break; 51162306a36Sopenharmony_ci default: 51262306a36Sopenharmony_ci DRM_DEBUG("Bad tile buffer format\n"); 51362306a36Sopenharmony_ci return -EINVAL; 51462306a36Sopenharmony_ci } 51562306a36Sopenharmony_ci } else { 51662306a36Sopenharmony_ci DRM_DEBUG("Bad load/store buffer %d.\n", buffer); 51762306a36Sopenharmony_ci return -EINVAL; 51862306a36Sopenharmony_ci } 51962306a36Sopenharmony_ci 52062306a36Sopenharmony_ci if (surf->offset & 0xf) { 52162306a36Sopenharmony_ci DRM_DEBUG("load/store buffer must be 16b aligned.\n"); 52262306a36Sopenharmony_ci return -EINVAL; 52362306a36Sopenharmony_ci } 52462306a36Sopenharmony_ci 52562306a36Sopenharmony_ci if (!vc4_check_tex_size(exec, *obj, surf->offset, tiling, 52662306a36Sopenharmony_ci exec->args->width, exec->args->height, cpp)) { 52762306a36Sopenharmony_ci return -EINVAL; 52862306a36Sopenharmony_ci } 52962306a36Sopenharmony_ci 53062306a36Sopenharmony_ci return 0; 53162306a36Sopenharmony_ci} 53262306a36Sopenharmony_ci 53362306a36Sopenharmony_cistatic int 53462306a36Sopenharmony_civc4_rcl_render_config_surface_setup(struct vc4_exec_info *exec, 53562306a36Sopenharmony_ci struct vc4_rcl_setup *setup, 53662306a36Sopenharmony_ci struct drm_gem_dma_object **obj, 53762306a36Sopenharmony_ci struct drm_vc4_submit_rcl_surface *surf) 53862306a36Sopenharmony_ci{ 53962306a36Sopenharmony_ci uint8_t tiling = VC4_GET_FIELD(surf->bits, 54062306a36Sopenharmony_ci VC4_RENDER_CONFIG_MEMORY_FORMAT); 54162306a36Sopenharmony_ci uint8_t format = VC4_GET_FIELD(surf->bits, 54262306a36Sopenharmony_ci VC4_RENDER_CONFIG_FORMAT); 54362306a36Sopenharmony_ci int cpp; 54462306a36Sopenharmony_ci 54562306a36Sopenharmony_ci if (surf->flags != 0) { 54662306a36Sopenharmony_ci DRM_DEBUG("No flags supported on render config.\n"); 54762306a36Sopenharmony_ci return -EINVAL; 54862306a36Sopenharmony_ci } 54962306a36Sopenharmony_ci 55062306a36Sopenharmony_ci if (surf->bits & ~(VC4_RENDER_CONFIG_MEMORY_FORMAT_MASK | 55162306a36Sopenharmony_ci VC4_RENDER_CONFIG_FORMAT_MASK | 55262306a36Sopenharmony_ci VC4_RENDER_CONFIG_MS_MODE_4X | 55362306a36Sopenharmony_ci VC4_RENDER_CONFIG_DECIMATE_MODE_4X)) { 55462306a36Sopenharmony_ci DRM_DEBUG("Unknown bits in render config: 0x%04x\n", 55562306a36Sopenharmony_ci surf->bits); 55662306a36Sopenharmony_ci return -EINVAL; 55762306a36Sopenharmony_ci } 55862306a36Sopenharmony_ci 55962306a36Sopenharmony_ci if (surf->hindex == ~0) 56062306a36Sopenharmony_ci return 0; 56162306a36Sopenharmony_ci 56262306a36Sopenharmony_ci *obj = vc4_use_bo(exec, surf->hindex); 56362306a36Sopenharmony_ci if (!*obj) 56462306a36Sopenharmony_ci return -EINVAL; 56562306a36Sopenharmony_ci 56662306a36Sopenharmony_ci exec->rcl_write_bo[exec->rcl_write_bo_count++] = *obj; 56762306a36Sopenharmony_ci 56862306a36Sopenharmony_ci if (tiling > VC4_TILING_FORMAT_LT) { 56962306a36Sopenharmony_ci DRM_DEBUG("Bad tiling format\n"); 57062306a36Sopenharmony_ci return -EINVAL; 57162306a36Sopenharmony_ci } 57262306a36Sopenharmony_ci 57362306a36Sopenharmony_ci switch (format) { 57462306a36Sopenharmony_ci case VC4_RENDER_CONFIG_FORMAT_BGR565_DITHERED: 57562306a36Sopenharmony_ci case VC4_RENDER_CONFIG_FORMAT_BGR565: 57662306a36Sopenharmony_ci cpp = 2; 57762306a36Sopenharmony_ci break; 57862306a36Sopenharmony_ci case VC4_RENDER_CONFIG_FORMAT_RGBA8888: 57962306a36Sopenharmony_ci cpp = 4; 58062306a36Sopenharmony_ci break; 58162306a36Sopenharmony_ci default: 58262306a36Sopenharmony_ci DRM_DEBUG("Bad tile buffer format\n"); 58362306a36Sopenharmony_ci return -EINVAL; 58462306a36Sopenharmony_ci } 58562306a36Sopenharmony_ci 58662306a36Sopenharmony_ci if (!vc4_check_tex_size(exec, *obj, surf->offset, tiling, 58762306a36Sopenharmony_ci exec->args->width, exec->args->height, cpp)) { 58862306a36Sopenharmony_ci return -EINVAL; 58962306a36Sopenharmony_ci } 59062306a36Sopenharmony_ci 59162306a36Sopenharmony_ci return 0; 59262306a36Sopenharmony_ci} 59362306a36Sopenharmony_ci 59462306a36Sopenharmony_ciint vc4_get_rcl(struct drm_device *dev, struct vc4_exec_info *exec) 59562306a36Sopenharmony_ci{ 59662306a36Sopenharmony_ci struct vc4_dev *vc4 = to_vc4_dev(dev); 59762306a36Sopenharmony_ci struct vc4_rcl_setup setup = {0}; 59862306a36Sopenharmony_ci struct drm_vc4_submit_cl *args = exec->args; 59962306a36Sopenharmony_ci bool has_bin = args->bin_cl_size != 0; 60062306a36Sopenharmony_ci int ret; 60162306a36Sopenharmony_ci 60262306a36Sopenharmony_ci if (WARN_ON_ONCE(vc4->is_vc5)) 60362306a36Sopenharmony_ci return -ENODEV; 60462306a36Sopenharmony_ci 60562306a36Sopenharmony_ci if (args->min_x_tile > args->max_x_tile || 60662306a36Sopenharmony_ci args->min_y_tile > args->max_y_tile) { 60762306a36Sopenharmony_ci DRM_DEBUG("Bad render tile set (%d,%d)-(%d,%d)\n", 60862306a36Sopenharmony_ci args->min_x_tile, args->min_y_tile, 60962306a36Sopenharmony_ci args->max_x_tile, args->max_y_tile); 61062306a36Sopenharmony_ci return -EINVAL; 61162306a36Sopenharmony_ci } 61262306a36Sopenharmony_ci 61362306a36Sopenharmony_ci if (has_bin && 61462306a36Sopenharmony_ci (args->max_x_tile > exec->bin_tiles_x || 61562306a36Sopenharmony_ci args->max_y_tile > exec->bin_tiles_y)) { 61662306a36Sopenharmony_ci DRM_DEBUG("Render tiles (%d,%d) outside of bin config " 61762306a36Sopenharmony_ci "(%d,%d)\n", 61862306a36Sopenharmony_ci args->max_x_tile, args->max_y_tile, 61962306a36Sopenharmony_ci exec->bin_tiles_x, exec->bin_tiles_y); 62062306a36Sopenharmony_ci return -EINVAL; 62162306a36Sopenharmony_ci } 62262306a36Sopenharmony_ci 62362306a36Sopenharmony_ci ret = vc4_rcl_render_config_surface_setup(exec, &setup, 62462306a36Sopenharmony_ci &setup.color_write, 62562306a36Sopenharmony_ci &args->color_write); 62662306a36Sopenharmony_ci if (ret) 62762306a36Sopenharmony_ci return ret; 62862306a36Sopenharmony_ci 62962306a36Sopenharmony_ci ret = vc4_rcl_surface_setup(exec, &setup.color_read, &args->color_read, 63062306a36Sopenharmony_ci false); 63162306a36Sopenharmony_ci if (ret) 63262306a36Sopenharmony_ci return ret; 63362306a36Sopenharmony_ci 63462306a36Sopenharmony_ci ret = vc4_rcl_surface_setup(exec, &setup.zs_read, &args->zs_read, 63562306a36Sopenharmony_ci false); 63662306a36Sopenharmony_ci if (ret) 63762306a36Sopenharmony_ci return ret; 63862306a36Sopenharmony_ci 63962306a36Sopenharmony_ci ret = vc4_rcl_surface_setup(exec, &setup.zs_write, &args->zs_write, 64062306a36Sopenharmony_ci true); 64162306a36Sopenharmony_ci if (ret) 64262306a36Sopenharmony_ci return ret; 64362306a36Sopenharmony_ci 64462306a36Sopenharmony_ci ret = vc4_rcl_msaa_surface_setup(exec, &setup.msaa_color_write, 64562306a36Sopenharmony_ci &args->msaa_color_write); 64662306a36Sopenharmony_ci if (ret) 64762306a36Sopenharmony_ci return ret; 64862306a36Sopenharmony_ci 64962306a36Sopenharmony_ci ret = vc4_rcl_msaa_surface_setup(exec, &setup.msaa_zs_write, 65062306a36Sopenharmony_ci &args->msaa_zs_write); 65162306a36Sopenharmony_ci if (ret) 65262306a36Sopenharmony_ci return ret; 65362306a36Sopenharmony_ci 65462306a36Sopenharmony_ci /* We shouldn't even have the job submitted to us if there's no 65562306a36Sopenharmony_ci * surface to write out. 65662306a36Sopenharmony_ci */ 65762306a36Sopenharmony_ci if (!setup.color_write && !setup.zs_write && 65862306a36Sopenharmony_ci !setup.msaa_color_write && !setup.msaa_zs_write) { 65962306a36Sopenharmony_ci DRM_DEBUG("RCL requires color or Z/S write\n"); 66062306a36Sopenharmony_ci return -EINVAL; 66162306a36Sopenharmony_ci } 66262306a36Sopenharmony_ci 66362306a36Sopenharmony_ci return vc4_create_rcl_bo(dev, exec, &setup); 66462306a36Sopenharmony_ci} 665