162306a36Sopenharmony_ci/* 262306a36Sopenharmony_ci * Copyright 2013 Advanced Micro Devices, Inc. 362306a36Sopenharmony_ci * 462306a36Sopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a 562306a36Sopenharmony_ci * copy of this software and associated documentation files (the "Software"), 662306a36Sopenharmony_ci * to deal in the Software without restriction, including without limitation 762306a36Sopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense, 862306a36Sopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the 962306a36Sopenharmony_ci * Software is furnished to do so, subject to the following conditions: 1062306a36Sopenharmony_ci * 1162306a36Sopenharmony_ci * The above copyright notice and this permission notice shall be included in 1262306a36Sopenharmony_ci * all copies or substantial portions of the Software. 1362306a36Sopenharmony_ci * 1462306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 1562306a36Sopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 1662306a36Sopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 1762306a36Sopenharmony_ci * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 1862306a36Sopenharmony_ci * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 1962306a36Sopenharmony_ci * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 2062306a36Sopenharmony_ci * OTHER DEALINGS IN THE SOFTWARE. 2162306a36Sopenharmony_ci * 2262306a36Sopenharmony_ci * Authors: Alex Deucher 2362306a36Sopenharmony_ci */ 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_ci#include <linux/firmware.h> 2662306a36Sopenharmony_ci#include <linux/module.h> 2762306a36Sopenharmony_ci 2862306a36Sopenharmony_ci#include "amdgpu.h" 2962306a36Sopenharmony_ci#include "amdgpu_ucode.h" 3062306a36Sopenharmony_ci#include "amdgpu_trace.h" 3162306a36Sopenharmony_ci#include "cikd.h" 3262306a36Sopenharmony_ci#include "cik.h" 3362306a36Sopenharmony_ci 3462306a36Sopenharmony_ci#include "bif/bif_4_1_d.h" 3562306a36Sopenharmony_ci#include "bif/bif_4_1_sh_mask.h" 3662306a36Sopenharmony_ci 3762306a36Sopenharmony_ci#include "gca/gfx_7_2_d.h" 3862306a36Sopenharmony_ci#include "gca/gfx_7_2_enum.h" 3962306a36Sopenharmony_ci#include "gca/gfx_7_2_sh_mask.h" 4062306a36Sopenharmony_ci 4162306a36Sopenharmony_ci#include "gmc/gmc_7_1_d.h" 4262306a36Sopenharmony_ci#include "gmc/gmc_7_1_sh_mask.h" 4362306a36Sopenharmony_ci 4462306a36Sopenharmony_ci#include "oss/oss_2_0_d.h" 4562306a36Sopenharmony_ci#include "oss/oss_2_0_sh_mask.h" 4662306a36Sopenharmony_ci 4762306a36Sopenharmony_cistatic const u32 sdma_offsets[SDMA_MAX_INSTANCE] = 4862306a36Sopenharmony_ci{ 4962306a36Sopenharmony_ci SDMA0_REGISTER_OFFSET, 5062306a36Sopenharmony_ci SDMA1_REGISTER_OFFSET 5162306a36Sopenharmony_ci}; 5262306a36Sopenharmony_ci 5362306a36Sopenharmony_cistatic void cik_sdma_set_ring_funcs(struct amdgpu_device *adev); 5462306a36Sopenharmony_cistatic void cik_sdma_set_irq_funcs(struct amdgpu_device *adev); 5562306a36Sopenharmony_cistatic void cik_sdma_set_buffer_funcs(struct amdgpu_device *adev); 5662306a36Sopenharmony_cistatic void cik_sdma_set_vm_pte_funcs(struct amdgpu_device *adev); 5762306a36Sopenharmony_cistatic int cik_sdma_soft_reset(void *handle); 5862306a36Sopenharmony_ci 5962306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/bonaire_sdma.bin"); 6062306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/bonaire_sdma1.bin"); 6162306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/hawaii_sdma.bin"); 6262306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/hawaii_sdma1.bin"); 6362306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/kaveri_sdma.bin"); 6462306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/kaveri_sdma1.bin"); 6562306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/kabini_sdma.bin"); 6662306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/kabini_sdma1.bin"); 6762306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/mullins_sdma.bin"); 6862306a36Sopenharmony_ciMODULE_FIRMWARE("amdgpu/mullins_sdma1.bin"); 6962306a36Sopenharmony_ci 7062306a36Sopenharmony_ciu32 amdgpu_cik_gpu_check_soft_reset(struct amdgpu_device *adev); 7162306a36Sopenharmony_ci 7262306a36Sopenharmony_ci 7362306a36Sopenharmony_cistatic void cik_sdma_free_microcode(struct amdgpu_device *adev) 7462306a36Sopenharmony_ci{ 7562306a36Sopenharmony_ci int i; 7662306a36Sopenharmony_ci 7762306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) 7862306a36Sopenharmony_ci amdgpu_ucode_release(&adev->sdma.instance[i].fw); 7962306a36Sopenharmony_ci} 8062306a36Sopenharmony_ci 8162306a36Sopenharmony_ci/* 8262306a36Sopenharmony_ci * sDMA - System DMA 8362306a36Sopenharmony_ci * Starting with CIK, the GPU has new asynchronous 8462306a36Sopenharmony_ci * DMA engines. These engines are used for compute 8562306a36Sopenharmony_ci * and gfx. There are two DMA engines (SDMA0, SDMA1) 8662306a36Sopenharmony_ci * and each one supports 1 ring buffer used for gfx 8762306a36Sopenharmony_ci * and 2 queues used for compute. 8862306a36Sopenharmony_ci * 8962306a36Sopenharmony_ci * The programming model is very similar to the CP 9062306a36Sopenharmony_ci * (ring buffer, IBs, etc.), but sDMA has it's own 9162306a36Sopenharmony_ci * packet format that is different from the PM4 format 9262306a36Sopenharmony_ci * used by the CP. sDMA supports copying data, writing 9362306a36Sopenharmony_ci * embedded data, solid fills, and a number of other 9462306a36Sopenharmony_ci * things. It also has support for tiling/detiling of 9562306a36Sopenharmony_ci * buffers. 9662306a36Sopenharmony_ci */ 9762306a36Sopenharmony_ci 9862306a36Sopenharmony_ci/** 9962306a36Sopenharmony_ci * cik_sdma_init_microcode - load ucode images from disk 10062306a36Sopenharmony_ci * 10162306a36Sopenharmony_ci * @adev: amdgpu_device pointer 10262306a36Sopenharmony_ci * 10362306a36Sopenharmony_ci * Use the firmware interface to load the ucode images into 10462306a36Sopenharmony_ci * the driver (not loaded into hw). 10562306a36Sopenharmony_ci * Returns 0 on success, error on failure. 10662306a36Sopenharmony_ci */ 10762306a36Sopenharmony_cistatic int cik_sdma_init_microcode(struct amdgpu_device *adev) 10862306a36Sopenharmony_ci{ 10962306a36Sopenharmony_ci const char *chip_name; 11062306a36Sopenharmony_ci char fw_name[30]; 11162306a36Sopenharmony_ci int err = 0, i; 11262306a36Sopenharmony_ci 11362306a36Sopenharmony_ci DRM_DEBUG("\n"); 11462306a36Sopenharmony_ci 11562306a36Sopenharmony_ci switch (adev->asic_type) { 11662306a36Sopenharmony_ci case CHIP_BONAIRE: 11762306a36Sopenharmony_ci chip_name = "bonaire"; 11862306a36Sopenharmony_ci break; 11962306a36Sopenharmony_ci case CHIP_HAWAII: 12062306a36Sopenharmony_ci chip_name = "hawaii"; 12162306a36Sopenharmony_ci break; 12262306a36Sopenharmony_ci case CHIP_KAVERI: 12362306a36Sopenharmony_ci chip_name = "kaveri"; 12462306a36Sopenharmony_ci break; 12562306a36Sopenharmony_ci case CHIP_KABINI: 12662306a36Sopenharmony_ci chip_name = "kabini"; 12762306a36Sopenharmony_ci break; 12862306a36Sopenharmony_ci case CHIP_MULLINS: 12962306a36Sopenharmony_ci chip_name = "mullins"; 13062306a36Sopenharmony_ci break; 13162306a36Sopenharmony_ci default: BUG(); 13262306a36Sopenharmony_ci } 13362306a36Sopenharmony_ci 13462306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 13562306a36Sopenharmony_ci if (i == 0) 13662306a36Sopenharmony_ci snprintf(fw_name, sizeof(fw_name), "amdgpu/%s_sdma.bin", chip_name); 13762306a36Sopenharmony_ci else 13862306a36Sopenharmony_ci snprintf(fw_name, sizeof(fw_name), "amdgpu/%s_sdma1.bin", chip_name); 13962306a36Sopenharmony_ci err = amdgpu_ucode_request(adev, &adev->sdma.instance[i].fw, fw_name); 14062306a36Sopenharmony_ci if (err) 14162306a36Sopenharmony_ci goto out; 14262306a36Sopenharmony_ci } 14362306a36Sopenharmony_ciout: 14462306a36Sopenharmony_ci if (err) { 14562306a36Sopenharmony_ci pr_err("cik_sdma: Failed to load firmware \"%s\"\n", fw_name); 14662306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) 14762306a36Sopenharmony_ci amdgpu_ucode_release(&adev->sdma.instance[i].fw); 14862306a36Sopenharmony_ci } 14962306a36Sopenharmony_ci return err; 15062306a36Sopenharmony_ci} 15162306a36Sopenharmony_ci 15262306a36Sopenharmony_ci/** 15362306a36Sopenharmony_ci * cik_sdma_ring_get_rptr - get the current read pointer 15462306a36Sopenharmony_ci * 15562306a36Sopenharmony_ci * @ring: amdgpu ring pointer 15662306a36Sopenharmony_ci * 15762306a36Sopenharmony_ci * Get the current rptr from the hardware (CIK+). 15862306a36Sopenharmony_ci */ 15962306a36Sopenharmony_cistatic uint64_t cik_sdma_ring_get_rptr(struct amdgpu_ring *ring) 16062306a36Sopenharmony_ci{ 16162306a36Sopenharmony_ci u32 rptr; 16262306a36Sopenharmony_ci 16362306a36Sopenharmony_ci rptr = *ring->rptr_cpu_addr; 16462306a36Sopenharmony_ci 16562306a36Sopenharmony_ci return (rptr & 0x3fffc) >> 2; 16662306a36Sopenharmony_ci} 16762306a36Sopenharmony_ci 16862306a36Sopenharmony_ci/** 16962306a36Sopenharmony_ci * cik_sdma_ring_get_wptr - get the current write pointer 17062306a36Sopenharmony_ci * 17162306a36Sopenharmony_ci * @ring: amdgpu ring pointer 17262306a36Sopenharmony_ci * 17362306a36Sopenharmony_ci * Get the current wptr from the hardware (CIK+). 17462306a36Sopenharmony_ci */ 17562306a36Sopenharmony_cistatic uint64_t cik_sdma_ring_get_wptr(struct amdgpu_ring *ring) 17662306a36Sopenharmony_ci{ 17762306a36Sopenharmony_ci struct amdgpu_device *adev = ring->adev; 17862306a36Sopenharmony_ci 17962306a36Sopenharmony_ci return (RREG32(mmSDMA0_GFX_RB_WPTR + sdma_offsets[ring->me]) & 0x3fffc) >> 2; 18062306a36Sopenharmony_ci} 18162306a36Sopenharmony_ci 18262306a36Sopenharmony_ci/** 18362306a36Sopenharmony_ci * cik_sdma_ring_set_wptr - commit the write pointer 18462306a36Sopenharmony_ci * 18562306a36Sopenharmony_ci * @ring: amdgpu ring pointer 18662306a36Sopenharmony_ci * 18762306a36Sopenharmony_ci * Write the wptr back to the hardware (CIK+). 18862306a36Sopenharmony_ci */ 18962306a36Sopenharmony_cistatic void cik_sdma_ring_set_wptr(struct amdgpu_ring *ring) 19062306a36Sopenharmony_ci{ 19162306a36Sopenharmony_ci struct amdgpu_device *adev = ring->adev; 19262306a36Sopenharmony_ci 19362306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_WPTR + sdma_offsets[ring->me], 19462306a36Sopenharmony_ci (ring->wptr << 2) & 0x3fffc); 19562306a36Sopenharmony_ci} 19662306a36Sopenharmony_ci 19762306a36Sopenharmony_cistatic void cik_sdma_ring_insert_nop(struct amdgpu_ring *ring, uint32_t count) 19862306a36Sopenharmony_ci{ 19962306a36Sopenharmony_ci struct amdgpu_sdma_instance *sdma = amdgpu_sdma_get_instance_from_ring(ring); 20062306a36Sopenharmony_ci int i; 20162306a36Sopenharmony_ci 20262306a36Sopenharmony_ci for (i = 0; i < count; i++) 20362306a36Sopenharmony_ci if (sdma && sdma->burst_nop && (i == 0)) 20462306a36Sopenharmony_ci amdgpu_ring_write(ring, ring->funcs->nop | 20562306a36Sopenharmony_ci SDMA_NOP_COUNT(count - 1)); 20662306a36Sopenharmony_ci else 20762306a36Sopenharmony_ci amdgpu_ring_write(ring, ring->funcs->nop); 20862306a36Sopenharmony_ci} 20962306a36Sopenharmony_ci 21062306a36Sopenharmony_ci/** 21162306a36Sopenharmony_ci * cik_sdma_ring_emit_ib - Schedule an IB on the DMA engine 21262306a36Sopenharmony_ci * 21362306a36Sopenharmony_ci * @ring: amdgpu ring pointer 21462306a36Sopenharmony_ci * @job: job to retrive vmid from 21562306a36Sopenharmony_ci * @ib: IB object to schedule 21662306a36Sopenharmony_ci * @flags: unused 21762306a36Sopenharmony_ci * 21862306a36Sopenharmony_ci * Schedule an IB in the DMA ring (CIK). 21962306a36Sopenharmony_ci */ 22062306a36Sopenharmony_cistatic void cik_sdma_ring_emit_ib(struct amdgpu_ring *ring, 22162306a36Sopenharmony_ci struct amdgpu_job *job, 22262306a36Sopenharmony_ci struct amdgpu_ib *ib, 22362306a36Sopenharmony_ci uint32_t flags) 22462306a36Sopenharmony_ci{ 22562306a36Sopenharmony_ci unsigned vmid = AMDGPU_JOB_GET_VMID(job); 22662306a36Sopenharmony_ci u32 extra_bits = vmid & 0xf; 22762306a36Sopenharmony_ci 22862306a36Sopenharmony_ci /* IB packet must end on a 8 DW boundary */ 22962306a36Sopenharmony_ci cik_sdma_ring_insert_nop(ring, (4 - lower_32_bits(ring->wptr)) & 7); 23062306a36Sopenharmony_ci 23162306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_INDIRECT_BUFFER, 0, extra_bits)); 23262306a36Sopenharmony_ci amdgpu_ring_write(ring, ib->gpu_addr & 0xffffffe0); /* base must be 32 byte aligned */ 23362306a36Sopenharmony_ci amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr) & 0xffffffff); 23462306a36Sopenharmony_ci amdgpu_ring_write(ring, ib->length_dw); 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci} 23762306a36Sopenharmony_ci 23862306a36Sopenharmony_ci/** 23962306a36Sopenharmony_ci * cik_sdma_ring_emit_hdp_flush - emit an hdp flush on the DMA ring 24062306a36Sopenharmony_ci * 24162306a36Sopenharmony_ci * @ring: amdgpu ring pointer 24262306a36Sopenharmony_ci * 24362306a36Sopenharmony_ci * Emit an hdp flush packet on the requested DMA ring. 24462306a36Sopenharmony_ci */ 24562306a36Sopenharmony_cistatic void cik_sdma_ring_emit_hdp_flush(struct amdgpu_ring *ring) 24662306a36Sopenharmony_ci{ 24762306a36Sopenharmony_ci u32 extra_bits = (SDMA_POLL_REG_MEM_EXTRA_OP(1) | 24862306a36Sopenharmony_ci SDMA_POLL_REG_MEM_EXTRA_FUNC(3)); /* == */ 24962306a36Sopenharmony_ci u32 ref_and_mask; 25062306a36Sopenharmony_ci 25162306a36Sopenharmony_ci if (ring->me == 0) 25262306a36Sopenharmony_ci ref_and_mask = GPU_HDP_FLUSH_DONE__SDMA0_MASK; 25362306a36Sopenharmony_ci else 25462306a36Sopenharmony_ci ref_and_mask = GPU_HDP_FLUSH_DONE__SDMA1_MASK; 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_POLL_REG_MEM, 0, extra_bits)); 25762306a36Sopenharmony_ci amdgpu_ring_write(ring, mmGPU_HDP_FLUSH_DONE << 2); 25862306a36Sopenharmony_ci amdgpu_ring_write(ring, mmGPU_HDP_FLUSH_REQ << 2); 25962306a36Sopenharmony_ci amdgpu_ring_write(ring, ref_and_mask); /* reference */ 26062306a36Sopenharmony_ci amdgpu_ring_write(ring, ref_and_mask); /* mask */ 26162306a36Sopenharmony_ci amdgpu_ring_write(ring, (0xfff << 16) | 10); /* retry count, poll interval */ 26262306a36Sopenharmony_ci} 26362306a36Sopenharmony_ci 26462306a36Sopenharmony_ci/** 26562306a36Sopenharmony_ci * cik_sdma_ring_emit_fence - emit a fence on the DMA ring 26662306a36Sopenharmony_ci * 26762306a36Sopenharmony_ci * @ring: amdgpu ring pointer 26862306a36Sopenharmony_ci * @addr: address 26962306a36Sopenharmony_ci * @seq: sequence number 27062306a36Sopenharmony_ci * @flags: fence related flags 27162306a36Sopenharmony_ci * 27262306a36Sopenharmony_ci * Add a DMA fence packet to the ring to write 27362306a36Sopenharmony_ci * the fence seq number and DMA trap packet to generate 27462306a36Sopenharmony_ci * an interrupt if needed (CIK). 27562306a36Sopenharmony_ci */ 27662306a36Sopenharmony_cistatic void cik_sdma_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq, 27762306a36Sopenharmony_ci unsigned flags) 27862306a36Sopenharmony_ci{ 27962306a36Sopenharmony_ci bool write64bit = flags & AMDGPU_FENCE_FLAG_64BIT; 28062306a36Sopenharmony_ci /* write the fence */ 28162306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_FENCE, 0, 0)); 28262306a36Sopenharmony_ci amdgpu_ring_write(ring, lower_32_bits(addr)); 28362306a36Sopenharmony_ci amdgpu_ring_write(ring, upper_32_bits(addr)); 28462306a36Sopenharmony_ci amdgpu_ring_write(ring, lower_32_bits(seq)); 28562306a36Sopenharmony_ci 28662306a36Sopenharmony_ci /* optionally write high bits as well */ 28762306a36Sopenharmony_ci if (write64bit) { 28862306a36Sopenharmony_ci addr += 4; 28962306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_FENCE, 0, 0)); 29062306a36Sopenharmony_ci amdgpu_ring_write(ring, lower_32_bits(addr)); 29162306a36Sopenharmony_ci amdgpu_ring_write(ring, upper_32_bits(addr)); 29262306a36Sopenharmony_ci amdgpu_ring_write(ring, upper_32_bits(seq)); 29362306a36Sopenharmony_ci } 29462306a36Sopenharmony_ci 29562306a36Sopenharmony_ci /* generate an interrupt */ 29662306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_TRAP, 0, 0)); 29762306a36Sopenharmony_ci} 29862306a36Sopenharmony_ci 29962306a36Sopenharmony_ci/** 30062306a36Sopenharmony_ci * cik_sdma_gfx_stop - stop the gfx async dma engines 30162306a36Sopenharmony_ci * 30262306a36Sopenharmony_ci * @adev: amdgpu_device pointer 30362306a36Sopenharmony_ci * 30462306a36Sopenharmony_ci * Stop the gfx async dma ring buffers (CIK). 30562306a36Sopenharmony_ci */ 30662306a36Sopenharmony_cistatic void cik_sdma_gfx_stop(struct amdgpu_device *adev) 30762306a36Sopenharmony_ci{ 30862306a36Sopenharmony_ci u32 rb_cntl; 30962306a36Sopenharmony_ci int i; 31062306a36Sopenharmony_ci 31162306a36Sopenharmony_ci amdgpu_sdma_unset_buffer_funcs_helper(adev); 31262306a36Sopenharmony_ci 31362306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 31462306a36Sopenharmony_ci rb_cntl = RREG32(mmSDMA0_GFX_RB_CNTL + sdma_offsets[i]); 31562306a36Sopenharmony_ci rb_cntl &= ~SDMA0_GFX_RB_CNTL__RB_ENABLE_MASK; 31662306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_CNTL + sdma_offsets[i], rb_cntl); 31762306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_IB_CNTL + sdma_offsets[i], 0); 31862306a36Sopenharmony_ci } 31962306a36Sopenharmony_ci} 32062306a36Sopenharmony_ci 32162306a36Sopenharmony_ci/** 32262306a36Sopenharmony_ci * cik_sdma_rlc_stop - stop the compute async dma engines 32362306a36Sopenharmony_ci * 32462306a36Sopenharmony_ci * @adev: amdgpu_device pointer 32562306a36Sopenharmony_ci * 32662306a36Sopenharmony_ci * Stop the compute async dma queues (CIK). 32762306a36Sopenharmony_ci */ 32862306a36Sopenharmony_cistatic void cik_sdma_rlc_stop(struct amdgpu_device *adev) 32962306a36Sopenharmony_ci{ 33062306a36Sopenharmony_ci /* XXX todo */ 33162306a36Sopenharmony_ci} 33262306a36Sopenharmony_ci 33362306a36Sopenharmony_ci/** 33462306a36Sopenharmony_ci * cik_ctx_switch_enable - stop the async dma engines context switch 33562306a36Sopenharmony_ci * 33662306a36Sopenharmony_ci * @adev: amdgpu_device pointer 33762306a36Sopenharmony_ci * @enable: enable/disable the DMA MEs context switch. 33862306a36Sopenharmony_ci * 33962306a36Sopenharmony_ci * Halt or unhalt the async dma engines context switch (VI). 34062306a36Sopenharmony_ci */ 34162306a36Sopenharmony_cistatic void cik_ctx_switch_enable(struct amdgpu_device *adev, bool enable) 34262306a36Sopenharmony_ci{ 34362306a36Sopenharmony_ci u32 f32_cntl, phase_quantum = 0; 34462306a36Sopenharmony_ci int i; 34562306a36Sopenharmony_ci 34662306a36Sopenharmony_ci if (amdgpu_sdma_phase_quantum) { 34762306a36Sopenharmony_ci unsigned value = amdgpu_sdma_phase_quantum; 34862306a36Sopenharmony_ci unsigned unit = 0; 34962306a36Sopenharmony_ci 35062306a36Sopenharmony_ci while (value > (SDMA0_PHASE0_QUANTUM__VALUE_MASK >> 35162306a36Sopenharmony_ci SDMA0_PHASE0_QUANTUM__VALUE__SHIFT)) { 35262306a36Sopenharmony_ci value = (value + 1) >> 1; 35362306a36Sopenharmony_ci unit++; 35462306a36Sopenharmony_ci } 35562306a36Sopenharmony_ci if (unit > (SDMA0_PHASE0_QUANTUM__UNIT_MASK >> 35662306a36Sopenharmony_ci SDMA0_PHASE0_QUANTUM__UNIT__SHIFT)) { 35762306a36Sopenharmony_ci value = (SDMA0_PHASE0_QUANTUM__VALUE_MASK >> 35862306a36Sopenharmony_ci SDMA0_PHASE0_QUANTUM__VALUE__SHIFT); 35962306a36Sopenharmony_ci unit = (SDMA0_PHASE0_QUANTUM__UNIT_MASK >> 36062306a36Sopenharmony_ci SDMA0_PHASE0_QUANTUM__UNIT__SHIFT); 36162306a36Sopenharmony_ci WARN_ONCE(1, 36262306a36Sopenharmony_ci "clamping sdma_phase_quantum to %uK clock cycles\n", 36362306a36Sopenharmony_ci value << unit); 36462306a36Sopenharmony_ci } 36562306a36Sopenharmony_ci phase_quantum = 36662306a36Sopenharmony_ci value << SDMA0_PHASE0_QUANTUM__VALUE__SHIFT | 36762306a36Sopenharmony_ci unit << SDMA0_PHASE0_QUANTUM__UNIT__SHIFT; 36862306a36Sopenharmony_ci } 36962306a36Sopenharmony_ci 37062306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 37162306a36Sopenharmony_ci f32_cntl = RREG32(mmSDMA0_CNTL + sdma_offsets[i]); 37262306a36Sopenharmony_ci if (enable) { 37362306a36Sopenharmony_ci f32_cntl = REG_SET_FIELD(f32_cntl, SDMA0_CNTL, 37462306a36Sopenharmony_ci AUTO_CTXSW_ENABLE, 1); 37562306a36Sopenharmony_ci if (amdgpu_sdma_phase_quantum) { 37662306a36Sopenharmony_ci WREG32(mmSDMA0_PHASE0_QUANTUM + sdma_offsets[i], 37762306a36Sopenharmony_ci phase_quantum); 37862306a36Sopenharmony_ci WREG32(mmSDMA0_PHASE1_QUANTUM + sdma_offsets[i], 37962306a36Sopenharmony_ci phase_quantum); 38062306a36Sopenharmony_ci } 38162306a36Sopenharmony_ci } else { 38262306a36Sopenharmony_ci f32_cntl = REG_SET_FIELD(f32_cntl, SDMA0_CNTL, 38362306a36Sopenharmony_ci AUTO_CTXSW_ENABLE, 0); 38462306a36Sopenharmony_ci } 38562306a36Sopenharmony_ci 38662306a36Sopenharmony_ci WREG32(mmSDMA0_CNTL + sdma_offsets[i], f32_cntl); 38762306a36Sopenharmony_ci } 38862306a36Sopenharmony_ci} 38962306a36Sopenharmony_ci 39062306a36Sopenharmony_ci/** 39162306a36Sopenharmony_ci * cik_sdma_enable - stop the async dma engines 39262306a36Sopenharmony_ci * 39362306a36Sopenharmony_ci * @adev: amdgpu_device pointer 39462306a36Sopenharmony_ci * @enable: enable/disable the DMA MEs. 39562306a36Sopenharmony_ci * 39662306a36Sopenharmony_ci * Halt or unhalt the async dma engines (CIK). 39762306a36Sopenharmony_ci */ 39862306a36Sopenharmony_cistatic void cik_sdma_enable(struct amdgpu_device *adev, bool enable) 39962306a36Sopenharmony_ci{ 40062306a36Sopenharmony_ci u32 me_cntl; 40162306a36Sopenharmony_ci int i; 40262306a36Sopenharmony_ci 40362306a36Sopenharmony_ci if (!enable) { 40462306a36Sopenharmony_ci cik_sdma_gfx_stop(adev); 40562306a36Sopenharmony_ci cik_sdma_rlc_stop(adev); 40662306a36Sopenharmony_ci } 40762306a36Sopenharmony_ci 40862306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 40962306a36Sopenharmony_ci me_cntl = RREG32(mmSDMA0_F32_CNTL + sdma_offsets[i]); 41062306a36Sopenharmony_ci if (enable) 41162306a36Sopenharmony_ci me_cntl &= ~SDMA0_F32_CNTL__HALT_MASK; 41262306a36Sopenharmony_ci else 41362306a36Sopenharmony_ci me_cntl |= SDMA0_F32_CNTL__HALT_MASK; 41462306a36Sopenharmony_ci WREG32(mmSDMA0_F32_CNTL + sdma_offsets[i], me_cntl); 41562306a36Sopenharmony_ci } 41662306a36Sopenharmony_ci} 41762306a36Sopenharmony_ci 41862306a36Sopenharmony_ci/** 41962306a36Sopenharmony_ci * cik_sdma_gfx_resume - setup and start the async dma engines 42062306a36Sopenharmony_ci * 42162306a36Sopenharmony_ci * @adev: amdgpu_device pointer 42262306a36Sopenharmony_ci * 42362306a36Sopenharmony_ci * Set up the gfx DMA ring buffers and enable them (CIK). 42462306a36Sopenharmony_ci * Returns 0 for success, error for failure. 42562306a36Sopenharmony_ci */ 42662306a36Sopenharmony_cistatic int cik_sdma_gfx_resume(struct amdgpu_device *adev) 42762306a36Sopenharmony_ci{ 42862306a36Sopenharmony_ci struct amdgpu_ring *ring; 42962306a36Sopenharmony_ci u32 rb_cntl, ib_cntl; 43062306a36Sopenharmony_ci u32 rb_bufsz; 43162306a36Sopenharmony_ci int i, j, r; 43262306a36Sopenharmony_ci 43362306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 43462306a36Sopenharmony_ci ring = &adev->sdma.instance[i].ring; 43562306a36Sopenharmony_ci 43662306a36Sopenharmony_ci mutex_lock(&adev->srbm_mutex); 43762306a36Sopenharmony_ci for (j = 0; j < 16; j++) { 43862306a36Sopenharmony_ci cik_srbm_select(adev, 0, 0, 0, j); 43962306a36Sopenharmony_ci /* SDMA GFX */ 44062306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_VIRTUAL_ADDR + sdma_offsets[i], 0); 44162306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_APE1_CNTL + sdma_offsets[i], 0); 44262306a36Sopenharmony_ci /* XXX SDMA RLC - todo */ 44362306a36Sopenharmony_ci } 44462306a36Sopenharmony_ci cik_srbm_select(adev, 0, 0, 0, 0); 44562306a36Sopenharmony_ci mutex_unlock(&adev->srbm_mutex); 44662306a36Sopenharmony_ci 44762306a36Sopenharmony_ci WREG32(mmSDMA0_TILING_CONFIG + sdma_offsets[i], 44862306a36Sopenharmony_ci adev->gfx.config.gb_addr_config & 0x70); 44962306a36Sopenharmony_ci 45062306a36Sopenharmony_ci WREG32(mmSDMA0_SEM_INCOMPLETE_TIMER_CNTL + sdma_offsets[i], 0); 45162306a36Sopenharmony_ci WREG32(mmSDMA0_SEM_WAIT_FAIL_TIMER_CNTL + sdma_offsets[i], 0); 45262306a36Sopenharmony_ci 45362306a36Sopenharmony_ci /* Set ring buffer size in dwords */ 45462306a36Sopenharmony_ci rb_bufsz = order_base_2(ring->ring_size / 4); 45562306a36Sopenharmony_ci rb_cntl = rb_bufsz << 1; 45662306a36Sopenharmony_ci#ifdef __BIG_ENDIAN 45762306a36Sopenharmony_ci rb_cntl |= SDMA0_GFX_RB_CNTL__RB_SWAP_ENABLE_MASK | 45862306a36Sopenharmony_ci SDMA0_GFX_RB_CNTL__RPTR_WRITEBACK_SWAP_ENABLE_MASK; 45962306a36Sopenharmony_ci#endif 46062306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_CNTL + sdma_offsets[i], rb_cntl); 46162306a36Sopenharmony_ci 46262306a36Sopenharmony_ci /* Initialize the ring buffer's read and write pointers */ 46362306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_RPTR + sdma_offsets[i], 0); 46462306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_WPTR + sdma_offsets[i], 0); 46562306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_IB_RPTR + sdma_offsets[i], 0); 46662306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_IB_OFFSET + sdma_offsets[i], 0); 46762306a36Sopenharmony_ci 46862306a36Sopenharmony_ci /* set the wb address whether it's enabled or not */ 46962306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_RPTR_ADDR_HI + sdma_offsets[i], 47062306a36Sopenharmony_ci upper_32_bits(ring->rptr_gpu_addr) & 0xFFFFFFFF); 47162306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_RPTR_ADDR_LO + sdma_offsets[i], 47262306a36Sopenharmony_ci ((ring->rptr_gpu_addr) & 0xFFFFFFFC)); 47362306a36Sopenharmony_ci 47462306a36Sopenharmony_ci rb_cntl |= SDMA0_GFX_RB_CNTL__RPTR_WRITEBACK_ENABLE_MASK; 47562306a36Sopenharmony_ci 47662306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_BASE + sdma_offsets[i], ring->gpu_addr >> 8); 47762306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_BASE_HI + sdma_offsets[i], ring->gpu_addr >> 40); 47862306a36Sopenharmony_ci 47962306a36Sopenharmony_ci ring->wptr = 0; 48062306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_WPTR + sdma_offsets[i], ring->wptr << 2); 48162306a36Sopenharmony_ci 48262306a36Sopenharmony_ci /* enable DMA RB */ 48362306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_RB_CNTL + sdma_offsets[i], 48462306a36Sopenharmony_ci rb_cntl | SDMA0_GFX_RB_CNTL__RB_ENABLE_MASK); 48562306a36Sopenharmony_ci 48662306a36Sopenharmony_ci ib_cntl = SDMA0_GFX_IB_CNTL__IB_ENABLE_MASK; 48762306a36Sopenharmony_ci#ifdef __BIG_ENDIAN 48862306a36Sopenharmony_ci ib_cntl |= SDMA0_GFX_IB_CNTL__IB_SWAP_ENABLE_MASK; 48962306a36Sopenharmony_ci#endif 49062306a36Sopenharmony_ci /* enable DMA IBs */ 49162306a36Sopenharmony_ci WREG32(mmSDMA0_GFX_IB_CNTL + sdma_offsets[i], ib_cntl); 49262306a36Sopenharmony_ci } 49362306a36Sopenharmony_ci 49462306a36Sopenharmony_ci cik_sdma_enable(adev, true); 49562306a36Sopenharmony_ci 49662306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 49762306a36Sopenharmony_ci ring = &adev->sdma.instance[i].ring; 49862306a36Sopenharmony_ci r = amdgpu_ring_test_helper(ring); 49962306a36Sopenharmony_ci if (r) 50062306a36Sopenharmony_ci return r; 50162306a36Sopenharmony_ci 50262306a36Sopenharmony_ci if (adev->mman.buffer_funcs_ring == ring) 50362306a36Sopenharmony_ci amdgpu_ttm_set_buffer_funcs_status(adev, true); 50462306a36Sopenharmony_ci } 50562306a36Sopenharmony_ci 50662306a36Sopenharmony_ci return 0; 50762306a36Sopenharmony_ci} 50862306a36Sopenharmony_ci 50962306a36Sopenharmony_ci/** 51062306a36Sopenharmony_ci * cik_sdma_rlc_resume - setup and start the async dma engines 51162306a36Sopenharmony_ci * 51262306a36Sopenharmony_ci * @adev: amdgpu_device pointer 51362306a36Sopenharmony_ci * 51462306a36Sopenharmony_ci * Set up the compute DMA queues and enable them (CIK). 51562306a36Sopenharmony_ci * Returns 0 for success, error for failure. 51662306a36Sopenharmony_ci */ 51762306a36Sopenharmony_cistatic int cik_sdma_rlc_resume(struct amdgpu_device *adev) 51862306a36Sopenharmony_ci{ 51962306a36Sopenharmony_ci /* XXX todo */ 52062306a36Sopenharmony_ci return 0; 52162306a36Sopenharmony_ci} 52262306a36Sopenharmony_ci 52362306a36Sopenharmony_ci/** 52462306a36Sopenharmony_ci * cik_sdma_load_microcode - load the sDMA ME ucode 52562306a36Sopenharmony_ci * 52662306a36Sopenharmony_ci * @adev: amdgpu_device pointer 52762306a36Sopenharmony_ci * 52862306a36Sopenharmony_ci * Loads the sDMA0/1 ucode. 52962306a36Sopenharmony_ci * Returns 0 for success, -EINVAL if the ucode is not available. 53062306a36Sopenharmony_ci */ 53162306a36Sopenharmony_cistatic int cik_sdma_load_microcode(struct amdgpu_device *adev) 53262306a36Sopenharmony_ci{ 53362306a36Sopenharmony_ci const struct sdma_firmware_header_v1_0 *hdr; 53462306a36Sopenharmony_ci const __le32 *fw_data; 53562306a36Sopenharmony_ci u32 fw_size; 53662306a36Sopenharmony_ci int i, j; 53762306a36Sopenharmony_ci 53862306a36Sopenharmony_ci /* halt the MEs */ 53962306a36Sopenharmony_ci cik_sdma_enable(adev, false); 54062306a36Sopenharmony_ci 54162306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 54262306a36Sopenharmony_ci if (!adev->sdma.instance[i].fw) 54362306a36Sopenharmony_ci return -EINVAL; 54462306a36Sopenharmony_ci hdr = (const struct sdma_firmware_header_v1_0 *)adev->sdma.instance[i].fw->data; 54562306a36Sopenharmony_ci amdgpu_ucode_print_sdma_hdr(&hdr->header); 54662306a36Sopenharmony_ci fw_size = le32_to_cpu(hdr->header.ucode_size_bytes) / 4; 54762306a36Sopenharmony_ci adev->sdma.instance[i].fw_version = le32_to_cpu(hdr->header.ucode_version); 54862306a36Sopenharmony_ci adev->sdma.instance[i].feature_version = le32_to_cpu(hdr->ucode_feature_version); 54962306a36Sopenharmony_ci if (adev->sdma.instance[i].feature_version >= 20) 55062306a36Sopenharmony_ci adev->sdma.instance[i].burst_nop = true; 55162306a36Sopenharmony_ci fw_data = (const __le32 *) 55262306a36Sopenharmony_ci (adev->sdma.instance[i].fw->data + le32_to_cpu(hdr->header.ucode_array_offset_bytes)); 55362306a36Sopenharmony_ci WREG32(mmSDMA0_UCODE_ADDR + sdma_offsets[i], 0); 55462306a36Sopenharmony_ci for (j = 0; j < fw_size; j++) 55562306a36Sopenharmony_ci WREG32(mmSDMA0_UCODE_DATA + sdma_offsets[i], le32_to_cpup(fw_data++)); 55662306a36Sopenharmony_ci WREG32(mmSDMA0_UCODE_ADDR + sdma_offsets[i], adev->sdma.instance[i].fw_version); 55762306a36Sopenharmony_ci } 55862306a36Sopenharmony_ci 55962306a36Sopenharmony_ci return 0; 56062306a36Sopenharmony_ci} 56162306a36Sopenharmony_ci 56262306a36Sopenharmony_ci/** 56362306a36Sopenharmony_ci * cik_sdma_start - setup and start the async dma engines 56462306a36Sopenharmony_ci * 56562306a36Sopenharmony_ci * @adev: amdgpu_device pointer 56662306a36Sopenharmony_ci * 56762306a36Sopenharmony_ci * Set up the DMA engines and enable them (CIK). 56862306a36Sopenharmony_ci * Returns 0 for success, error for failure. 56962306a36Sopenharmony_ci */ 57062306a36Sopenharmony_cistatic int cik_sdma_start(struct amdgpu_device *adev) 57162306a36Sopenharmony_ci{ 57262306a36Sopenharmony_ci int r; 57362306a36Sopenharmony_ci 57462306a36Sopenharmony_ci r = cik_sdma_load_microcode(adev); 57562306a36Sopenharmony_ci if (r) 57662306a36Sopenharmony_ci return r; 57762306a36Sopenharmony_ci 57862306a36Sopenharmony_ci /* halt the engine before programing */ 57962306a36Sopenharmony_ci cik_sdma_enable(adev, false); 58062306a36Sopenharmony_ci /* enable sdma ring preemption */ 58162306a36Sopenharmony_ci cik_ctx_switch_enable(adev, true); 58262306a36Sopenharmony_ci 58362306a36Sopenharmony_ci /* start the gfx rings and rlc compute queues */ 58462306a36Sopenharmony_ci r = cik_sdma_gfx_resume(adev); 58562306a36Sopenharmony_ci if (r) 58662306a36Sopenharmony_ci return r; 58762306a36Sopenharmony_ci r = cik_sdma_rlc_resume(adev); 58862306a36Sopenharmony_ci if (r) 58962306a36Sopenharmony_ci return r; 59062306a36Sopenharmony_ci 59162306a36Sopenharmony_ci return 0; 59262306a36Sopenharmony_ci} 59362306a36Sopenharmony_ci 59462306a36Sopenharmony_ci/** 59562306a36Sopenharmony_ci * cik_sdma_ring_test_ring - simple async dma engine test 59662306a36Sopenharmony_ci * 59762306a36Sopenharmony_ci * @ring: amdgpu_ring structure holding ring information 59862306a36Sopenharmony_ci * 59962306a36Sopenharmony_ci * Test the DMA engine by writing using it to write an 60062306a36Sopenharmony_ci * value to memory. (CIK). 60162306a36Sopenharmony_ci * Returns 0 for success, error for failure. 60262306a36Sopenharmony_ci */ 60362306a36Sopenharmony_cistatic int cik_sdma_ring_test_ring(struct amdgpu_ring *ring) 60462306a36Sopenharmony_ci{ 60562306a36Sopenharmony_ci struct amdgpu_device *adev = ring->adev; 60662306a36Sopenharmony_ci unsigned i; 60762306a36Sopenharmony_ci unsigned index; 60862306a36Sopenharmony_ci int r; 60962306a36Sopenharmony_ci u32 tmp; 61062306a36Sopenharmony_ci u64 gpu_addr; 61162306a36Sopenharmony_ci 61262306a36Sopenharmony_ci r = amdgpu_device_wb_get(adev, &index); 61362306a36Sopenharmony_ci if (r) 61462306a36Sopenharmony_ci return r; 61562306a36Sopenharmony_ci 61662306a36Sopenharmony_ci gpu_addr = adev->wb.gpu_addr + (index * 4); 61762306a36Sopenharmony_ci tmp = 0xCAFEDEAD; 61862306a36Sopenharmony_ci adev->wb.wb[index] = cpu_to_le32(tmp); 61962306a36Sopenharmony_ci 62062306a36Sopenharmony_ci r = amdgpu_ring_alloc(ring, 5); 62162306a36Sopenharmony_ci if (r) 62262306a36Sopenharmony_ci goto error_free_wb; 62362306a36Sopenharmony_ci 62462306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_WRITE, SDMA_WRITE_SUB_OPCODE_LINEAR, 0)); 62562306a36Sopenharmony_ci amdgpu_ring_write(ring, lower_32_bits(gpu_addr)); 62662306a36Sopenharmony_ci amdgpu_ring_write(ring, upper_32_bits(gpu_addr)); 62762306a36Sopenharmony_ci amdgpu_ring_write(ring, 1); /* number of DWs to follow */ 62862306a36Sopenharmony_ci amdgpu_ring_write(ring, 0xDEADBEEF); 62962306a36Sopenharmony_ci amdgpu_ring_commit(ring); 63062306a36Sopenharmony_ci 63162306a36Sopenharmony_ci for (i = 0; i < adev->usec_timeout; i++) { 63262306a36Sopenharmony_ci tmp = le32_to_cpu(adev->wb.wb[index]); 63362306a36Sopenharmony_ci if (tmp == 0xDEADBEEF) 63462306a36Sopenharmony_ci break; 63562306a36Sopenharmony_ci udelay(1); 63662306a36Sopenharmony_ci } 63762306a36Sopenharmony_ci 63862306a36Sopenharmony_ci if (i >= adev->usec_timeout) 63962306a36Sopenharmony_ci r = -ETIMEDOUT; 64062306a36Sopenharmony_ci 64162306a36Sopenharmony_cierror_free_wb: 64262306a36Sopenharmony_ci amdgpu_device_wb_free(adev, index); 64362306a36Sopenharmony_ci return r; 64462306a36Sopenharmony_ci} 64562306a36Sopenharmony_ci 64662306a36Sopenharmony_ci/** 64762306a36Sopenharmony_ci * cik_sdma_ring_test_ib - test an IB on the DMA engine 64862306a36Sopenharmony_ci * 64962306a36Sopenharmony_ci * @ring: amdgpu_ring structure holding ring information 65062306a36Sopenharmony_ci * @timeout: timeout value in jiffies, or MAX_SCHEDULE_TIMEOUT 65162306a36Sopenharmony_ci * 65262306a36Sopenharmony_ci * Test a simple IB in the DMA ring (CIK). 65362306a36Sopenharmony_ci * Returns 0 on success, error on failure. 65462306a36Sopenharmony_ci */ 65562306a36Sopenharmony_cistatic int cik_sdma_ring_test_ib(struct amdgpu_ring *ring, long timeout) 65662306a36Sopenharmony_ci{ 65762306a36Sopenharmony_ci struct amdgpu_device *adev = ring->adev; 65862306a36Sopenharmony_ci struct amdgpu_ib ib; 65962306a36Sopenharmony_ci struct dma_fence *f = NULL; 66062306a36Sopenharmony_ci unsigned index; 66162306a36Sopenharmony_ci u32 tmp = 0; 66262306a36Sopenharmony_ci u64 gpu_addr; 66362306a36Sopenharmony_ci long r; 66462306a36Sopenharmony_ci 66562306a36Sopenharmony_ci r = amdgpu_device_wb_get(adev, &index); 66662306a36Sopenharmony_ci if (r) 66762306a36Sopenharmony_ci return r; 66862306a36Sopenharmony_ci 66962306a36Sopenharmony_ci gpu_addr = adev->wb.gpu_addr + (index * 4); 67062306a36Sopenharmony_ci tmp = 0xCAFEDEAD; 67162306a36Sopenharmony_ci adev->wb.wb[index] = cpu_to_le32(tmp); 67262306a36Sopenharmony_ci memset(&ib, 0, sizeof(ib)); 67362306a36Sopenharmony_ci r = amdgpu_ib_get(adev, NULL, 256, 67462306a36Sopenharmony_ci AMDGPU_IB_POOL_DIRECT, &ib); 67562306a36Sopenharmony_ci if (r) 67662306a36Sopenharmony_ci goto err0; 67762306a36Sopenharmony_ci 67862306a36Sopenharmony_ci ib.ptr[0] = SDMA_PACKET(SDMA_OPCODE_WRITE, 67962306a36Sopenharmony_ci SDMA_WRITE_SUB_OPCODE_LINEAR, 0); 68062306a36Sopenharmony_ci ib.ptr[1] = lower_32_bits(gpu_addr); 68162306a36Sopenharmony_ci ib.ptr[2] = upper_32_bits(gpu_addr); 68262306a36Sopenharmony_ci ib.ptr[3] = 1; 68362306a36Sopenharmony_ci ib.ptr[4] = 0xDEADBEEF; 68462306a36Sopenharmony_ci ib.length_dw = 5; 68562306a36Sopenharmony_ci r = amdgpu_ib_schedule(ring, 1, &ib, NULL, &f); 68662306a36Sopenharmony_ci if (r) 68762306a36Sopenharmony_ci goto err1; 68862306a36Sopenharmony_ci 68962306a36Sopenharmony_ci r = dma_fence_wait_timeout(f, false, timeout); 69062306a36Sopenharmony_ci if (r == 0) { 69162306a36Sopenharmony_ci r = -ETIMEDOUT; 69262306a36Sopenharmony_ci goto err1; 69362306a36Sopenharmony_ci } else if (r < 0) { 69462306a36Sopenharmony_ci goto err1; 69562306a36Sopenharmony_ci } 69662306a36Sopenharmony_ci tmp = le32_to_cpu(adev->wb.wb[index]); 69762306a36Sopenharmony_ci if (tmp == 0xDEADBEEF) 69862306a36Sopenharmony_ci r = 0; 69962306a36Sopenharmony_ci else 70062306a36Sopenharmony_ci r = -EINVAL; 70162306a36Sopenharmony_ci 70262306a36Sopenharmony_cierr1: 70362306a36Sopenharmony_ci amdgpu_ib_free(adev, &ib, NULL); 70462306a36Sopenharmony_ci dma_fence_put(f); 70562306a36Sopenharmony_cierr0: 70662306a36Sopenharmony_ci amdgpu_device_wb_free(adev, index); 70762306a36Sopenharmony_ci return r; 70862306a36Sopenharmony_ci} 70962306a36Sopenharmony_ci 71062306a36Sopenharmony_ci/** 71162306a36Sopenharmony_ci * cik_sdma_vm_copy_pte - update PTEs by copying them from the GART 71262306a36Sopenharmony_ci * 71362306a36Sopenharmony_ci * @ib: indirect buffer to fill with commands 71462306a36Sopenharmony_ci * @pe: addr of the page entry 71562306a36Sopenharmony_ci * @src: src addr to copy from 71662306a36Sopenharmony_ci * @count: number of page entries to update 71762306a36Sopenharmony_ci * 71862306a36Sopenharmony_ci * Update PTEs by copying them from the GART using sDMA (CIK). 71962306a36Sopenharmony_ci */ 72062306a36Sopenharmony_cistatic void cik_sdma_vm_copy_pte(struct amdgpu_ib *ib, 72162306a36Sopenharmony_ci uint64_t pe, uint64_t src, 72262306a36Sopenharmony_ci unsigned count) 72362306a36Sopenharmony_ci{ 72462306a36Sopenharmony_ci unsigned bytes = count * 8; 72562306a36Sopenharmony_ci 72662306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_COPY, 72762306a36Sopenharmony_ci SDMA_WRITE_SUB_OPCODE_LINEAR, 0); 72862306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = bytes; 72962306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = 0; /* src/dst endian swap */ 73062306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(src); 73162306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(src); 73262306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(pe); 73362306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(pe); 73462306a36Sopenharmony_ci} 73562306a36Sopenharmony_ci 73662306a36Sopenharmony_ci/** 73762306a36Sopenharmony_ci * cik_sdma_vm_write_pte - update PTEs by writing them manually 73862306a36Sopenharmony_ci * 73962306a36Sopenharmony_ci * @ib: indirect buffer to fill with commands 74062306a36Sopenharmony_ci * @pe: addr of the page entry 74162306a36Sopenharmony_ci * @value: dst addr to write into pe 74262306a36Sopenharmony_ci * @count: number of page entries to update 74362306a36Sopenharmony_ci * @incr: increase next addr by incr bytes 74462306a36Sopenharmony_ci * 74562306a36Sopenharmony_ci * Update PTEs by writing them manually using sDMA (CIK). 74662306a36Sopenharmony_ci */ 74762306a36Sopenharmony_cistatic void cik_sdma_vm_write_pte(struct amdgpu_ib *ib, uint64_t pe, 74862306a36Sopenharmony_ci uint64_t value, unsigned count, 74962306a36Sopenharmony_ci uint32_t incr) 75062306a36Sopenharmony_ci{ 75162306a36Sopenharmony_ci unsigned ndw = count * 2; 75262306a36Sopenharmony_ci 75362306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_WRITE, 75462306a36Sopenharmony_ci SDMA_WRITE_SUB_OPCODE_LINEAR, 0); 75562306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(pe); 75662306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(pe); 75762306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = ndw; 75862306a36Sopenharmony_ci for (; ndw > 0; ndw -= 2) { 75962306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(value); 76062306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(value); 76162306a36Sopenharmony_ci value += incr; 76262306a36Sopenharmony_ci } 76362306a36Sopenharmony_ci} 76462306a36Sopenharmony_ci 76562306a36Sopenharmony_ci/** 76662306a36Sopenharmony_ci * cik_sdma_vm_set_pte_pde - update the page tables using sDMA 76762306a36Sopenharmony_ci * 76862306a36Sopenharmony_ci * @ib: indirect buffer to fill with commands 76962306a36Sopenharmony_ci * @pe: addr of the page entry 77062306a36Sopenharmony_ci * @addr: dst addr to write into pe 77162306a36Sopenharmony_ci * @count: number of page entries to update 77262306a36Sopenharmony_ci * @incr: increase next addr by incr bytes 77362306a36Sopenharmony_ci * @flags: access flags 77462306a36Sopenharmony_ci * 77562306a36Sopenharmony_ci * Update the page tables using sDMA (CIK). 77662306a36Sopenharmony_ci */ 77762306a36Sopenharmony_cistatic void cik_sdma_vm_set_pte_pde(struct amdgpu_ib *ib, uint64_t pe, 77862306a36Sopenharmony_ci uint64_t addr, unsigned count, 77962306a36Sopenharmony_ci uint32_t incr, uint64_t flags) 78062306a36Sopenharmony_ci{ 78162306a36Sopenharmony_ci /* for physically contiguous pages (vram) */ 78262306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_GENERATE_PTE_PDE, 0, 0); 78362306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(pe); /* dst addr */ 78462306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(pe); 78562306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(flags); /* mask */ 78662306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(flags); 78762306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(addr); /* value */ 78862306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(addr); 78962306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = incr; /* increment size */ 79062306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = 0; 79162306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = count; /* number of entries */ 79262306a36Sopenharmony_ci} 79362306a36Sopenharmony_ci 79462306a36Sopenharmony_ci/** 79562306a36Sopenharmony_ci * cik_sdma_ring_pad_ib - pad the IB to the required number of dw 79662306a36Sopenharmony_ci * 79762306a36Sopenharmony_ci * @ring: amdgpu_ring structure holding ring information 79862306a36Sopenharmony_ci * @ib: indirect buffer to fill with padding 79962306a36Sopenharmony_ci * 80062306a36Sopenharmony_ci */ 80162306a36Sopenharmony_cistatic void cik_sdma_ring_pad_ib(struct amdgpu_ring *ring, struct amdgpu_ib *ib) 80262306a36Sopenharmony_ci{ 80362306a36Sopenharmony_ci struct amdgpu_sdma_instance *sdma = amdgpu_sdma_get_instance_from_ring(ring); 80462306a36Sopenharmony_ci u32 pad_count; 80562306a36Sopenharmony_ci int i; 80662306a36Sopenharmony_ci 80762306a36Sopenharmony_ci pad_count = (-ib->length_dw) & 7; 80862306a36Sopenharmony_ci for (i = 0; i < pad_count; i++) 80962306a36Sopenharmony_ci if (sdma && sdma->burst_nop && (i == 0)) 81062306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = 81162306a36Sopenharmony_ci SDMA_PACKET(SDMA_OPCODE_NOP, 0, 0) | 81262306a36Sopenharmony_ci SDMA_NOP_COUNT(pad_count - 1); 81362306a36Sopenharmony_ci else 81462306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = 81562306a36Sopenharmony_ci SDMA_PACKET(SDMA_OPCODE_NOP, 0, 0); 81662306a36Sopenharmony_ci} 81762306a36Sopenharmony_ci 81862306a36Sopenharmony_ci/** 81962306a36Sopenharmony_ci * cik_sdma_ring_emit_pipeline_sync - sync the pipeline 82062306a36Sopenharmony_ci * 82162306a36Sopenharmony_ci * @ring: amdgpu_ring pointer 82262306a36Sopenharmony_ci * 82362306a36Sopenharmony_ci * Make sure all previous operations are completed (CIK). 82462306a36Sopenharmony_ci */ 82562306a36Sopenharmony_cistatic void cik_sdma_ring_emit_pipeline_sync(struct amdgpu_ring *ring) 82662306a36Sopenharmony_ci{ 82762306a36Sopenharmony_ci uint32_t seq = ring->fence_drv.sync_seq; 82862306a36Sopenharmony_ci uint64_t addr = ring->fence_drv.gpu_addr; 82962306a36Sopenharmony_ci 83062306a36Sopenharmony_ci /* wait for idle */ 83162306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_POLL_REG_MEM, 0, 83262306a36Sopenharmony_ci SDMA_POLL_REG_MEM_EXTRA_OP(0) | 83362306a36Sopenharmony_ci SDMA_POLL_REG_MEM_EXTRA_FUNC(3) | /* equal */ 83462306a36Sopenharmony_ci SDMA_POLL_REG_MEM_EXTRA_M)); 83562306a36Sopenharmony_ci amdgpu_ring_write(ring, addr & 0xfffffffc); 83662306a36Sopenharmony_ci amdgpu_ring_write(ring, upper_32_bits(addr) & 0xffffffff); 83762306a36Sopenharmony_ci amdgpu_ring_write(ring, seq); /* reference */ 83862306a36Sopenharmony_ci amdgpu_ring_write(ring, 0xffffffff); /* mask */ 83962306a36Sopenharmony_ci amdgpu_ring_write(ring, (0xfff << 16) | 4); /* retry count, poll interval */ 84062306a36Sopenharmony_ci} 84162306a36Sopenharmony_ci 84262306a36Sopenharmony_ci/** 84362306a36Sopenharmony_ci * cik_sdma_ring_emit_vm_flush - cik vm flush using sDMA 84462306a36Sopenharmony_ci * 84562306a36Sopenharmony_ci * @ring: amdgpu_ring pointer 84662306a36Sopenharmony_ci * @vmid: vmid number to use 84762306a36Sopenharmony_ci * @pd_addr: address 84862306a36Sopenharmony_ci * 84962306a36Sopenharmony_ci * Update the page table base and flush the VM TLB 85062306a36Sopenharmony_ci * using sDMA (CIK). 85162306a36Sopenharmony_ci */ 85262306a36Sopenharmony_cistatic void cik_sdma_ring_emit_vm_flush(struct amdgpu_ring *ring, 85362306a36Sopenharmony_ci unsigned vmid, uint64_t pd_addr) 85462306a36Sopenharmony_ci{ 85562306a36Sopenharmony_ci u32 extra_bits = (SDMA_POLL_REG_MEM_EXTRA_OP(0) | 85662306a36Sopenharmony_ci SDMA_POLL_REG_MEM_EXTRA_FUNC(0)); /* always */ 85762306a36Sopenharmony_ci 85862306a36Sopenharmony_ci amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr); 85962306a36Sopenharmony_ci 86062306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_POLL_REG_MEM, 0, extra_bits)); 86162306a36Sopenharmony_ci amdgpu_ring_write(ring, mmVM_INVALIDATE_REQUEST << 2); 86262306a36Sopenharmony_ci amdgpu_ring_write(ring, 0); 86362306a36Sopenharmony_ci amdgpu_ring_write(ring, 0); /* reference */ 86462306a36Sopenharmony_ci amdgpu_ring_write(ring, 0); /* mask */ 86562306a36Sopenharmony_ci amdgpu_ring_write(ring, (0xfff << 16) | 10); /* retry count, poll interval */ 86662306a36Sopenharmony_ci} 86762306a36Sopenharmony_ci 86862306a36Sopenharmony_cistatic void cik_sdma_ring_emit_wreg(struct amdgpu_ring *ring, 86962306a36Sopenharmony_ci uint32_t reg, uint32_t val) 87062306a36Sopenharmony_ci{ 87162306a36Sopenharmony_ci amdgpu_ring_write(ring, SDMA_PACKET(SDMA_OPCODE_SRBM_WRITE, 0, 0xf000)); 87262306a36Sopenharmony_ci amdgpu_ring_write(ring, reg); 87362306a36Sopenharmony_ci amdgpu_ring_write(ring, val); 87462306a36Sopenharmony_ci} 87562306a36Sopenharmony_ci 87662306a36Sopenharmony_cistatic void cik_enable_sdma_mgcg(struct amdgpu_device *adev, 87762306a36Sopenharmony_ci bool enable) 87862306a36Sopenharmony_ci{ 87962306a36Sopenharmony_ci u32 orig, data; 88062306a36Sopenharmony_ci 88162306a36Sopenharmony_ci if (enable && (adev->cg_flags & AMD_CG_SUPPORT_SDMA_MGCG)) { 88262306a36Sopenharmony_ci WREG32(mmSDMA0_CLK_CTRL + SDMA0_REGISTER_OFFSET, 0x00000100); 88362306a36Sopenharmony_ci WREG32(mmSDMA0_CLK_CTRL + SDMA1_REGISTER_OFFSET, 0x00000100); 88462306a36Sopenharmony_ci } else { 88562306a36Sopenharmony_ci orig = data = RREG32(mmSDMA0_CLK_CTRL + SDMA0_REGISTER_OFFSET); 88662306a36Sopenharmony_ci data |= 0xff000000; 88762306a36Sopenharmony_ci if (data != orig) 88862306a36Sopenharmony_ci WREG32(mmSDMA0_CLK_CTRL + SDMA0_REGISTER_OFFSET, data); 88962306a36Sopenharmony_ci 89062306a36Sopenharmony_ci orig = data = RREG32(mmSDMA0_CLK_CTRL + SDMA1_REGISTER_OFFSET); 89162306a36Sopenharmony_ci data |= 0xff000000; 89262306a36Sopenharmony_ci if (data != orig) 89362306a36Sopenharmony_ci WREG32(mmSDMA0_CLK_CTRL + SDMA1_REGISTER_OFFSET, data); 89462306a36Sopenharmony_ci } 89562306a36Sopenharmony_ci} 89662306a36Sopenharmony_ci 89762306a36Sopenharmony_cistatic void cik_enable_sdma_mgls(struct amdgpu_device *adev, 89862306a36Sopenharmony_ci bool enable) 89962306a36Sopenharmony_ci{ 90062306a36Sopenharmony_ci u32 orig, data; 90162306a36Sopenharmony_ci 90262306a36Sopenharmony_ci if (enable && (adev->cg_flags & AMD_CG_SUPPORT_SDMA_LS)) { 90362306a36Sopenharmony_ci orig = data = RREG32(mmSDMA0_POWER_CNTL + SDMA0_REGISTER_OFFSET); 90462306a36Sopenharmony_ci data |= 0x100; 90562306a36Sopenharmony_ci if (orig != data) 90662306a36Sopenharmony_ci WREG32(mmSDMA0_POWER_CNTL + SDMA0_REGISTER_OFFSET, data); 90762306a36Sopenharmony_ci 90862306a36Sopenharmony_ci orig = data = RREG32(mmSDMA0_POWER_CNTL + SDMA1_REGISTER_OFFSET); 90962306a36Sopenharmony_ci data |= 0x100; 91062306a36Sopenharmony_ci if (orig != data) 91162306a36Sopenharmony_ci WREG32(mmSDMA0_POWER_CNTL + SDMA1_REGISTER_OFFSET, data); 91262306a36Sopenharmony_ci } else { 91362306a36Sopenharmony_ci orig = data = RREG32(mmSDMA0_POWER_CNTL + SDMA0_REGISTER_OFFSET); 91462306a36Sopenharmony_ci data &= ~0x100; 91562306a36Sopenharmony_ci if (orig != data) 91662306a36Sopenharmony_ci WREG32(mmSDMA0_POWER_CNTL + SDMA0_REGISTER_OFFSET, data); 91762306a36Sopenharmony_ci 91862306a36Sopenharmony_ci orig = data = RREG32(mmSDMA0_POWER_CNTL + SDMA1_REGISTER_OFFSET); 91962306a36Sopenharmony_ci data &= ~0x100; 92062306a36Sopenharmony_ci if (orig != data) 92162306a36Sopenharmony_ci WREG32(mmSDMA0_POWER_CNTL + SDMA1_REGISTER_OFFSET, data); 92262306a36Sopenharmony_ci } 92362306a36Sopenharmony_ci} 92462306a36Sopenharmony_ci 92562306a36Sopenharmony_cistatic int cik_sdma_early_init(void *handle) 92662306a36Sopenharmony_ci{ 92762306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 92862306a36Sopenharmony_ci 92962306a36Sopenharmony_ci adev->sdma.num_instances = SDMA_MAX_INSTANCE; 93062306a36Sopenharmony_ci 93162306a36Sopenharmony_ci cik_sdma_set_ring_funcs(adev); 93262306a36Sopenharmony_ci cik_sdma_set_irq_funcs(adev); 93362306a36Sopenharmony_ci cik_sdma_set_buffer_funcs(adev); 93462306a36Sopenharmony_ci cik_sdma_set_vm_pte_funcs(adev); 93562306a36Sopenharmony_ci 93662306a36Sopenharmony_ci return 0; 93762306a36Sopenharmony_ci} 93862306a36Sopenharmony_ci 93962306a36Sopenharmony_cistatic int cik_sdma_sw_init(void *handle) 94062306a36Sopenharmony_ci{ 94162306a36Sopenharmony_ci struct amdgpu_ring *ring; 94262306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 94362306a36Sopenharmony_ci int r, i; 94462306a36Sopenharmony_ci 94562306a36Sopenharmony_ci r = cik_sdma_init_microcode(adev); 94662306a36Sopenharmony_ci if (r) { 94762306a36Sopenharmony_ci DRM_ERROR("Failed to load sdma firmware!\n"); 94862306a36Sopenharmony_ci return r; 94962306a36Sopenharmony_ci } 95062306a36Sopenharmony_ci 95162306a36Sopenharmony_ci /* SDMA trap event */ 95262306a36Sopenharmony_ci r = amdgpu_irq_add_id(adev, AMDGPU_IRQ_CLIENTID_LEGACY, 224, 95362306a36Sopenharmony_ci &adev->sdma.trap_irq); 95462306a36Sopenharmony_ci if (r) 95562306a36Sopenharmony_ci return r; 95662306a36Sopenharmony_ci 95762306a36Sopenharmony_ci /* SDMA Privileged inst */ 95862306a36Sopenharmony_ci r = amdgpu_irq_add_id(adev, AMDGPU_IRQ_CLIENTID_LEGACY, 241, 95962306a36Sopenharmony_ci &adev->sdma.illegal_inst_irq); 96062306a36Sopenharmony_ci if (r) 96162306a36Sopenharmony_ci return r; 96262306a36Sopenharmony_ci 96362306a36Sopenharmony_ci /* SDMA Privileged inst */ 96462306a36Sopenharmony_ci r = amdgpu_irq_add_id(adev, AMDGPU_IRQ_CLIENTID_LEGACY, 247, 96562306a36Sopenharmony_ci &adev->sdma.illegal_inst_irq); 96662306a36Sopenharmony_ci if (r) 96762306a36Sopenharmony_ci return r; 96862306a36Sopenharmony_ci 96962306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 97062306a36Sopenharmony_ci ring = &adev->sdma.instance[i].ring; 97162306a36Sopenharmony_ci ring->ring_obj = NULL; 97262306a36Sopenharmony_ci sprintf(ring->name, "sdma%d", i); 97362306a36Sopenharmony_ci r = amdgpu_ring_init(adev, ring, 1024, 97462306a36Sopenharmony_ci &adev->sdma.trap_irq, 97562306a36Sopenharmony_ci (i == 0) ? AMDGPU_SDMA_IRQ_INSTANCE0 : 97662306a36Sopenharmony_ci AMDGPU_SDMA_IRQ_INSTANCE1, 97762306a36Sopenharmony_ci AMDGPU_RING_PRIO_DEFAULT, NULL); 97862306a36Sopenharmony_ci if (r) 97962306a36Sopenharmony_ci return r; 98062306a36Sopenharmony_ci } 98162306a36Sopenharmony_ci 98262306a36Sopenharmony_ci return r; 98362306a36Sopenharmony_ci} 98462306a36Sopenharmony_ci 98562306a36Sopenharmony_cistatic int cik_sdma_sw_fini(void *handle) 98662306a36Sopenharmony_ci{ 98762306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 98862306a36Sopenharmony_ci int i; 98962306a36Sopenharmony_ci 99062306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) 99162306a36Sopenharmony_ci amdgpu_ring_fini(&adev->sdma.instance[i].ring); 99262306a36Sopenharmony_ci 99362306a36Sopenharmony_ci cik_sdma_free_microcode(adev); 99462306a36Sopenharmony_ci return 0; 99562306a36Sopenharmony_ci} 99662306a36Sopenharmony_ci 99762306a36Sopenharmony_cistatic int cik_sdma_hw_init(void *handle) 99862306a36Sopenharmony_ci{ 99962306a36Sopenharmony_ci int r; 100062306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 100162306a36Sopenharmony_ci 100262306a36Sopenharmony_ci r = cik_sdma_start(adev); 100362306a36Sopenharmony_ci if (r) 100462306a36Sopenharmony_ci return r; 100562306a36Sopenharmony_ci 100662306a36Sopenharmony_ci return r; 100762306a36Sopenharmony_ci} 100862306a36Sopenharmony_ci 100962306a36Sopenharmony_cistatic int cik_sdma_hw_fini(void *handle) 101062306a36Sopenharmony_ci{ 101162306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 101262306a36Sopenharmony_ci 101362306a36Sopenharmony_ci cik_ctx_switch_enable(adev, false); 101462306a36Sopenharmony_ci cik_sdma_enable(adev, false); 101562306a36Sopenharmony_ci 101662306a36Sopenharmony_ci return 0; 101762306a36Sopenharmony_ci} 101862306a36Sopenharmony_ci 101962306a36Sopenharmony_cistatic int cik_sdma_suspend(void *handle) 102062306a36Sopenharmony_ci{ 102162306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 102262306a36Sopenharmony_ci 102362306a36Sopenharmony_ci return cik_sdma_hw_fini(adev); 102462306a36Sopenharmony_ci} 102562306a36Sopenharmony_ci 102662306a36Sopenharmony_cistatic int cik_sdma_resume(void *handle) 102762306a36Sopenharmony_ci{ 102862306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 102962306a36Sopenharmony_ci 103062306a36Sopenharmony_ci cik_sdma_soft_reset(handle); 103162306a36Sopenharmony_ci 103262306a36Sopenharmony_ci return cik_sdma_hw_init(adev); 103362306a36Sopenharmony_ci} 103462306a36Sopenharmony_ci 103562306a36Sopenharmony_cistatic bool cik_sdma_is_idle(void *handle) 103662306a36Sopenharmony_ci{ 103762306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 103862306a36Sopenharmony_ci u32 tmp = RREG32(mmSRBM_STATUS2); 103962306a36Sopenharmony_ci 104062306a36Sopenharmony_ci if (tmp & (SRBM_STATUS2__SDMA_BUSY_MASK | 104162306a36Sopenharmony_ci SRBM_STATUS2__SDMA1_BUSY_MASK)) 104262306a36Sopenharmony_ci return false; 104362306a36Sopenharmony_ci 104462306a36Sopenharmony_ci return true; 104562306a36Sopenharmony_ci} 104662306a36Sopenharmony_ci 104762306a36Sopenharmony_cistatic int cik_sdma_wait_for_idle(void *handle) 104862306a36Sopenharmony_ci{ 104962306a36Sopenharmony_ci unsigned i; 105062306a36Sopenharmony_ci u32 tmp; 105162306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 105262306a36Sopenharmony_ci 105362306a36Sopenharmony_ci for (i = 0; i < adev->usec_timeout; i++) { 105462306a36Sopenharmony_ci tmp = RREG32(mmSRBM_STATUS2) & (SRBM_STATUS2__SDMA_BUSY_MASK | 105562306a36Sopenharmony_ci SRBM_STATUS2__SDMA1_BUSY_MASK); 105662306a36Sopenharmony_ci 105762306a36Sopenharmony_ci if (!tmp) 105862306a36Sopenharmony_ci return 0; 105962306a36Sopenharmony_ci udelay(1); 106062306a36Sopenharmony_ci } 106162306a36Sopenharmony_ci return -ETIMEDOUT; 106262306a36Sopenharmony_ci} 106362306a36Sopenharmony_ci 106462306a36Sopenharmony_cistatic int cik_sdma_soft_reset(void *handle) 106562306a36Sopenharmony_ci{ 106662306a36Sopenharmony_ci u32 srbm_soft_reset = 0; 106762306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 106862306a36Sopenharmony_ci u32 tmp; 106962306a36Sopenharmony_ci 107062306a36Sopenharmony_ci /* sdma0 */ 107162306a36Sopenharmony_ci tmp = RREG32(mmSDMA0_F32_CNTL + SDMA0_REGISTER_OFFSET); 107262306a36Sopenharmony_ci tmp |= SDMA0_F32_CNTL__HALT_MASK; 107362306a36Sopenharmony_ci WREG32(mmSDMA0_F32_CNTL + SDMA0_REGISTER_OFFSET, tmp); 107462306a36Sopenharmony_ci srbm_soft_reset |= SRBM_SOFT_RESET__SOFT_RESET_SDMA_MASK; 107562306a36Sopenharmony_ci 107662306a36Sopenharmony_ci /* sdma1 */ 107762306a36Sopenharmony_ci tmp = RREG32(mmSDMA0_F32_CNTL + SDMA1_REGISTER_OFFSET); 107862306a36Sopenharmony_ci tmp |= SDMA0_F32_CNTL__HALT_MASK; 107962306a36Sopenharmony_ci WREG32(mmSDMA0_F32_CNTL + SDMA1_REGISTER_OFFSET, tmp); 108062306a36Sopenharmony_ci srbm_soft_reset |= SRBM_SOFT_RESET__SOFT_RESET_SDMA1_MASK; 108162306a36Sopenharmony_ci 108262306a36Sopenharmony_ci if (srbm_soft_reset) { 108362306a36Sopenharmony_ci tmp = RREG32(mmSRBM_SOFT_RESET); 108462306a36Sopenharmony_ci tmp |= srbm_soft_reset; 108562306a36Sopenharmony_ci dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp); 108662306a36Sopenharmony_ci WREG32(mmSRBM_SOFT_RESET, tmp); 108762306a36Sopenharmony_ci tmp = RREG32(mmSRBM_SOFT_RESET); 108862306a36Sopenharmony_ci 108962306a36Sopenharmony_ci udelay(50); 109062306a36Sopenharmony_ci 109162306a36Sopenharmony_ci tmp &= ~srbm_soft_reset; 109262306a36Sopenharmony_ci WREG32(mmSRBM_SOFT_RESET, tmp); 109362306a36Sopenharmony_ci tmp = RREG32(mmSRBM_SOFT_RESET); 109462306a36Sopenharmony_ci 109562306a36Sopenharmony_ci /* Wait a little for things to settle down */ 109662306a36Sopenharmony_ci udelay(50); 109762306a36Sopenharmony_ci } 109862306a36Sopenharmony_ci 109962306a36Sopenharmony_ci return 0; 110062306a36Sopenharmony_ci} 110162306a36Sopenharmony_ci 110262306a36Sopenharmony_cistatic int cik_sdma_set_trap_irq_state(struct amdgpu_device *adev, 110362306a36Sopenharmony_ci struct amdgpu_irq_src *src, 110462306a36Sopenharmony_ci unsigned type, 110562306a36Sopenharmony_ci enum amdgpu_interrupt_state state) 110662306a36Sopenharmony_ci{ 110762306a36Sopenharmony_ci u32 sdma_cntl; 110862306a36Sopenharmony_ci 110962306a36Sopenharmony_ci switch (type) { 111062306a36Sopenharmony_ci case AMDGPU_SDMA_IRQ_INSTANCE0: 111162306a36Sopenharmony_ci switch (state) { 111262306a36Sopenharmony_ci case AMDGPU_IRQ_STATE_DISABLE: 111362306a36Sopenharmony_ci sdma_cntl = RREG32(mmSDMA0_CNTL + SDMA0_REGISTER_OFFSET); 111462306a36Sopenharmony_ci sdma_cntl &= ~SDMA0_CNTL__TRAP_ENABLE_MASK; 111562306a36Sopenharmony_ci WREG32(mmSDMA0_CNTL + SDMA0_REGISTER_OFFSET, sdma_cntl); 111662306a36Sopenharmony_ci break; 111762306a36Sopenharmony_ci case AMDGPU_IRQ_STATE_ENABLE: 111862306a36Sopenharmony_ci sdma_cntl = RREG32(mmSDMA0_CNTL + SDMA0_REGISTER_OFFSET); 111962306a36Sopenharmony_ci sdma_cntl |= SDMA0_CNTL__TRAP_ENABLE_MASK; 112062306a36Sopenharmony_ci WREG32(mmSDMA0_CNTL + SDMA0_REGISTER_OFFSET, sdma_cntl); 112162306a36Sopenharmony_ci break; 112262306a36Sopenharmony_ci default: 112362306a36Sopenharmony_ci break; 112462306a36Sopenharmony_ci } 112562306a36Sopenharmony_ci break; 112662306a36Sopenharmony_ci case AMDGPU_SDMA_IRQ_INSTANCE1: 112762306a36Sopenharmony_ci switch (state) { 112862306a36Sopenharmony_ci case AMDGPU_IRQ_STATE_DISABLE: 112962306a36Sopenharmony_ci sdma_cntl = RREG32(mmSDMA0_CNTL + SDMA1_REGISTER_OFFSET); 113062306a36Sopenharmony_ci sdma_cntl &= ~SDMA0_CNTL__TRAP_ENABLE_MASK; 113162306a36Sopenharmony_ci WREG32(mmSDMA0_CNTL + SDMA1_REGISTER_OFFSET, sdma_cntl); 113262306a36Sopenharmony_ci break; 113362306a36Sopenharmony_ci case AMDGPU_IRQ_STATE_ENABLE: 113462306a36Sopenharmony_ci sdma_cntl = RREG32(mmSDMA0_CNTL + SDMA1_REGISTER_OFFSET); 113562306a36Sopenharmony_ci sdma_cntl |= SDMA0_CNTL__TRAP_ENABLE_MASK; 113662306a36Sopenharmony_ci WREG32(mmSDMA0_CNTL + SDMA1_REGISTER_OFFSET, sdma_cntl); 113762306a36Sopenharmony_ci break; 113862306a36Sopenharmony_ci default: 113962306a36Sopenharmony_ci break; 114062306a36Sopenharmony_ci } 114162306a36Sopenharmony_ci break; 114262306a36Sopenharmony_ci default: 114362306a36Sopenharmony_ci break; 114462306a36Sopenharmony_ci } 114562306a36Sopenharmony_ci return 0; 114662306a36Sopenharmony_ci} 114762306a36Sopenharmony_ci 114862306a36Sopenharmony_cistatic int cik_sdma_process_trap_irq(struct amdgpu_device *adev, 114962306a36Sopenharmony_ci struct amdgpu_irq_src *source, 115062306a36Sopenharmony_ci struct amdgpu_iv_entry *entry) 115162306a36Sopenharmony_ci{ 115262306a36Sopenharmony_ci u8 instance_id, queue_id; 115362306a36Sopenharmony_ci 115462306a36Sopenharmony_ci instance_id = (entry->ring_id & 0x3) >> 0; 115562306a36Sopenharmony_ci queue_id = (entry->ring_id & 0xc) >> 2; 115662306a36Sopenharmony_ci DRM_DEBUG("IH: SDMA trap\n"); 115762306a36Sopenharmony_ci switch (instance_id) { 115862306a36Sopenharmony_ci case 0: 115962306a36Sopenharmony_ci switch (queue_id) { 116062306a36Sopenharmony_ci case 0: 116162306a36Sopenharmony_ci amdgpu_fence_process(&adev->sdma.instance[0].ring); 116262306a36Sopenharmony_ci break; 116362306a36Sopenharmony_ci case 1: 116462306a36Sopenharmony_ci /* XXX compute */ 116562306a36Sopenharmony_ci break; 116662306a36Sopenharmony_ci case 2: 116762306a36Sopenharmony_ci /* XXX compute */ 116862306a36Sopenharmony_ci break; 116962306a36Sopenharmony_ci } 117062306a36Sopenharmony_ci break; 117162306a36Sopenharmony_ci case 1: 117262306a36Sopenharmony_ci switch (queue_id) { 117362306a36Sopenharmony_ci case 0: 117462306a36Sopenharmony_ci amdgpu_fence_process(&adev->sdma.instance[1].ring); 117562306a36Sopenharmony_ci break; 117662306a36Sopenharmony_ci case 1: 117762306a36Sopenharmony_ci /* XXX compute */ 117862306a36Sopenharmony_ci break; 117962306a36Sopenharmony_ci case 2: 118062306a36Sopenharmony_ci /* XXX compute */ 118162306a36Sopenharmony_ci break; 118262306a36Sopenharmony_ci } 118362306a36Sopenharmony_ci break; 118462306a36Sopenharmony_ci } 118562306a36Sopenharmony_ci 118662306a36Sopenharmony_ci return 0; 118762306a36Sopenharmony_ci} 118862306a36Sopenharmony_ci 118962306a36Sopenharmony_cistatic int cik_sdma_process_illegal_inst_irq(struct amdgpu_device *adev, 119062306a36Sopenharmony_ci struct amdgpu_irq_src *source, 119162306a36Sopenharmony_ci struct amdgpu_iv_entry *entry) 119262306a36Sopenharmony_ci{ 119362306a36Sopenharmony_ci u8 instance_id; 119462306a36Sopenharmony_ci 119562306a36Sopenharmony_ci DRM_ERROR("Illegal instruction in SDMA command stream\n"); 119662306a36Sopenharmony_ci instance_id = (entry->ring_id & 0x3) >> 0; 119762306a36Sopenharmony_ci drm_sched_fault(&adev->sdma.instance[instance_id].ring.sched); 119862306a36Sopenharmony_ci return 0; 119962306a36Sopenharmony_ci} 120062306a36Sopenharmony_ci 120162306a36Sopenharmony_cistatic int cik_sdma_set_clockgating_state(void *handle, 120262306a36Sopenharmony_ci enum amd_clockgating_state state) 120362306a36Sopenharmony_ci{ 120462306a36Sopenharmony_ci bool gate = false; 120562306a36Sopenharmony_ci struct amdgpu_device *adev = (struct amdgpu_device *)handle; 120662306a36Sopenharmony_ci 120762306a36Sopenharmony_ci if (state == AMD_CG_STATE_GATE) 120862306a36Sopenharmony_ci gate = true; 120962306a36Sopenharmony_ci 121062306a36Sopenharmony_ci cik_enable_sdma_mgcg(adev, gate); 121162306a36Sopenharmony_ci cik_enable_sdma_mgls(adev, gate); 121262306a36Sopenharmony_ci 121362306a36Sopenharmony_ci return 0; 121462306a36Sopenharmony_ci} 121562306a36Sopenharmony_ci 121662306a36Sopenharmony_cistatic int cik_sdma_set_powergating_state(void *handle, 121762306a36Sopenharmony_ci enum amd_powergating_state state) 121862306a36Sopenharmony_ci{ 121962306a36Sopenharmony_ci return 0; 122062306a36Sopenharmony_ci} 122162306a36Sopenharmony_ci 122262306a36Sopenharmony_cistatic const struct amd_ip_funcs cik_sdma_ip_funcs = { 122362306a36Sopenharmony_ci .name = "cik_sdma", 122462306a36Sopenharmony_ci .early_init = cik_sdma_early_init, 122562306a36Sopenharmony_ci .late_init = NULL, 122662306a36Sopenharmony_ci .sw_init = cik_sdma_sw_init, 122762306a36Sopenharmony_ci .sw_fini = cik_sdma_sw_fini, 122862306a36Sopenharmony_ci .hw_init = cik_sdma_hw_init, 122962306a36Sopenharmony_ci .hw_fini = cik_sdma_hw_fini, 123062306a36Sopenharmony_ci .suspend = cik_sdma_suspend, 123162306a36Sopenharmony_ci .resume = cik_sdma_resume, 123262306a36Sopenharmony_ci .is_idle = cik_sdma_is_idle, 123362306a36Sopenharmony_ci .wait_for_idle = cik_sdma_wait_for_idle, 123462306a36Sopenharmony_ci .soft_reset = cik_sdma_soft_reset, 123562306a36Sopenharmony_ci .set_clockgating_state = cik_sdma_set_clockgating_state, 123662306a36Sopenharmony_ci .set_powergating_state = cik_sdma_set_powergating_state, 123762306a36Sopenharmony_ci}; 123862306a36Sopenharmony_ci 123962306a36Sopenharmony_cistatic const struct amdgpu_ring_funcs cik_sdma_ring_funcs = { 124062306a36Sopenharmony_ci .type = AMDGPU_RING_TYPE_SDMA, 124162306a36Sopenharmony_ci .align_mask = 0xf, 124262306a36Sopenharmony_ci .nop = SDMA_PACKET(SDMA_OPCODE_NOP, 0, 0), 124362306a36Sopenharmony_ci .support_64bit_ptrs = false, 124462306a36Sopenharmony_ci .get_rptr = cik_sdma_ring_get_rptr, 124562306a36Sopenharmony_ci .get_wptr = cik_sdma_ring_get_wptr, 124662306a36Sopenharmony_ci .set_wptr = cik_sdma_ring_set_wptr, 124762306a36Sopenharmony_ci .emit_frame_size = 124862306a36Sopenharmony_ci 6 + /* cik_sdma_ring_emit_hdp_flush */ 124962306a36Sopenharmony_ci 3 + /* hdp invalidate */ 125062306a36Sopenharmony_ci 6 + /* cik_sdma_ring_emit_pipeline_sync */ 125162306a36Sopenharmony_ci CIK_FLUSH_GPU_TLB_NUM_WREG * 3 + 6 + /* cik_sdma_ring_emit_vm_flush */ 125262306a36Sopenharmony_ci 9 + 9 + 9, /* cik_sdma_ring_emit_fence x3 for user fence, vm fence */ 125362306a36Sopenharmony_ci .emit_ib_size = 7 + 4, /* cik_sdma_ring_emit_ib */ 125462306a36Sopenharmony_ci .emit_ib = cik_sdma_ring_emit_ib, 125562306a36Sopenharmony_ci .emit_fence = cik_sdma_ring_emit_fence, 125662306a36Sopenharmony_ci .emit_pipeline_sync = cik_sdma_ring_emit_pipeline_sync, 125762306a36Sopenharmony_ci .emit_vm_flush = cik_sdma_ring_emit_vm_flush, 125862306a36Sopenharmony_ci .emit_hdp_flush = cik_sdma_ring_emit_hdp_flush, 125962306a36Sopenharmony_ci .test_ring = cik_sdma_ring_test_ring, 126062306a36Sopenharmony_ci .test_ib = cik_sdma_ring_test_ib, 126162306a36Sopenharmony_ci .insert_nop = cik_sdma_ring_insert_nop, 126262306a36Sopenharmony_ci .pad_ib = cik_sdma_ring_pad_ib, 126362306a36Sopenharmony_ci .emit_wreg = cik_sdma_ring_emit_wreg, 126462306a36Sopenharmony_ci}; 126562306a36Sopenharmony_ci 126662306a36Sopenharmony_cistatic void cik_sdma_set_ring_funcs(struct amdgpu_device *adev) 126762306a36Sopenharmony_ci{ 126862306a36Sopenharmony_ci int i; 126962306a36Sopenharmony_ci 127062306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 127162306a36Sopenharmony_ci adev->sdma.instance[i].ring.funcs = &cik_sdma_ring_funcs; 127262306a36Sopenharmony_ci adev->sdma.instance[i].ring.me = i; 127362306a36Sopenharmony_ci } 127462306a36Sopenharmony_ci} 127562306a36Sopenharmony_ci 127662306a36Sopenharmony_cistatic const struct amdgpu_irq_src_funcs cik_sdma_trap_irq_funcs = { 127762306a36Sopenharmony_ci .set = cik_sdma_set_trap_irq_state, 127862306a36Sopenharmony_ci .process = cik_sdma_process_trap_irq, 127962306a36Sopenharmony_ci}; 128062306a36Sopenharmony_ci 128162306a36Sopenharmony_cistatic const struct amdgpu_irq_src_funcs cik_sdma_illegal_inst_irq_funcs = { 128262306a36Sopenharmony_ci .process = cik_sdma_process_illegal_inst_irq, 128362306a36Sopenharmony_ci}; 128462306a36Sopenharmony_ci 128562306a36Sopenharmony_cistatic void cik_sdma_set_irq_funcs(struct amdgpu_device *adev) 128662306a36Sopenharmony_ci{ 128762306a36Sopenharmony_ci adev->sdma.trap_irq.num_types = AMDGPU_SDMA_IRQ_LAST; 128862306a36Sopenharmony_ci adev->sdma.trap_irq.funcs = &cik_sdma_trap_irq_funcs; 128962306a36Sopenharmony_ci adev->sdma.illegal_inst_irq.funcs = &cik_sdma_illegal_inst_irq_funcs; 129062306a36Sopenharmony_ci} 129162306a36Sopenharmony_ci 129262306a36Sopenharmony_ci/** 129362306a36Sopenharmony_ci * cik_sdma_emit_copy_buffer - copy buffer using the sDMA engine 129462306a36Sopenharmony_ci * 129562306a36Sopenharmony_ci * @ib: indirect buffer to copy to 129662306a36Sopenharmony_ci * @src_offset: src GPU address 129762306a36Sopenharmony_ci * @dst_offset: dst GPU address 129862306a36Sopenharmony_ci * @byte_count: number of bytes to xfer 129962306a36Sopenharmony_ci * @tmz: is this a secure operation 130062306a36Sopenharmony_ci * 130162306a36Sopenharmony_ci * Copy GPU buffers using the DMA engine (CIK). 130262306a36Sopenharmony_ci * Used by the amdgpu ttm implementation to move pages if 130362306a36Sopenharmony_ci * registered as the asic copy callback. 130462306a36Sopenharmony_ci */ 130562306a36Sopenharmony_cistatic void cik_sdma_emit_copy_buffer(struct amdgpu_ib *ib, 130662306a36Sopenharmony_ci uint64_t src_offset, 130762306a36Sopenharmony_ci uint64_t dst_offset, 130862306a36Sopenharmony_ci uint32_t byte_count, 130962306a36Sopenharmony_ci bool tmz) 131062306a36Sopenharmony_ci{ 131162306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_COPY, SDMA_COPY_SUB_OPCODE_LINEAR, 0); 131262306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = byte_count; 131362306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = 0; /* src/dst endian swap */ 131462306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(src_offset); 131562306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(src_offset); 131662306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(dst_offset); 131762306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(dst_offset); 131862306a36Sopenharmony_ci} 131962306a36Sopenharmony_ci 132062306a36Sopenharmony_ci/** 132162306a36Sopenharmony_ci * cik_sdma_emit_fill_buffer - fill buffer using the sDMA engine 132262306a36Sopenharmony_ci * 132362306a36Sopenharmony_ci * @ib: indirect buffer to fill 132462306a36Sopenharmony_ci * @src_data: value to write to buffer 132562306a36Sopenharmony_ci * @dst_offset: dst GPU address 132662306a36Sopenharmony_ci * @byte_count: number of bytes to xfer 132762306a36Sopenharmony_ci * 132862306a36Sopenharmony_ci * Fill GPU buffers using the DMA engine (CIK). 132962306a36Sopenharmony_ci */ 133062306a36Sopenharmony_cistatic void cik_sdma_emit_fill_buffer(struct amdgpu_ib *ib, 133162306a36Sopenharmony_ci uint32_t src_data, 133262306a36Sopenharmony_ci uint64_t dst_offset, 133362306a36Sopenharmony_ci uint32_t byte_count) 133462306a36Sopenharmony_ci{ 133562306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_CONSTANT_FILL, 0, 0); 133662306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = lower_32_bits(dst_offset); 133762306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = upper_32_bits(dst_offset); 133862306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = src_data; 133962306a36Sopenharmony_ci ib->ptr[ib->length_dw++] = byte_count; 134062306a36Sopenharmony_ci} 134162306a36Sopenharmony_ci 134262306a36Sopenharmony_cistatic const struct amdgpu_buffer_funcs cik_sdma_buffer_funcs = { 134362306a36Sopenharmony_ci .copy_max_bytes = 0x1fffff, 134462306a36Sopenharmony_ci .copy_num_dw = 7, 134562306a36Sopenharmony_ci .emit_copy_buffer = cik_sdma_emit_copy_buffer, 134662306a36Sopenharmony_ci 134762306a36Sopenharmony_ci .fill_max_bytes = 0x1fffff, 134862306a36Sopenharmony_ci .fill_num_dw = 5, 134962306a36Sopenharmony_ci .emit_fill_buffer = cik_sdma_emit_fill_buffer, 135062306a36Sopenharmony_ci}; 135162306a36Sopenharmony_ci 135262306a36Sopenharmony_cistatic void cik_sdma_set_buffer_funcs(struct amdgpu_device *adev) 135362306a36Sopenharmony_ci{ 135462306a36Sopenharmony_ci adev->mman.buffer_funcs = &cik_sdma_buffer_funcs; 135562306a36Sopenharmony_ci adev->mman.buffer_funcs_ring = &adev->sdma.instance[0].ring; 135662306a36Sopenharmony_ci} 135762306a36Sopenharmony_ci 135862306a36Sopenharmony_cistatic const struct amdgpu_vm_pte_funcs cik_sdma_vm_pte_funcs = { 135962306a36Sopenharmony_ci .copy_pte_num_dw = 7, 136062306a36Sopenharmony_ci .copy_pte = cik_sdma_vm_copy_pte, 136162306a36Sopenharmony_ci 136262306a36Sopenharmony_ci .write_pte = cik_sdma_vm_write_pte, 136362306a36Sopenharmony_ci .set_pte_pde = cik_sdma_vm_set_pte_pde, 136462306a36Sopenharmony_ci}; 136562306a36Sopenharmony_ci 136662306a36Sopenharmony_cistatic void cik_sdma_set_vm_pte_funcs(struct amdgpu_device *adev) 136762306a36Sopenharmony_ci{ 136862306a36Sopenharmony_ci unsigned i; 136962306a36Sopenharmony_ci 137062306a36Sopenharmony_ci adev->vm_manager.vm_pte_funcs = &cik_sdma_vm_pte_funcs; 137162306a36Sopenharmony_ci for (i = 0; i < adev->sdma.num_instances; i++) { 137262306a36Sopenharmony_ci adev->vm_manager.vm_pte_scheds[i] = 137362306a36Sopenharmony_ci &adev->sdma.instance[i].ring.sched; 137462306a36Sopenharmony_ci } 137562306a36Sopenharmony_ci adev->vm_manager.vm_pte_num_scheds = adev->sdma.num_instances; 137662306a36Sopenharmony_ci} 137762306a36Sopenharmony_ci 137862306a36Sopenharmony_ciconst struct amdgpu_ip_block_version cik_sdma_ip_block = 137962306a36Sopenharmony_ci{ 138062306a36Sopenharmony_ci .type = AMD_IP_BLOCK_TYPE_SDMA, 138162306a36Sopenharmony_ci .major = 2, 138262306a36Sopenharmony_ci .minor = 0, 138362306a36Sopenharmony_ci .rev = 0, 138462306a36Sopenharmony_ci .funcs = &cik_sdma_ip_funcs, 138562306a36Sopenharmony_ci}; 1386