18c2ecf20Sopenharmony_ci/* 28c2ecf20Sopenharmony_ci * Copyright 2014 Advanced Micro Devices, Inc. 38c2ecf20Sopenharmony_ci * 48c2ecf20Sopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a 58c2ecf20Sopenharmony_ci * copy of this software and associated documentation files (the "Software"), 68c2ecf20Sopenharmony_ci * to deal in the Software without restriction, including without limitation 78c2ecf20Sopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense, 88c2ecf20Sopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the 98c2ecf20Sopenharmony_ci * Software is furnished to do so, subject to the following conditions: 108c2ecf20Sopenharmony_ci * 118c2ecf20Sopenharmony_ci * The above copyright notice and this permission notice shall be included in 128c2ecf20Sopenharmony_ci * all copies or substantial portions of the Software. 138c2ecf20Sopenharmony_ci * 148c2ecf20Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 158c2ecf20Sopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 168c2ecf20Sopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 178c2ecf20Sopenharmony_ci * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 188c2ecf20Sopenharmony_ci * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 198c2ecf20Sopenharmony_ci * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 208c2ecf20Sopenharmony_ci * OTHER DEALINGS IN THE SOFTWARE. 218c2ecf20Sopenharmony_ci */ 228c2ecf20Sopenharmony_ci 238c2ecf20Sopenharmony_ci#include <linux/device.h> 248c2ecf20Sopenharmony_ci#include <linux/export.h> 258c2ecf20Sopenharmony_ci#include <linux/err.h> 268c2ecf20Sopenharmony_ci#include <linux/fs.h> 278c2ecf20Sopenharmony_ci#include <linux/file.h> 288c2ecf20Sopenharmony_ci#include <linux/sched.h> 298c2ecf20Sopenharmony_ci#include <linux/slab.h> 308c2ecf20Sopenharmony_ci#include <linux/uaccess.h> 318c2ecf20Sopenharmony_ci#include <linux/compat.h> 328c2ecf20Sopenharmony_ci#include <uapi/linux/kfd_ioctl.h> 338c2ecf20Sopenharmony_ci#include <linux/time.h> 348c2ecf20Sopenharmony_ci#include <linux/mm.h> 358c2ecf20Sopenharmony_ci#include <linux/mman.h> 368c2ecf20Sopenharmony_ci#include <linux/dma-buf.h> 378c2ecf20Sopenharmony_ci#include <asm/processor.h> 388c2ecf20Sopenharmony_ci#include "kfd_priv.h" 398c2ecf20Sopenharmony_ci#include "kfd_device_queue_manager.h" 408c2ecf20Sopenharmony_ci#include "kfd_dbgmgr.h" 418c2ecf20Sopenharmony_ci#include "amdgpu_amdkfd.h" 428c2ecf20Sopenharmony_ci#include "kfd_smi_events.h" 438c2ecf20Sopenharmony_ci 448c2ecf20Sopenharmony_cistatic long kfd_ioctl(struct file *, unsigned int, unsigned long); 458c2ecf20Sopenharmony_cistatic int kfd_open(struct inode *, struct file *); 468c2ecf20Sopenharmony_cistatic int kfd_release(struct inode *, struct file *); 478c2ecf20Sopenharmony_cistatic int kfd_mmap(struct file *, struct vm_area_struct *); 488c2ecf20Sopenharmony_ci 498c2ecf20Sopenharmony_cistatic const char kfd_dev_name[] = "kfd"; 508c2ecf20Sopenharmony_ci 518c2ecf20Sopenharmony_cistatic const struct file_operations kfd_fops = { 528c2ecf20Sopenharmony_ci .owner = THIS_MODULE, 538c2ecf20Sopenharmony_ci .unlocked_ioctl = kfd_ioctl, 548c2ecf20Sopenharmony_ci .compat_ioctl = compat_ptr_ioctl, 558c2ecf20Sopenharmony_ci .open = kfd_open, 568c2ecf20Sopenharmony_ci .release = kfd_release, 578c2ecf20Sopenharmony_ci .mmap = kfd_mmap, 588c2ecf20Sopenharmony_ci}; 598c2ecf20Sopenharmony_ci 608c2ecf20Sopenharmony_cistatic int kfd_char_dev_major = -1; 618c2ecf20Sopenharmony_cistatic struct class *kfd_class; 628c2ecf20Sopenharmony_cistruct device *kfd_device; 638c2ecf20Sopenharmony_ci 648c2ecf20Sopenharmony_ciint kfd_chardev_init(void) 658c2ecf20Sopenharmony_ci{ 668c2ecf20Sopenharmony_ci int err = 0; 678c2ecf20Sopenharmony_ci 688c2ecf20Sopenharmony_ci kfd_char_dev_major = register_chrdev(0, kfd_dev_name, &kfd_fops); 698c2ecf20Sopenharmony_ci err = kfd_char_dev_major; 708c2ecf20Sopenharmony_ci if (err < 0) 718c2ecf20Sopenharmony_ci goto err_register_chrdev; 728c2ecf20Sopenharmony_ci 738c2ecf20Sopenharmony_ci kfd_class = class_create(THIS_MODULE, kfd_dev_name); 748c2ecf20Sopenharmony_ci err = PTR_ERR(kfd_class); 758c2ecf20Sopenharmony_ci if (IS_ERR(kfd_class)) 768c2ecf20Sopenharmony_ci goto err_class_create; 778c2ecf20Sopenharmony_ci 788c2ecf20Sopenharmony_ci kfd_device = device_create(kfd_class, NULL, 798c2ecf20Sopenharmony_ci MKDEV(kfd_char_dev_major, 0), 808c2ecf20Sopenharmony_ci NULL, kfd_dev_name); 818c2ecf20Sopenharmony_ci err = PTR_ERR(kfd_device); 828c2ecf20Sopenharmony_ci if (IS_ERR(kfd_device)) 838c2ecf20Sopenharmony_ci goto err_device_create; 848c2ecf20Sopenharmony_ci 858c2ecf20Sopenharmony_ci return 0; 868c2ecf20Sopenharmony_ci 878c2ecf20Sopenharmony_cierr_device_create: 888c2ecf20Sopenharmony_ci class_destroy(kfd_class); 898c2ecf20Sopenharmony_cierr_class_create: 908c2ecf20Sopenharmony_ci unregister_chrdev(kfd_char_dev_major, kfd_dev_name); 918c2ecf20Sopenharmony_cierr_register_chrdev: 928c2ecf20Sopenharmony_ci return err; 938c2ecf20Sopenharmony_ci} 948c2ecf20Sopenharmony_ci 958c2ecf20Sopenharmony_civoid kfd_chardev_exit(void) 968c2ecf20Sopenharmony_ci{ 978c2ecf20Sopenharmony_ci device_destroy(kfd_class, MKDEV(kfd_char_dev_major, 0)); 988c2ecf20Sopenharmony_ci class_destroy(kfd_class); 998c2ecf20Sopenharmony_ci unregister_chrdev(kfd_char_dev_major, kfd_dev_name); 1008c2ecf20Sopenharmony_ci kfd_device = NULL; 1018c2ecf20Sopenharmony_ci} 1028c2ecf20Sopenharmony_ci 1038c2ecf20Sopenharmony_cistruct device *kfd_chardev(void) 1048c2ecf20Sopenharmony_ci{ 1058c2ecf20Sopenharmony_ci return kfd_device; 1068c2ecf20Sopenharmony_ci} 1078c2ecf20Sopenharmony_ci 1088c2ecf20Sopenharmony_ci 1098c2ecf20Sopenharmony_cistatic int kfd_open(struct inode *inode, struct file *filep) 1108c2ecf20Sopenharmony_ci{ 1118c2ecf20Sopenharmony_ci struct kfd_process *process; 1128c2ecf20Sopenharmony_ci bool is_32bit_user_mode; 1138c2ecf20Sopenharmony_ci 1148c2ecf20Sopenharmony_ci if (iminor(inode) != 0) 1158c2ecf20Sopenharmony_ci return -ENODEV; 1168c2ecf20Sopenharmony_ci 1178c2ecf20Sopenharmony_ci is_32bit_user_mode = in_compat_syscall(); 1188c2ecf20Sopenharmony_ci 1198c2ecf20Sopenharmony_ci if (is_32bit_user_mode) { 1208c2ecf20Sopenharmony_ci dev_warn(kfd_device, 1218c2ecf20Sopenharmony_ci "Process %d (32-bit) failed to open /dev/kfd\n" 1228c2ecf20Sopenharmony_ci "32-bit processes are not supported by amdkfd\n", 1238c2ecf20Sopenharmony_ci current->pid); 1248c2ecf20Sopenharmony_ci return -EPERM; 1258c2ecf20Sopenharmony_ci } 1268c2ecf20Sopenharmony_ci 1278c2ecf20Sopenharmony_ci process = kfd_create_process(filep); 1288c2ecf20Sopenharmony_ci if (IS_ERR(process)) 1298c2ecf20Sopenharmony_ci return PTR_ERR(process); 1308c2ecf20Sopenharmony_ci 1318c2ecf20Sopenharmony_ci if (kfd_is_locked()) { 1328c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "kfd is locked!\n" 1338c2ecf20Sopenharmony_ci "process %d unreferenced", process->pasid); 1348c2ecf20Sopenharmony_ci kfd_unref_process(process); 1358c2ecf20Sopenharmony_ci return -EAGAIN; 1368c2ecf20Sopenharmony_ci } 1378c2ecf20Sopenharmony_ci 1388c2ecf20Sopenharmony_ci /* filep now owns the reference returned by kfd_create_process */ 1398c2ecf20Sopenharmony_ci filep->private_data = process; 1408c2ecf20Sopenharmony_ci 1418c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "process %d opened, compat mode (32 bit) - %d\n", 1428c2ecf20Sopenharmony_ci process->pasid, process->is_32bit_user_mode); 1438c2ecf20Sopenharmony_ci 1448c2ecf20Sopenharmony_ci return 0; 1458c2ecf20Sopenharmony_ci} 1468c2ecf20Sopenharmony_ci 1478c2ecf20Sopenharmony_cistatic int kfd_release(struct inode *inode, struct file *filep) 1488c2ecf20Sopenharmony_ci{ 1498c2ecf20Sopenharmony_ci struct kfd_process *process = filep->private_data; 1508c2ecf20Sopenharmony_ci 1518c2ecf20Sopenharmony_ci if (process) 1528c2ecf20Sopenharmony_ci kfd_unref_process(process); 1538c2ecf20Sopenharmony_ci 1548c2ecf20Sopenharmony_ci return 0; 1558c2ecf20Sopenharmony_ci} 1568c2ecf20Sopenharmony_ci 1578c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_version(struct file *filep, struct kfd_process *p, 1588c2ecf20Sopenharmony_ci void *data) 1598c2ecf20Sopenharmony_ci{ 1608c2ecf20Sopenharmony_ci struct kfd_ioctl_get_version_args *args = data; 1618c2ecf20Sopenharmony_ci 1628c2ecf20Sopenharmony_ci args->major_version = KFD_IOCTL_MAJOR_VERSION; 1638c2ecf20Sopenharmony_ci args->minor_version = KFD_IOCTL_MINOR_VERSION; 1648c2ecf20Sopenharmony_ci 1658c2ecf20Sopenharmony_ci return 0; 1668c2ecf20Sopenharmony_ci} 1678c2ecf20Sopenharmony_ci 1688c2ecf20Sopenharmony_cistatic int set_queue_properties_from_user(struct queue_properties *q_properties, 1698c2ecf20Sopenharmony_ci struct kfd_ioctl_create_queue_args *args) 1708c2ecf20Sopenharmony_ci{ 1718c2ecf20Sopenharmony_ci if (args->queue_percentage > KFD_MAX_QUEUE_PERCENTAGE) { 1728c2ecf20Sopenharmony_ci pr_err("Queue percentage must be between 0 to KFD_MAX_QUEUE_PERCENTAGE\n"); 1738c2ecf20Sopenharmony_ci return -EINVAL; 1748c2ecf20Sopenharmony_ci } 1758c2ecf20Sopenharmony_ci 1768c2ecf20Sopenharmony_ci if (args->queue_priority > KFD_MAX_QUEUE_PRIORITY) { 1778c2ecf20Sopenharmony_ci pr_err("Queue priority must be between 0 to KFD_MAX_QUEUE_PRIORITY\n"); 1788c2ecf20Sopenharmony_ci return -EINVAL; 1798c2ecf20Sopenharmony_ci } 1808c2ecf20Sopenharmony_ci 1818c2ecf20Sopenharmony_ci if ((args->ring_base_address) && 1828c2ecf20Sopenharmony_ci (!access_ok((const void __user *) args->ring_base_address, 1838c2ecf20Sopenharmony_ci sizeof(uint64_t)))) { 1848c2ecf20Sopenharmony_ci pr_err("Can't access ring base address\n"); 1858c2ecf20Sopenharmony_ci return -EFAULT; 1868c2ecf20Sopenharmony_ci } 1878c2ecf20Sopenharmony_ci 1888c2ecf20Sopenharmony_ci if (!is_power_of_2(args->ring_size) && (args->ring_size != 0)) { 1898c2ecf20Sopenharmony_ci pr_err("Ring size must be a power of 2 or 0\n"); 1908c2ecf20Sopenharmony_ci return -EINVAL; 1918c2ecf20Sopenharmony_ci } 1928c2ecf20Sopenharmony_ci 1938c2ecf20Sopenharmony_ci if (!access_ok((const void __user *) args->read_pointer_address, 1948c2ecf20Sopenharmony_ci sizeof(uint32_t))) { 1958c2ecf20Sopenharmony_ci pr_err("Can't access read pointer\n"); 1968c2ecf20Sopenharmony_ci return -EFAULT; 1978c2ecf20Sopenharmony_ci } 1988c2ecf20Sopenharmony_ci 1998c2ecf20Sopenharmony_ci if (!access_ok((const void __user *) args->write_pointer_address, 2008c2ecf20Sopenharmony_ci sizeof(uint32_t))) { 2018c2ecf20Sopenharmony_ci pr_err("Can't access write pointer\n"); 2028c2ecf20Sopenharmony_ci return -EFAULT; 2038c2ecf20Sopenharmony_ci } 2048c2ecf20Sopenharmony_ci 2058c2ecf20Sopenharmony_ci if (args->eop_buffer_address && 2068c2ecf20Sopenharmony_ci !access_ok((const void __user *) args->eop_buffer_address, 2078c2ecf20Sopenharmony_ci sizeof(uint32_t))) { 2088c2ecf20Sopenharmony_ci pr_debug("Can't access eop buffer"); 2098c2ecf20Sopenharmony_ci return -EFAULT; 2108c2ecf20Sopenharmony_ci } 2118c2ecf20Sopenharmony_ci 2128c2ecf20Sopenharmony_ci if (args->ctx_save_restore_address && 2138c2ecf20Sopenharmony_ci !access_ok((const void __user *) args->ctx_save_restore_address, 2148c2ecf20Sopenharmony_ci sizeof(uint32_t))) { 2158c2ecf20Sopenharmony_ci pr_debug("Can't access ctx save restore buffer"); 2168c2ecf20Sopenharmony_ci return -EFAULT; 2178c2ecf20Sopenharmony_ci } 2188c2ecf20Sopenharmony_ci 2198c2ecf20Sopenharmony_ci q_properties->is_interop = false; 2208c2ecf20Sopenharmony_ci q_properties->is_gws = false; 2218c2ecf20Sopenharmony_ci q_properties->queue_percent = args->queue_percentage; 2228c2ecf20Sopenharmony_ci q_properties->priority = args->queue_priority; 2238c2ecf20Sopenharmony_ci q_properties->queue_address = args->ring_base_address; 2248c2ecf20Sopenharmony_ci q_properties->queue_size = args->ring_size; 2258c2ecf20Sopenharmony_ci q_properties->read_ptr = (uint32_t *) args->read_pointer_address; 2268c2ecf20Sopenharmony_ci q_properties->write_ptr = (uint32_t *) args->write_pointer_address; 2278c2ecf20Sopenharmony_ci q_properties->eop_ring_buffer_address = args->eop_buffer_address; 2288c2ecf20Sopenharmony_ci q_properties->eop_ring_buffer_size = args->eop_buffer_size; 2298c2ecf20Sopenharmony_ci q_properties->ctx_save_restore_area_address = 2308c2ecf20Sopenharmony_ci args->ctx_save_restore_address; 2318c2ecf20Sopenharmony_ci q_properties->ctx_save_restore_area_size = args->ctx_save_restore_size; 2328c2ecf20Sopenharmony_ci q_properties->ctl_stack_size = args->ctl_stack_size; 2338c2ecf20Sopenharmony_ci if (args->queue_type == KFD_IOC_QUEUE_TYPE_COMPUTE || 2348c2ecf20Sopenharmony_ci args->queue_type == KFD_IOC_QUEUE_TYPE_COMPUTE_AQL) 2358c2ecf20Sopenharmony_ci q_properties->type = KFD_QUEUE_TYPE_COMPUTE; 2368c2ecf20Sopenharmony_ci else if (args->queue_type == KFD_IOC_QUEUE_TYPE_SDMA) 2378c2ecf20Sopenharmony_ci q_properties->type = KFD_QUEUE_TYPE_SDMA; 2388c2ecf20Sopenharmony_ci else if (args->queue_type == KFD_IOC_QUEUE_TYPE_SDMA_XGMI) 2398c2ecf20Sopenharmony_ci q_properties->type = KFD_QUEUE_TYPE_SDMA_XGMI; 2408c2ecf20Sopenharmony_ci else 2418c2ecf20Sopenharmony_ci return -ENOTSUPP; 2428c2ecf20Sopenharmony_ci 2438c2ecf20Sopenharmony_ci if (args->queue_type == KFD_IOC_QUEUE_TYPE_COMPUTE_AQL) 2448c2ecf20Sopenharmony_ci q_properties->format = KFD_QUEUE_FORMAT_AQL; 2458c2ecf20Sopenharmony_ci else 2468c2ecf20Sopenharmony_ci q_properties->format = KFD_QUEUE_FORMAT_PM4; 2478c2ecf20Sopenharmony_ci 2488c2ecf20Sopenharmony_ci pr_debug("Queue Percentage: %d, %d\n", 2498c2ecf20Sopenharmony_ci q_properties->queue_percent, args->queue_percentage); 2508c2ecf20Sopenharmony_ci 2518c2ecf20Sopenharmony_ci pr_debug("Queue Priority: %d, %d\n", 2528c2ecf20Sopenharmony_ci q_properties->priority, args->queue_priority); 2538c2ecf20Sopenharmony_ci 2548c2ecf20Sopenharmony_ci pr_debug("Queue Address: 0x%llX, 0x%llX\n", 2558c2ecf20Sopenharmony_ci q_properties->queue_address, args->ring_base_address); 2568c2ecf20Sopenharmony_ci 2578c2ecf20Sopenharmony_ci pr_debug("Queue Size: 0x%llX, %u\n", 2588c2ecf20Sopenharmony_ci q_properties->queue_size, args->ring_size); 2598c2ecf20Sopenharmony_ci 2608c2ecf20Sopenharmony_ci pr_debug("Queue r/w Pointers: %px, %px\n", 2618c2ecf20Sopenharmony_ci q_properties->read_ptr, 2628c2ecf20Sopenharmony_ci q_properties->write_ptr); 2638c2ecf20Sopenharmony_ci 2648c2ecf20Sopenharmony_ci pr_debug("Queue Format: %d\n", q_properties->format); 2658c2ecf20Sopenharmony_ci 2668c2ecf20Sopenharmony_ci pr_debug("Queue EOP: 0x%llX\n", q_properties->eop_ring_buffer_address); 2678c2ecf20Sopenharmony_ci 2688c2ecf20Sopenharmony_ci pr_debug("Queue CTX save area: 0x%llX\n", 2698c2ecf20Sopenharmony_ci q_properties->ctx_save_restore_area_address); 2708c2ecf20Sopenharmony_ci 2718c2ecf20Sopenharmony_ci return 0; 2728c2ecf20Sopenharmony_ci} 2738c2ecf20Sopenharmony_ci 2748c2ecf20Sopenharmony_cistatic int kfd_ioctl_create_queue(struct file *filep, struct kfd_process *p, 2758c2ecf20Sopenharmony_ci void *data) 2768c2ecf20Sopenharmony_ci{ 2778c2ecf20Sopenharmony_ci struct kfd_ioctl_create_queue_args *args = data; 2788c2ecf20Sopenharmony_ci struct kfd_dev *dev; 2798c2ecf20Sopenharmony_ci int err = 0; 2808c2ecf20Sopenharmony_ci unsigned int queue_id; 2818c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 2828c2ecf20Sopenharmony_ci struct queue_properties q_properties; 2838c2ecf20Sopenharmony_ci uint32_t doorbell_offset_in_process = 0; 2848c2ecf20Sopenharmony_ci 2858c2ecf20Sopenharmony_ci memset(&q_properties, 0, sizeof(struct queue_properties)); 2868c2ecf20Sopenharmony_ci 2878c2ecf20Sopenharmony_ci pr_debug("Creating queue ioctl\n"); 2888c2ecf20Sopenharmony_ci 2898c2ecf20Sopenharmony_ci err = set_queue_properties_from_user(&q_properties, args); 2908c2ecf20Sopenharmony_ci if (err) 2918c2ecf20Sopenharmony_ci return err; 2928c2ecf20Sopenharmony_ci 2938c2ecf20Sopenharmony_ci pr_debug("Looking for gpu id 0x%x\n", args->gpu_id); 2948c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 2958c2ecf20Sopenharmony_ci if (!dev) { 2968c2ecf20Sopenharmony_ci pr_debug("Could not find gpu id 0x%x\n", args->gpu_id); 2978c2ecf20Sopenharmony_ci return -EINVAL; 2988c2ecf20Sopenharmony_ci } 2998c2ecf20Sopenharmony_ci 3008c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 3018c2ecf20Sopenharmony_ci 3028c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(dev, p); 3038c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 3048c2ecf20Sopenharmony_ci err = -ESRCH; 3058c2ecf20Sopenharmony_ci goto err_bind_process; 3068c2ecf20Sopenharmony_ci } 3078c2ecf20Sopenharmony_ci 3088c2ecf20Sopenharmony_ci pr_debug("Creating queue for PASID 0x%x on gpu 0x%x\n", 3098c2ecf20Sopenharmony_ci p->pasid, 3108c2ecf20Sopenharmony_ci dev->id); 3118c2ecf20Sopenharmony_ci 3128c2ecf20Sopenharmony_ci err = pqm_create_queue(&p->pqm, dev, filep, &q_properties, &queue_id, 3138c2ecf20Sopenharmony_ci &doorbell_offset_in_process); 3148c2ecf20Sopenharmony_ci if (err != 0) 3158c2ecf20Sopenharmony_ci goto err_create_queue; 3168c2ecf20Sopenharmony_ci 3178c2ecf20Sopenharmony_ci args->queue_id = queue_id; 3188c2ecf20Sopenharmony_ci 3198c2ecf20Sopenharmony_ci 3208c2ecf20Sopenharmony_ci /* Return gpu_id as doorbell offset for mmap usage */ 3218c2ecf20Sopenharmony_ci args->doorbell_offset = KFD_MMAP_TYPE_DOORBELL; 3228c2ecf20Sopenharmony_ci args->doorbell_offset |= KFD_MMAP_GPU_ID(args->gpu_id); 3238c2ecf20Sopenharmony_ci if (KFD_IS_SOC15(dev->device_info->asic_family)) 3248c2ecf20Sopenharmony_ci /* On SOC15 ASICs, include the doorbell offset within the 3258c2ecf20Sopenharmony_ci * process doorbell frame, which is 2 pages. 3268c2ecf20Sopenharmony_ci */ 3278c2ecf20Sopenharmony_ci args->doorbell_offset |= doorbell_offset_in_process; 3288c2ecf20Sopenharmony_ci 3298c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 3308c2ecf20Sopenharmony_ci 3318c2ecf20Sopenharmony_ci pr_debug("Queue id %d was created successfully\n", args->queue_id); 3328c2ecf20Sopenharmony_ci 3338c2ecf20Sopenharmony_ci pr_debug("Ring buffer address == 0x%016llX\n", 3348c2ecf20Sopenharmony_ci args->ring_base_address); 3358c2ecf20Sopenharmony_ci 3368c2ecf20Sopenharmony_ci pr_debug("Read ptr address == 0x%016llX\n", 3378c2ecf20Sopenharmony_ci args->read_pointer_address); 3388c2ecf20Sopenharmony_ci 3398c2ecf20Sopenharmony_ci pr_debug("Write ptr address == 0x%016llX\n", 3408c2ecf20Sopenharmony_ci args->write_pointer_address); 3418c2ecf20Sopenharmony_ci 3428c2ecf20Sopenharmony_ci return 0; 3438c2ecf20Sopenharmony_ci 3448c2ecf20Sopenharmony_cierr_create_queue: 3458c2ecf20Sopenharmony_cierr_bind_process: 3468c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 3478c2ecf20Sopenharmony_ci return err; 3488c2ecf20Sopenharmony_ci} 3498c2ecf20Sopenharmony_ci 3508c2ecf20Sopenharmony_cistatic int kfd_ioctl_destroy_queue(struct file *filp, struct kfd_process *p, 3518c2ecf20Sopenharmony_ci void *data) 3528c2ecf20Sopenharmony_ci{ 3538c2ecf20Sopenharmony_ci int retval; 3548c2ecf20Sopenharmony_ci struct kfd_ioctl_destroy_queue_args *args = data; 3558c2ecf20Sopenharmony_ci 3568c2ecf20Sopenharmony_ci pr_debug("Destroying queue id %d for pasid 0x%x\n", 3578c2ecf20Sopenharmony_ci args->queue_id, 3588c2ecf20Sopenharmony_ci p->pasid); 3598c2ecf20Sopenharmony_ci 3608c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 3618c2ecf20Sopenharmony_ci 3628c2ecf20Sopenharmony_ci retval = pqm_destroy_queue(&p->pqm, args->queue_id); 3638c2ecf20Sopenharmony_ci 3648c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 3658c2ecf20Sopenharmony_ci return retval; 3668c2ecf20Sopenharmony_ci} 3678c2ecf20Sopenharmony_ci 3688c2ecf20Sopenharmony_cistatic int kfd_ioctl_update_queue(struct file *filp, struct kfd_process *p, 3698c2ecf20Sopenharmony_ci void *data) 3708c2ecf20Sopenharmony_ci{ 3718c2ecf20Sopenharmony_ci int retval; 3728c2ecf20Sopenharmony_ci struct kfd_ioctl_update_queue_args *args = data; 3738c2ecf20Sopenharmony_ci struct queue_properties properties; 3748c2ecf20Sopenharmony_ci 3758c2ecf20Sopenharmony_ci if (args->queue_percentage > KFD_MAX_QUEUE_PERCENTAGE) { 3768c2ecf20Sopenharmony_ci pr_err("Queue percentage must be between 0 to KFD_MAX_QUEUE_PERCENTAGE\n"); 3778c2ecf20Sopenharmony_ci return -EINVAL; 3788c2ecf20Sopenharmony_ci } 3798c2ecf20Sopenharmony_ci 3808c2ecf20Sopenharmony_ci if (args->queue_priority > KFD_MAX_QUEUE_PRIORITY) { 3818c2ecf20Sopenharmony_ci pr_err("Queue priority must be between 0 to KFD_MAX_QUEUE_PRIORITY\n"); 3828c2ecf20Sopenharmony_ci return -EINVAL; 3838c2ecf20Sopenharmony_ci } 3848c2ecf20Sopenharmony_ci 3858c2ecf20Sopenharmony_ci if ((args->ring_base_address) && 3868c2ecf20Sopenharmony_ci (!access_ok((const void __user *) args->ring_base_address, 3878c2ecf20Sopenharmony_ci sizeof(uint64_t)))) { 3888c2ecf20Sopenharmony_ci pr_err("Can't access ring base address\n"); 3898c2ecf20Sopenharmony_ci return -EFAULT; 3908c2ecf20Sopenharmony_ci } 3918c2ecf20Sopenharmony_ci 3928c2ecf20Sopenharmony_ci if (!is_power_of_2(args->ring_size) && (args->ring_size != 0)) { 3938c2ecf20Sopenharmony_ci pr_err("Ring size must be a power of 2 or 0\n"); 3948c2ecf20Sopenharmony_ci return -EINVAL; 3958c2ecf20Sopenharmony_ci } 3968c2ecf20Sopenharmony_ci 3978c2ecf20Sopenharmony_ci properties.queue_address = args->ring_base_address; 3988c2ecf20Sopenharmony_ci properties.queue_size = args->ring_size; 3998c2ecf20Sopenharmony_ci properties.queue_percent = args->queue_percentage; 4008c2ecf20Sopenharmony_ci properties.priority = args->queue_priority; 4018c2ecf20Sopenharmony_ci 4028c2ecf20Sopenharmony_ci pr_debug("Updating queue id %d for pasid 0x%x\n", 4038c2ecf20Sopenharmony_ci args->queue_id, p->pasid); 4048c2ecf20Sopenharmony_ci 4058c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 4068c2ecf20Sopenharmony_ci 4078c2ecf20Sopenharmony_ci retval = pqm_update_queue(&p->pqm, args->queue_id, &properties); 4088c2ecf20Sopenharmony_ci 4098c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 4108c2ecf20Sopenharmony_ci 4118c2ecf20Sopenharmony_ci return retval; 4128c2ecf20Sopenharmony_ci} 4138c2ecf20Sopenharmony_ci 4148c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_cu_mask(struct file *filp, struct kfd_process *p, 4158c2ecf20Sopenharmony_ci void *data) 4168c2ecf20Sopenharmony_ci{ 4178c2ecf20Sopenharmony_ci int retval; 4188c2ecf20Sopenharmony_ci const int max_num_cus = 1024; 4198c2ecf20Sopenharmony_ci struct kfd_ioctl_set_cu_mask_args *args = data; 4208c2ecf20Sopenharmony_ci struct queue_properties properties; 4218c2ecf20Sopenharmony_ci uint32_t __user *cu_mask_ptr = (uint32_t __user *)args->cu_mask_ptr; 4228c2ecf20Sopenharmony_ci size_t cu_mask_size = sizeof(uint32_t) * (args->num_cu_mask / 32); 4238c2ecf20Sopenharmony_ci 4248c2ecf20Sopenharmony_ci if ((args->num_cu_mask % 32) != 0) { 4258c2ecf20Sopenharmony_ci pr_debug("num_cu_mask 0x%x must be a multiple of 32", 4268c2ecf20Sopenharmony_ci args->num_cu_mask); 4278c2ecf20Sopenharmony_ci return -EINVAL; 4288c2ecf20Sopenharmony_ci } 4298c2ecf20Sopenharmony_ci 4308c2ecf20Sopenharmony_ci properties.cu_mask_count = args->num_cu_mask; 4318c2ecf20Sopenharmony_ci if (properties.cu_mask_count == 0) { 4328c2ecf20Sopenharmony_ci pr_debug("CU mask cannot be 0"); 4338c2ecf20Sopenharmony_ci return -EINVAL; 4348c2ecf20Sopenharmony_ci } 4358c2ecf20Sopenharmony_ci 4368c2ecf20Sopenharmony_ci /* To prevent an unreasonably large CU mask size, set an arbitrary 4378c2ecf20Sopenharmony_ci * limit of max_num_cus bits. We can then just drop any CU mask bits 4388c2ecf20Sopenharmony_ci * past max_num_cus bits and just use the first max_num_cus bits. 4398c2ecf20Sopenharmony_ci */ 4408c2ecf20Sopenharmony_ci if (properties.cu_mask_count > max_num_cus) { 4418c2ecf20Sopenharmony_ci pr_debug("CU mask cannot be greater than 1024 bits"); 4428c2ecf20Sopenharmony_ci properties.cu_mask_count = max_num_cus; 4438c2ecf20Sopenharmony_ci cu_mask_size = sizeof(uint32_t) * (max_num_cus/32); 4448c2ecf20Sopenharmony_ci } 4458c2ecf20Sopenharmony_ci 4468c2ecf20Sopenharmony_ci properties.cu_mask = kzalloc(cu_mask_size, GFP_KERNEL); 4478c2ecf20Sopenharmony_ci if (!properties.cu_mask) 4488c2ecf20Sopenharmony_ci return -ENOMEM; 4498c2ecf20Sopenharmony_ci 4508c2ecf20Sopenharmony_ci retval = copy_from_user(properties.cu_mask, cu_mask_ptr, cu_mask_size); 4518c2ecf20Sopenharmony_ci if (retval) { 4528c2ecf20Sopenharmony_ci pr_debug("Could not copy CU mask from userspace"); 4538c2ecf20Sopenharmony_ci kfree(properties.cu_mask); 4548c2ecf20Sopenharmony_ci return -EFAULT; 4558c2ecf20Sopenharmony_ci } 4568c2ecf20Sopenharmony_ci 4578c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 4588c2ecf20Sopenharmony_ci 4598c2ecf20Sopenharmony_ci retval = pqm_set_cu_mask(&p->pqm, args->queue_id, &properties); 4608c2ecf20Sopenharmony_ci 4618c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 4628c2ecf20Sopenharmony_ci 4638c2ecf20Sopenharmony_ci if (retval) 4648c2ecf20Sopenharmony_ci kfree(properties.cu_mask); 4658c2ecf20Sopenharmony_ci 4668c2ecf20Sopenharmony_ci return retval; 4678c2ecf20Sopenharmony_ci} 4688c2ecf20Sopenharmony_ci 4698c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_queue_wave_state(struct file *filep, 4708c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 4718c2ecf20Sopenharmony_ci{ 4728c2ecf20Sopenharmony_ci struct kfd_ioctl_get_queue_wave_state_args *args = data; 4738c2ecf20Sopenharmony_ci int r; 4748c2ecf20Sopenharmony_ci 4758c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 4768c2ecf20Sopenharmony_ci 4778c2ecf20Sopenharmony_ci r = pqm_get_wave_state(&p->pqm, args->queue_id, 4788c2ecf20Sopenharmony_ci (void __user *)args->ctl_stack_address, 4798c2ecf20Sopenharmony_ci &args->ctl_stack_used_size, 4808c2ecf20Sopenharmony_ci &args->save_area_used_size); 4818c2ecf20Sopenharmony_ci 4828c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 4838c2ecf20Sopenharmony_ci 4848c2ecf20Sopenharmony_ci return r; 4858c2ecf20Sopenharmony_ci} 4868c2ecf20Sopenharmony_ci 4878c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_memory_policy(struct file *filep, 4888c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 4898c2ecf20Sopenharmony_ci{ 4908c2ecf20Sopenharmony_ci struct kfd_ioctl_set_memory_policy_args *args = data; 4918c2ecf20Sopenharmony_ci struct kfd_dev *dev; 4928c2ecf20Sopenharmony_ci int err = 0; 4938c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 4948c2ecf20Sopenharmony_ci enum cache_policy default_policy, alternate_policy; 4958c2ecf20Sopenharmony_ci 4968c2ecf20Sopenharmony_ci if (args->default_policy != KFD_IOC_CACHE_POLICY_COHERENT 4978c2ecf20Sopenharmony_ci && args->default_policy != KFD_IOC_CACHE_POLICY_NONCOHERENT) { 4988c2ecf20Sopenharmony_ci return -EINVAL; 4998c2ecf20Sopenharmony_ci } 5008c2ecf20Sopenharmony_ci 5018c2ecf20Sopenharmony_ci if (args->alternate_policy != KFD_IOC_CACHE_POLICY_COHERENT 5028c2ecf20Sopenharmony_ci && args->alternate_policy != KFD_IOC_CACHE_POLICY_NONCOHERENT) { 5038c2ecf20Sopenharmony_ci return -EINVAL; 5048c2ecf20Sopenharmony_ci } 5058c2ecf20Sopenharmony_ci 5068c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 5078c2ecf20Sopenharmony_ci if (!dev) 5088c2ecf20Sopenharmony_ci return -EINVAL; 5098c2ecf20Sopenharmony_ci 5108c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 5118c2ecf20Sopenharmony_ci 5128c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(dev, p); 5138c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 5148c2ecf20Sopenharmony_ci err = -ESRCH; 5158c2ecf20Sopenharmony_ci goto out; 5168c2ecf20Sopenharmony_ci } 5178c2ecf20Sopenharmony_ci 5188c2ecf20Sopenharmony_ci default_policy = (args->default_policy == KFD_IOC_CACHE_POLICY_COHERENT) 5198c2ecf20Sopenharmony_ci ? cache_policy_coherent : cache_policy_noncoherent; 5208c2ecf20Sopenharmony_ci 5218c2ecf20Sopenharmony_ci alternate_policy = 5228c2ecf20Sopenharmony_ci (args->alternate_policy == KFD_IOC_CACHE_POLICY_COHERENT) 5238c2ecf20Sopenharmony_ci ? cache_policy_coherent : cache_policy_noncoherent; 5248c2ecf20Sopenharmony_ci 5258c2ecf20Sopenharmony_ci if (!dev->dqm->ops.set_cache_memory_policy(dev->dqm, 5268c2ecf20Sopenharmony_ci &pdd->qpd, 5278c2ecf20Sopenharmony_ci default_policy, 5288c2ecf20Sopenharmony_ci alternate_policy, 5298c2ecf20Sopenharmony_ci (void __user *)args->alternate_aperture_base, 5308c2ecf20Sopenharmony_ci args->alternate_aperture_size)) 5318c2ecf20Sopenharmony_ci err = -EINVAL; 5328c2ecf20Sopenharmony_ci 5338c2ecf20Sopenharmony_ciout: 5348c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 5358c2ecf20Sopenharmony_ci 5368c2ecf20Sopenharmony_ci return err; 5378c2ecf20Sopenharmony_ci} 5388c2ecf20Sopenharmony_ci 5398c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_trap_handler(struct file *filep, 5408c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 5418c2ecf20Sopenharmony_ci{ 5428c2ecf20Sopenharmony_ci struct kfd_ioctl_set_trap_handler_args *args = data; 5438c2ecf20Sopenharmony_ci struct kfd_dev *dev; 5448c2ecf20Sopenharmony_ci int err = 0; 5458c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 5468c2ecf20Sopenharmony_ci 5478c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 5488c2ecf20Sopenharmony_ci if (!dev) 5498c2ecf20Sopenharmony_ci return -EINVAL; 5508c2ecf20Sopenharmony_ci 5518c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 5528c2ecf20Sopenharmony_ci 5538c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(dev, p); 5548c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 5558c2ecf20Sopenharmony_ci err = -ESRCH; 5568c2ecf20Sopenharmony_ci goto out; 5578c2ecf20Sopenharmony_ci } 5588c2ecf20Sopenharmony_ci 5598c2ecf20Sopenharmony_ci if (dev->dqm->ops.set_trap_handler(dev->dqm, 5608c2ecf20Sopenharmony_ci &pdd->qpd, 5618c2ecf20Sopenharmony_ci args->tba_addr, 5628c2ecf20Sopenharmony_ci args->tma_addr)) 5638c2ecf20Sopenharmony_ci err = -EINVAL; 5648c2ecf20Sopenharmony_ci 5658c2ecf20Sopenharmony_ciout: 5668c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 5678c2ecf20Sopenharmony_ci 5688c2ecf20Sopenharmony_ci return err; 5698c2ecf20Sopenharmony_ci} 5708c2ecf20Sopenharmony_ci 5718c2ecf20Sopenharmony_cistatic int kfd_ioctl_dbg_register(struct file *filep, 5728c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 5738c2ecf20Sopenharmony_ci{ 5748c2ecf20Sopenharmony_ci struct kfd_ioctl_dbg_register_args *args = data; 5758c2ecf20Sopenharmony_ci struct kfd_dev *dev; 5768c2ecf20Sopenharmony_ci struct kfd_dbgmgr *dbgmgr_ptr; 5778c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 5788c2ecf20Sopenharmony_ci bool create_ok; 5798c2ecf20Sopenharmony_ci long status = 0; 5808c2ecf20Sopenharmony_ci 5818c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 5828c2ecf20Sopenharmony_ci if (!dev) 5838c2ecf20Sopenharmony_ci return -EINVAL; 5848c2ecf20Sopenharmony_ci 5858c2ecf20Sopenharmony_ci if (dev->device_info->asic_family == CHIP_CARRIZO) { 5868c2ecf20Sopenharmony_ci pr_debug("kfd_ioctl_dbg_register not supported on CZ\n"); 5878c2ecf20Sopenharmony_ci return -EINVAL; 5888c2ecf20Sopenharmony_ci } 5898c2ecf20Sopenharmony_ci 5908c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 5918c2ecf20Sopenharmony_ci mutex_lock(kfd_get_dbgmgr_mutex()); 5928c2ecf20Sopenharmony_ci 5938c2ecf20Sopenharmony_ci /* 5948c2ecf20Sopenharmony_ci * make sure that we have pdd, if this the first queue created for 5958c2ecf20Sopenharmony_ci * this process 5968c2ecf20Sopenharmony_ci */ 5978c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(dev, p); 5988c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 5998c2ecf20Sopenharmony_ci status = PTR_ERR(pdd); 6008c2ecf20Sopenharmony_ci goto out; 6018c2ecf20Sopenharmony_ci } 6028c2ecf20Sopenharmony_ci 6038c2ecf20Sopenharmony_ci if (!dev->dbgmgr) { 6048c2ecf20Sopenharmony_ci /* In case of a legal call, we have no dbgmgr yet */ 6058c2ecf20Sopenharmony_ci create_ok = kfd_dbgmgr_create(&dbgmgr_ptr, dev); 6068c2ecf20Sopenharmony_ci if (create_ok) { 6078c2ecf20Sopenharmony_ci status = kfd_dbgmgr_register(dbgmgr_ptr, p); 6088c2ecf20Sopenharmony_ci if (status != 0) 6098c2ecf20Sopenharmony_ci kfd_dbgmgr_destroy(dbgmgr_ptr); 6108c2ecf20Sopenharmony_ci else 6118c2ecf20Sopenharmony_ci dev->dbgmgr = dbgmgr_ptr; 6128c2ecf20Sopenharmony_ci } 6138c2ecf20Sopenharmony_ci } else { 6148c2ecf20Sopenharmony_ci pr_debug("debugger already registered\n"); 6158c2ecf20Sopenharmony_ci status = -EINVAL; 6168c2ecf20Sopenharmony_ci } 6178c2ecf20Sopenharmony_ci 6188c2ecf20Sopenharmony_ciout: 6198c2ecf20Sopenharmony_ci mutex_unlock(kfd_get_dbgmgr_mutex()); 6208c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 6218c2ecf20Sopenharmony_ci 6228c2ecf20Sopenharmony_ci return status; 6238c2ecf20Sopenharmony_ci} 6248c2ecf20Sopenharmony_ci 6258c2ecf20Sopenharmony_cistatic int kfd_ioctl_dbg_unregister(struct file *filep, 6268c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 6278c2ecf20Sopenharmony_ci{ 6288c2ecf20Sopenharmony_ci struct kfd_ioctl_dbg_unregister_args *args = data; 6298c2ecf20Sopenharmony_ci struct kfd_dev *dev; 6308c2ecf20Sopenharmony_ci long status; 6318c2ecf20Sopenharmony_ci 6328c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 6338c2ecf20Sopenharmony_ci if (!dev || !dev->dbgmgr) 6348c2ecf20Sopenharmony_ci return -EINVAL; 6358c2ecf20Sopenharmony_ci 6368c2ecf20Sopenharmony_ci if (dev->device_info->asic_family == CHIP_CARRIZO) { 6378c2ecf20Sopenharmony_ci pr_debug("kfd_ioctl_dbg_unregister not supported on CZ\n"); 6388c2ecf20Sopenharmony_ci return -EINVAL; 6398c2ecf20Sopenharmony_ci } 6408c2ecf20Sopenharmony_ci 6418c2ecf20Sopenharmony_ci mutex_lock(kfd_get_dbgmgr_mutex()); 6428c2ecf20Sopenharmony_ci 6438c2ecf20Sopenharmony_ci status = kfd_dbgmgr_unregister(dev->dbgmgr, p); 6448c2ecf20Sopenharmony_ci if (!status) { 6458c2ecf20Sopenharmony_ci kfd_dbgmgr_destroy(dev->dbgmgr); 6468c2ecf20Sopenharmony_ci dev->dbgmgr = NULL; 6478c2ecf20Sopenharmony_ci } 6488c2ecf20Sopenharmony_ci 6498c2ecf20Sopenharmony_ci mutex_unlock(kfd_get_dbgmgr_mutex()); 6508c2ecf20Sopenharmony_ci 6518c2ecf20Sopenharmony_ci return status; 6528c2ecf20Sopenharmony_ci} 6538c2ecf20Sopenharmony_ci 6548c2ecf20Sopenharmony_ci/* 6558c2ecf20Sopenharmony_ci * Parse and generate variable size data structure for address watch. 6568c2ecf20Sopenharmony_ci * Total size of the buffer and # watch points is limited in order 6578c2ecf20Sopenharmony_ci * to prevent kernel abuse. (no bearing to the much smaller HW limitation 6588c2ecf20Sopenharmony_ci * which is enforced by dbgdev module) 6598c2ecf20Sopenharmony_ci * please also note that the watch address itself are not "copied from user", 6608c2ecf20Sopenharmony_ci * since it be set into the HW in user mode values. 6618c2ecf20Sopenharmony_ci * 6628c2ecf20Sopenharmony_ci */ 6638c2ecf20Sopenharmony_cistatic int kfd_ioctl_dbg_address_watch(struct file *filep, 6648c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 6658c2ecf20Sopenharmony_ci{ 6668c2ecf20Sopenharmony_ci struct kfd_ioctl_dbg_address_watch_args *args = data; 6678c2ecf20Sopenharmony_ci struct kfd_dev *dev; 6688c2ecf20Sopenharmony_ci struct dbg_address_watch_info aw_info; 6698c2ecf20Sopenharmony_ci unsigned char *args_buff; 6708c2ecf20Sopenharmony_ci long status; 6718c2ecf20Sopenharmony_ci void __user *cmd_from_user; 6728c2ecf20Sopenharmony_ci uint64_t watch_mask_value = 0; 6738c2ecf20Sopenharmony_ci unsigned int args_idx = 0; 6748c2ecf20Sopenharmony_ci 6758c2ecf20Sopenharmony_ci memset((void *) &aw_info, 0, sizeof(struct dbg_address_watch_info)); 6768c2ecf20Sopenharmony_ci 6778c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 6788c2ecf20Sopenharmony_ci if (!dev) 6798c2ecf20Sopenharmony_ci return -EINVAL; 6808c2ecf20Sopenharmony_ci 6818c2ecf20Sopenharmony_ci if (dev->device_info->asic_family == CHIP_CARRIZO) { 6828c2ecf20Sopenharmony_ci pr_debug("kfd_ioctl_dbg_wave_control not supported on CZ\n"); 6838c2ecf20Sopenharmony_ci return -EINVAL; 6848c2ecf20Sopenharmony_ci } 6858c2ecf20Sopenharmony_ci 6868c2ecf20Sopenharmony_ci cmd_from_user = (void __user *) args->content_ptr; 6878c2ecf20Sopenharmony_ci 6888c2ecf20Sopenharmony_ci /* Validate arguments */ 6898c2ecf20Sopenharmony_ci 6908c2ecf20Sopenharmony_ci if ((args->buf_size_in_bytes > MAX_ALLOWED_AW_BUFF_SIZE) || 6918c2ecf20Sopenharmony_ci (args->buf_size_in_bytes <= sizeof(*args) + sizeof(int) * 2) || 6928c2ecf20Sopenharmony_ci (cmd_from_user == NULL)) 6938c2ecf20Sopenharmony_ci return -EINVAL; 6948c2ecf20Sopenharmony_ci 6958c2ecf20Sopenharmony_ci /* this is the actual buffer to work with */ 6968c2ecf20Sopenharmony_ci args_buff = memdup_user(cmd_from_user, 6978c2ecf20Sopenharmony_ci args->buf_size_in_bytes - sizeof(*args)); 6988c2ecf20Sopenharmony_ci if (IS_ERR(args_buff)) 6998c2ecf20Sopenharmony_ci return PTR_ERR(args_buff); 7008c2ecf20Sopenharmony_ci 7018c2ecf20Sopenharmony_ci aw_info.process = p; 7028c2ecf20Sopenharmony_ci 7038c2ecf20Sopenharmony_ci aw_info.num_watch_points = *((uint32_t *)(&args_buff[args_idx])); 7048c2ecf20Sopenharmony_ci args_idx += sizeof(aw_info.num_watch_points); 7058c2ecf20Sopenharmony_ci 7068c2ecf20Sopenharmony_ci aw_info.watch_mode = (enum HSA_DBG_WATCH_MODE *) &args_buff[args_idx]; 7078c2ecf20Sopenharmony_ci args_idx += sizeof(enum HSA_DBG_WATCH_MODE) * aw_info.num_watch_points; 7088c2ecf20Sopenharmony_ci 7098c2ecf20Sopenharmony_ci /* 7108c2ecf20Sopenharmony_ci * set watch address base pointer to point on the array base 7118c2ecf20Sopenharmony_ci * within args_buff 7128c2ecf20Sopenharmony_ci */ 7138c2ecf20Sopenharmony_ci aw_info.watch_address = (uint64_t *) &args_buff[args_idx]; 7148c2ecf20Sopenharmony_ci 7158c2ecf20Sopenharmony_ci /* skip over the addresses buffer */ 7168c2ecf20Sopenharmony_ci args_idx += sizeof(aw_info.watch_address) * aw_info.num_watch_points; 7178c2ecf20Sopenharmony_ci 7188c2ecf20Sopenharmony_ci if (args_idx >= args->buf_size_in_bytes - sizeof(*args)) { 7198c2ecf20Sopenharmony_ci status = -EINVAL; 7208c2ecf20Sopenharmony_ci goto out; 7218c2ecf20Sopenharmony_ci } 7228c2ecf20Sopenharmony_ci 7238c2ecf20Sopenharmony_ci watch_mask_value = (uint64_t) args_buff[args_idx]; 7248c2ecf20Sopenharmony_ci 7258c2ecf20Sopenharmony_ci if (watch_mask_value > 0) { 7268c2ecf20Sopenharmony_ci /* 7278c2ecf20Sopenharmony_ci * There is an array of masks. 7288c2ecf20Sopenharmony_ci * set watch mask base pointer to point on the array base 7298c2ecf20Sopenharmony_ci * within args_buff 7308c2ecf20Sopenharmony_ci */ 7318c2ecf20Sopenharmony_ci aw_info.watch_mask = (uint64_t *) &args_buff[args_idx]; 7328c2ecf20Sopenharmony_ci 7338c2ecf20Sopenharmony_ci /* skip over the masks buffer */ 7348c2ecf20Sopenharmony_ci args_idx += sizeof(aw_info.watch_mask) * 7358c2ecf20Sopenharmony_ci aw_info.num_watch_points; 7368c2ecf20Sopenharmony_ci } else { 7378c2ecf20Sopenharmony_ci /* just the NULL mask, set to NULL and skip over it */ 7388c2ecf20Sopenharmony_ci aw_info.watch_mask = NULL; 7398c2ecf20Sopenharmony_ci args_idx += sizeof(aw_info.watch_mask); 7408c2ecf20Sopenharmony_ci } 7418c2ecf20Sopenharmony_ci 7428c2ecf20Sopenharmony_ci if (args_idx >= args->buf_size_in_bytes - sizeof(args)) { 7438c2ecf20Sopenharmony_ci status = -EINVAL; 7448c2ecf20Sopenharmony_ci goto out; 7458c2ecf20Sopenharmony_ci } 7468c2ecf20Sopenharmony_ci 7478c2ecf20Sopenharmony_ci /* Currently HSA Event is not supported for DBG */ 7488c2ecf20Sopenharmony_ci aw_info.watch_event = NULL; 7498c2ecf20Sopenharmony_ci 7508c2ecf20Sopenharmony_ci mutex_lock(kfd_get_dbgmgr_mutex()); 7518c2ecf20Sopenharmony_ci 7528c2ecf20Sopenharmony_ci status = kfd_dbgmgr_address_watch(dev->dbgmgr, &aw_info); 7538c2ecf20Sopenharmony_ci 7548c2ecf20Sopenharmony_ci mutex_unlock(kfd_get_dbgmgr_mutex()); 7558c2ecf20Sopenharmony_ci 7568c2ecf20Sopenharmony_ciout: 7578c2ecf20Sopenharmony_ci kfree(args_buff); 7588c2ecf20Sopenharmony_ci 7598c2ecf20Sopenharmony_ci return status; 7608c2ecf20Sopenharmony_ci} 7618c2ecf20Sopenharmony_ci 7628c2ecf20Sopenharmony_ci/* Parse and generate fixed size data structure for wave control */ 7638c2ecf20Sopenharmony_cistatic int kfd_ioctl_dbg_wave_control(struct file *filep, 7648c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 7658c2ecf20Sopenharmony_ci{ 7668c2ecf20Sopenharmony_ci struct kfd_ioctl_dbg_wave_control_args *args = data; 7678c2ecf20Sopenharmony_ci struct kfd_dev *dev; 7688c2ecf20Sopenharmony_ci struct dbg_wave_control_info wac_info; 7698c2ecf20Sopenharmony_ci unsigned char *args_buff; 7708c2ecf20Sopenharmony_ci uint32_t computed_buff_size; 7718c2ecf20Sopenharmony_ci long status; 7728c2ecf20Sopenharmony_ci void __user *cmd_from_user; 7738c2ecf20Sopenharmony_ci unsigned int args_idx = 0; 7748c2ecf20Sopenharmony_ci 7758c2ecf20Sopenharmony_ci memset((void *) &wac_info, 0, sizeof(struct dbg_wave_control_info)); 7768c2ecf20Sopenharmony_ci 7778c2ecf20Sopenharmony_ci /* we use compact form, independent of the packing attribute value */ 7788c2ecf20Sopenharmony_ci computed_buff_size = sizeof(*args) + 7798c2ecf20Sopenharmony_ci sizeof(wac_info.mode) + 7808c2ecf20Sopenharmony_ci sizeof(wac_info.operand) + 7818c2ecf20Sopenharmony_ci sizeof(wac_info.dbgWave_msg.DbgWaveMsg) + 7828c2ecf20Sopenharmony_ci sizeof(wac_info.dbgWave_msg.MemoryVA) + 7838c2ecf20Sopenharmony_ci sizeof(wac_info.trapId); 7848c2ecf20Sopenharmony_ci 7858c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 7868c2ecf20Sopenharmony_ci if (!dev) 7878c2ecf20Sopenharmony_ci return -EINVAL; 7888c2ecf20Sopenharmony_ci 7898c2ecf20Sopenharmony_ci if (dev->device_info->asic_family == CHIP_CARRIZO) { 7908c2ecf20Sopenharmony_ci pr_debug("kfd_ioctl_dbg_wave_control not supported on CZ\n"); 7918c2ecf20Sopenharmony_ci return -EINVAL; 7928c2ecf20Sopenharmony_ci } 7938c2ecf20Sopenharmony_ci 7948c2ecf20Sopenharmony_ci /* input size must match the computed "compact" size */ 7958c2ecf20Sopenharmony_ci if (args->buf_size_in_bytes != computed_buff_size) { 7968c2ecf20Sopenharmony_ci pr_debug("size mismatch, computed : actual %u : %u\n", 7978c2ecf20Sopenharmony_ci args->buf_size_in_bytes, computed_buff_size); 7988c2ecf20Sopenharmony_ci return -EINVAL; 7998c2ecf20Sopenharmony_ci } 8008c2ecf20Sopenharmony_ci 8018c2ecf20Sopenharmony_ci cmd_from_user = (void __user *) args->content_ptr; 8028c2ecf20Sopenharmony_ci 8038c2ecf20Sopenharmony_ci if (cmd_from_user == NULL) 8048c2ecf20Sopenharmony_ci return -EINVAL; 8058c2ecf20Sopenharmony_ci 8068c2ecf20Sopenharmony_ci /* copy the entire buffer from user */ 8078c2ecf20Sopenharmony_ci 8088c2ecf20Sopenharmony_ci args_buff = memdup_user(cmd_from_user, 8098c2ecf20Sopenharmony_ci args->buf_size_in_bytes - sizeof(*args)); 8108c2ecf20Sopenharmony_ci if (IS_ERR(args_buff)) 8118c2ecf20Sopenharmony_ci return PTR_ERR(args_buff); 8128c2ecf20Sopenharmony_ci 8138c2ecf20Sopenharmony_ci /* move ptr to the start of the "pay-load" area */ 8148c2ecf20Sopenharmony_ci wac_info.process = p; 8158c2ecf20Sopenharmony_ci 8168c2ecf20Sopenharmony_ci wac_info.operand = *((enum HSA_DBG_WAVEOP *)(&args_buff[args_idx])); 8178c2ecf20Sopenharmony_ci args_idx += sizeof(wac_info.operand); 8188c2ecf20Sopenharmony_ci 8198c2ecf20Sopenharmony_ci wac_info.mode = *((enum HSA_DBG_WAVEMODE *)(&args_buff[args_idx])); 8208c2ecf20Sopenharmony_ci args_idx += sizeof(wac_info.mode); 8218c2ecf20Sopenharmony_ci 8228c2ecf20Sopenharmony_ci wac_info.trapId = *((uint32_t *)(&args_buff[args_idx])); 8238c2ecf20Sopenharmony_ci args_idx += sizeof(wac_info.trapId); 8248c2ecf20Sopenharmony_ci 8258c2ecf20Sopenharmony_ci wac_info.dbgWave_msg.DbgWaveMsg.WaveMsgInfoGen2.Value = 8268c2ecf20Sopenharmony_ci *((uint32_t *)(&args_buff[args_idx])); 8278c2ecf20Sopenharmony_ci wac_info.dbgWave_msg.MemoryVA = NULL; 8288c2ecf20Sopenharmony_ci 8298c2ecf20Sopenharmony_ci mutex_lock(kfd_get_dbgmgr_mutex()); 8308c2ecf20Sopenharmony_ci 8318c2ecf20Sopenharmony_ci pr_debug("Calling dbg manager process %p, operand %u, mode %u, trapId %u, message %u\n", 8328c2ecf20Sopenharmony_ci wac_info.process, wac_info.operand, 8338c2ecf20Sopenharmony_ci wac_info.mode, wac_info.trapId, 8348c2ecf20Sopenharmony_ci wac_info.dbgWave_msg.DbgWaveMsg.WaveMsgInfoGen2.Value); 8358c2ecf20Sopenharmony_ci 8368c2ecf20Sopenharmony_ci status = kfd_dbgmgr_wave_control(dev->dbgmgr, &wac_info); 8378c2ecf20Sopenharmony_ci 8388c2ecf20Sopenharmony_ci pr_debug("Returned status of dbg manager is %ld\n", status); 8398c2ecf20Sopenharmony_ci 8408c2ecf20Sopenharmony_ci mutex_unlock(kfd_get_dbgmgr_mutex()); 8418c2ecf20Sopenharmony_ci 8428c2ecf20Sopenharmony_ci kfree(args_buff); 8438c2ecf20Sopenharmony_ci 8448c2ecf20Sopenharmony_ci return status; 8458c2ecf20Sopenharmony_ci} 8468c2ecf20Sopenharmony_ci 8478c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_clock_counters(struct file *filep, 8488c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 8498c2ecf20Sopenharmony_ci{ 8508c2ecf20Sopenharmony_ci struct kfd_ioctl_get_clock_counters_args *args = data; 8518c2ecf20Sopenharmony_ci struct kfd_dev *dev; 8528c2ecf20Sopenharmony_ci 8538c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 8548c2ecf20Sopenharmony_ci if (dev) 8558c2ecf20Sopenharmony_ci /* Reading GPU clock counter from KGD */ 8568c2ecf20Sopenharmony_ci args->gpu_clock_counter = amdgpu_amdkfd_get_gpu_clock_counter(dev->kgd); 8578c2ecf20Sopenharmony_ci else 8588c2ecf20Sopenharmony_ci /* Node without GPU resource */ 8598c2ecf20Sopenharmony_ci args->gpu_clock_counter = 0; 8608c2ecf20Sopenharmony_ci 8618c2ecf20Sopenharmony_ci /* No access to rdtsc. Using raw monotonic time */ 8628c2ecf20Sopenharmony_ci args->cpu_clock_counter = ktime_get_raw_ns(); 8638c2ecf20Sopenharmony_ci args->system_clock_counter = ktime_get_boottime_ns(); 8648c2ecf20Sopenharmony_ci 8658c2ecf20Sopenharmony_ci /* Since the counter is in nano-seconds we use 1GHz frequency */ 8668c2ecf20Sopenharmony_ci args->system_clock_freq = 1000000000; 8678c2ecf20Sopenharmony_ci 8688c2ecf20Sopenharmony_ci return 0; 8698c2ecf20Sopenharmony_ci} 8708c2ecf20Sopenharmony_ci 8718c2ecf20Sopenharmony_ci 8728c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_process_apertures(struct file *filp, 8738c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 8748c2ecf20Sopenharmony_ci{ 8758c2ecf20Sopenharmony_ci struct kfd_ioctl_get_process_apertures_args *args = data; 8768c2ecf20Sopenharmony_ci struct kfd_process_device_apertures *pAperture; 8778c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 8788c2ecf20Sopenharmony_ci 8798c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "get apertures for PASID 0x%x", p->pasid); 8808c2ecf20Sopenharmony_ci 8818c2ecf20Sopenharmony_ci args->num_of_nodes = 0; 8828c2ecf20Sopenharmony_ci 8838c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 8848c2ecf20Sopenharmony_ci 8858c2ecf20Sopenharmony_ci /*if the process-device list isn't empty*/ 8868c2ecf20Sopenharmony_ci if (kfd_has_process_device_data(p)) { 8878c2ecf20Sopenharmony_ci /* Run over all pdd of the process */ 8888c2ecf20Sopenharmony_ci pdd = kfd_get_first_process_device_data(p); 8898c2ecf20Sopenharmony_ci do { 8908c2ecf20Sopenharmony_ci pAperture = 8918c2ecf20Sopenharmony_ci &args->process_apertures[args->num_of_nodes]; 8928c2ecf20Sopenharmony_ci pAperture->gpu_id = pdd->dev->id; 8938c2ecf20Sopenharmony_ci pAperture->lds_base = pdd->lds_base; 8948c2ecf20Sopenharmony_ci pAperture->lds_limit = pdd->lds_limit; 8958c2ecf20Sopenharmony_ci pAperture->gpuvm_base = pdd->gpuvm_base; 8968c2ecf20Sopenharmony_ci pAperture->gpuvm_limit = pdd->gpuvm_limit; 8978c2ecf20Sopenharmony_ci pAperture->scratch_base = pdd->scratch_base; 8988c2ecf20Sopenharmony_ci pAperture->scratch_limit = pdd->scratch_limit; 8998c2ecf20Sopenharmony_ci 9008c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9018c2ecf20Sopenharmony_ci "node id %u\n", args->num_of_nodes); 9028c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9038c2ecf20Sopenharmony_ci "gpu id %u\n", pdd->dev->id); 9048c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9058c2ecf20Sopenharmony_ci "lds_base %llX\n", pdd->lds_base); 9068c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9078c2ecf20Sopenharmony_ci "lds_limit %llX\n", pdd->lds_limit); 9088c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9098c2ecf20Sopenharmony_ci "gpuvm_base %llX\n", pdd->gpuvm_base); 9108c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9118c2ecf20Sopenharmony_ci "gpuvm_limit %llX\n", pdd->gpuvm_limit); 9128c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9138c2ecf20Sopenharmony_ci "scratch_base %llX\n", pdd->scratch_base); 9148c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9158c2ecf20Sopenharmony_ci "scratch_limit %llX\n", pdd->scratch_limit); 9168c2ecf20Sopenharmony_ci 9178c2ecf20Sopenharmony_ci args->num_of_nodes++; 9188c2ecf20Sopenharmony_ci 9198c2ecf20Sopenharmony_ci pdd = kfd_get_next_process_device_data(p, pdd); 9208c2ecf20Sopenharmony_ci } while (pdd && (args->num_of_nodes < NUM_OF_SUPPORTED_GPUS)); 9218c2ecf20Sopenharmony_ci } 9228c2ecf20Sopenharmony_ci 9238c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 9248c2ecf20Sopenharmony_ci 9258c2ecf20Sopenharmony_ci return 0; 9268c2ecf20Sopenharmony_ci} 9278c2ecf20Sopenharmony_ci 9288c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_process_apertures_new(struct file *filp, 9298c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 9308c2ecf20Sopenharmony_ci{ 9318c2ecf20Sopenharmony_ci struct kfd_ioctl_get_process_apertures_new_args *args = data; 9328c2ecf20Sopenharmony_ci struct kfd_process_device_apertures *pa; 9338c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 9348c2ecf20Sopenharmony_ci uint32_t nodes = 0; 9358c2ecf20Sopenharmony_ci int ret; 9368c2ecf20Sopenharmony_ci 9378c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "get apertures for PASID 0x%x", p->pasid); 9388c2ecf20Sopenharmony_ci 9398c2ecf20Sopenharmony_ci if (args->num_of_nodes == 0) { 9408c2ecf20Sopenharmony_ci /* Return number of nodes, so that user space can alloacate 9418c2ecf20Sopenharmony_ci * sufficient memory 9428c2ecf20Sopenharmony_ci */ 9438c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 9448c2ecf20Sopenharmony_ci 9458c2ecf20Sopenharmony_ci if (!kfd_has_process_device_data(p)) 9468c2ecf20Sopenharmony_ci goto out_unlock; 9478c2ecf20Sopenharmony_ci 9488c2ecf20Sopenharmony_ci /* Run over all pdd of the process */ 9498c2ecf20Sopenharmony_ci pdd = kfd_get_first_process_device_data(p); 9508c2ecf20Sopenharmony_ci do { 9518c2ecf20Sopenharmony_ci args->num_of_nodes++; 9528c2ecf20Sopenharmony_ci pdd = kfd_get_next_process_device_data(p, pdd); 9538c2ecf20Sopenharmony_ci } while (pdd); 9548c2ecf20Sopenharmony_ci 9558c2ecf20Sopenharmony_ci goto out_unlock; 9568c2ecf20Sopenharmony_ci } 9578c2ecf20Sopenharmony_ci 9588c2ecf20Sopenharmony_ci /* Fill in process-aperture information for all available 9598c2ecf20Sopenharmony_ci * nodes, but not more than args->num_of_nodes as that is 9608c2ecf20Sopenharmony_ci * the amount of memory allocated by user 9618c2ecf20Sopenharmony_ci */ 9628c2ecf20Sopenharmony_ci pa = kzalloc((sizeof(struct kfd_process_device_apertures) * 9638c2ecf20Sopenharmony_ci args->num_of_nodes), GFP_KERNEL); 9648c2ecf20Sopenharmony_ci if (!pa) 9658c2ecf20Sopenharmony_ci return -ENOMEM; 9668c2ecf20Sopenharmony_ci 9678c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 9688c2ecf20Sopenharmony_ci 9698c2ecf20Sopenharmony_ci if (!kfd_has_process_device_data(p)) { 9708c2ecf20Sopenharmony_ci args->num_of_nodes = 0; 9718c2ecf20Sopenharmony_ci kfree(pa); 9728c2ecf20Sopenharmony_ci goto out_unlock; 9738c2ecf20Sopenharmony_ci } 9748c2ecf20Sopenharmony_ci 9758c2ecf20Sopenharmony_ci /* Run over all pdd of the process */ 9768c2ecf20Sopenharmony_ci pdd = kfd_get_first_process_device_data(p); 9778c2ecf20Sopenharmony_ci do { 9788c2ecf20Sopenharmony_ci pa[nodes].gpu_id = pdd->dev->id; 9798c2ecf20Sopenharmony_ci pa[nodes].lds_base = pdd->lds_base; 9808c2ecf20Sopenharmony_ci pa[nodes].lds_limit = pdd->lds_limit; 9818c2ecf20Sopenharmony_ci pa[nodes].gpuvm_base = pdd->gpuvm_base; 9828c2ecf20Sopenharmony_ci pa[nodes].gpuvm_limit = pdd->gpuvm_limit; 9838c2ecf20Sopenharmony_ci pa[nodes].scratch_base = pdd->scratch_base; 9848c2ecf20Sopenharmony_ci pa[nodes].scratch_limit = pdd->scratch_limit; 9858c2ecf20Sopenharmony_ci 9868c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9878c2ecf20Sopenharmony_ci "gpu id %u\n", pdd->dev->id); 9888c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9898c2ecf20Sopenharmony_ci "lds_base %llX\n", pdd->lds_base); 9908c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9918c2ecf20Sopenharmony_ci "lds_limit %llX\n", pdd->lds_limit); 9928c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9938c2ecf20Sopenharmony_ci "gpuvm_base %llX\n", pdd->gpuvm_base); 9948c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9958c2ecf20Sopenharmony_ci "gpuvm_limit %llX\n", pdd->gpuvm_limit); 9968c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9978c2ecf20Sopenharmony_ci "scratch_base %llX\n", pdd->scratch_base); 9988c2ecf20Sopenharmony_ci dev_dbg(kfd_device, 9998c2ecf20Sopenharmony_ci "scratch_limit %llX\n", pdd->scratch_limit); 10008c2ecf20Sopenharmony_ci nodes++; 10018c2ecf20Sopenharmony_ci 10028c2ecf20Sopenharmony_ci pdd = kfd_get_next_process_device_data(p, pdd); 10038c2ecf20Sopenharmony_ci } while (pdd && (nodes < args->num_of_nodes)); 10048c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 10058c2ecf20Sopenharmony_ci 10068c2ecf20Sopenharmony_ci args->num_of_nodes = nodes; 10078c2ecf20Sopenharmony_ci ret = copy_to_user( 10088c2ecf20Sopenharmony_ci (void __user *)args->kfd_process_device_apertures_ptr, 10098c2ecf20Sopenharmony_ci pa, 10108c2ecf20Sopenharmony_ci (nodes * sizeof(struct kfd_process_device_apertures))); 10118c2ecf20Sopenharmony_ci kfree(pa); 10128c2ecf20Sopenharmony_ci return ret ? -EFAULT : 0; 10138c2ecf20Sopenharmony_ci 10148c2ecf20Sopenharmony_ciout_unlock: 10158c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 10168c2ecf20Sopenharmony_ci return 0; 10178c2ecf20Sopenharmony_ci} 10188c2ecf20Sopenharmony_ci 10198c2ecf20Sopenharmony_cistatic int kfd_ioctl_create_event(struct file *filp, struct kfd_process *p, 10208c2ecf20Sopenharmony_ci void *data) 10218c2ecf20Sopenharmony_ci{ 10228c2ecf20Sopenharmony_ci struct kfd_ioctl_create_event_args *args = data; 10238c2ecf20Sopenharmony_ci int err; 10248c2ecf20Sopenharmony_ci 10258c2ecf20Sopenharmony_ci /* For dGPUs the event page is allocated in user mode. The 10268c2ecf20Sopenharmony_ci * handle is passed to KFD with the first call to this IOCTL 10278c2ecf20Sopenharmony_ci * through the event_page_offset field. 10288c2ecf20Sopenharmony_ci */ 10298c2ecf20Sopenharmony_ci if (args->event_page_offset) { 10308c2ecf20Sopenharmony_ci struct kfd_dev *kfd; 10318c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 10328c2ecf20Sopenharmony_ci void *mem, *kern_addr; 10338c2ecf20Sopenharmony_ci uint64_t size; 10348c2ecf20Sopenharmony_ci 10358c2ecf20Sopenharmony_ci if (p->signal_page) { 10368c2ecf20Sopenharmony_ci pr_err("Event page is already set\n"); 10378c2ecf20Sopenharmony_ci return -EINVAL; 10388c2ecf20Sopenharmony_ci } 10398c2ecf20Sopenharmony_ci 10408c2ecf20Sopenharmony_ci kfd = kfd_device_by_id(GET_GPU_ID(args->event_page_offset)); 10418c2ecf20Sopenharmony_ci if (!kfd) { 10428c2ecf20Sopenharmony_ci pr_err("Getting device by id failed in %s\n", __func__); 10438c2ecf20Sopenharmony_ci return -EINVAL; 10448c2ecf20Sopenharmony_ci } 10458c2ecf20Sopenharmony_ci 10468c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 10478c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(kfd, p); 10488c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 10498c2ecf20Sopenharmony_ci err = PTR_ERR(pdd); 10508c2ecf20Sopenharmony_ci goto out_unlock; 10518c2ecf20Sopenharmony_ci } 10528c2ecf20Sopenharmony_ci 10538c2ecf20Sopenharmony_ci mem = kfd_process_device_translate_handle(pdd, 10548c2ecf20Sopenharmony_ci GET_IDR_HANDLE(args->event_page_offset)); 10558c2ecf20Sopenharmony_ci if (!mem) { 10568c2ecf20Sopenharmony_ci pr_err("Can't find BO, offset is 0x%llx\n", 10578c2ecf20Sopenharmony_ci args->event_page_offset); 10588c2ecf20Sopenharmony_ci err = -EINVAL; 10598c2ecf20Sopenharmony_ci goto out_unlock; 10608c2ecf20Sopenharmony_ci } 10618c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 10628c2ecf20Sopenharmony_ci 10638c2ecf20Sopenharmony_ci err = amdgpu_amdkfd_gpuvm_map_gtt_bo_to_kernel(kfd->kgd, 10648c2ecf20Sopenharmony_ci mem, &kern_addr, &size); 10658c2ecf20Sopenharmony_ci if (err) { 10668c2ecf20Sopenharmony_ci pr_err("Failed to map event page to kernel\n"); 10678c2ecf20Sopenharmony_ci return err; 10688c2ecf20Sopenharmony_ci } 10698c2ecf20Sopenharmony_ci 10708c2ecf20Sopenharmony_ci err = kfd_event_page_set(p, kern_addr, size); 10718c2ecf20Sopenharmony_ci if (err) { 10728c2ecf20Sopenharmony_ci pr_err("Failed to set event page\n"); 10738c2ecf20Sopenharmony_ci return err; 10748c2ecf20Sopenharmony_ci } 10758c2ecf20Sopenharmony_ci } 10768c2ecf20Sopenharmony_ci 10778c2ecf20Sopenharmony_ci err = kfd_event_create(filp, p, args->event_type, 10788c2ecf20Sopenharmony_ci args->auto_reset != 0, args->node_id, 10798c2ecf20Sopenharmony_ci &args->event_id, &args->event_trigger_data, 10808c2ecf20Sopenharmony_ci &args->event_page_offset, 10818c2ecf20Sopenharmony_ci &args->event_slot_index); 10828c2ecf20Sopenharmony_ci 10838c2ecf20Sopenharmony_ci return err; 10848c2ecf20Sopenharmony_ci 10858c2ecf20Sopenharmony_ciout_unlock: 10868c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 10878c2ecf20Sopenharmony_ci return err; 10888c2ecf20Sopenharmony_ci} 10898c2ecf20Sopenharmony_ci 10908c2ecf20Sopenharmony_cistatic int kfd_ioctl_destroy_event(struct file *filp, struct kfd_process *p, 10918c2ecf20Sopenharmony_ci void *data) 10928c2ecf20Sopenharmony_ci{ 10938c2ecf20Sopenharmony_ci struct kfd_ioctl_destroy_event_args *args = data; 10948c2ecf20Sopenharmony_ci 10958c2ecf20Sopenharmony_ci return kfd_event_destroy(p, args->event_id); 10968c2ecf20Sopenharmony_ci} 10978c2ecf20Sopenharmony_ci 10988c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_event(struct file *filp, struct kfd_process *p, 10998c2ecf20Sopenharmony_ci void *data) 11008c2ecf20Sopenharmony_ci{ 11018c2ecf20Sopenharmony_ci struct kfd_ioctl_set_event_args *args = data; 11028c2ecf20Sopenharmony_ci 11038c2ecf20Sopenharmony_ci return kfd_set_event(p, args->event_id); 11048c2ecf20Sopenharmony_ci} 11058c2ecf20Sopenharmony_ci 11068c2ecf20Sopenharmony_cistatic int kfd_ioctl_reset_event(struct file *filp, struct kfd_process *p, 11078c2ecf20Sopenharmony_ci void *data) 11088c2ecf20Sopenharmony_ci{ 11098c2ecf20Sopenharmony_ci struct kfd_ioctl_reset_event_args *args = data; 11108c2ecf20Sopenharmony_ci 11118c2ecf20Sopenharmony_ci return kfd_reset_event(p, args->event_id); 11128c2ecf20Sopenharmony_ci} 11138c2ecf20Sopenharmony_ci 11148c2ecf20Sopenharmony_cistatic int kfd_ioctl_wait_events(struct file *filp, struct kfd_process *p, 11158c2ecf20Sopenharmony_ci void *data) 11168c2ecf20Sopenharmony_ci{ 11178c2ecf20Sopenharmony_ci struct kfd_ioctl_wait_events_args *args = data; 11188c2ecf20Sopenharmony_ci int err; 11198c2ecf20Sopenharmony_ci 11208c2ecf20Sopenharmony_ci err = kfd_wait_on_events(p, args->num_events, 11218c2ecf20Sopenharmony_ci (void __user *)args->events_ptr, 11228c2ecf20Sopenharmony_ci (args->wait_for_all != 0), 11238c2ecf20Sopenharmony_ci args->timeout, &args->wait_result); 11248c2ecf20Sopenharmony_ci 11258c2ecf20Sopenharmony_ci return err; 11268c2ecf20Sopenharmony_ci} 11278c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_scratch_backing_va(struct file *filep, 11288c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 11298c2ecf20Sopenharmony_ci{ 11308c2ecf20Sopenharmony_ci struct kfd_ioctl_set_scratch_backing_va_args *args = data; 11318c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 11328c2ecf20Sopenharmony_ci struct kfd_dev *dev; 11338c2ecf20Sopenharmony_ci long err; 11348c2ecf20Sopenharmony_ci 11358c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 11368c2ecf20Sopenharmony_ci if (!dev) 11378c2ecf20Sopenharmony_ci return -EINVAL; 11388c2ecf20Sopenharmony_ci 11398c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 11408c2ecf20Sopenharmony_ci 11418c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(dev, p); 11428c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 11438c2ecf20Sopenharmony_ci err = PTR_ERR(pdd); 11448c2ecf20Sopenharmony_ci goto bind_process_to_device_fail; 11458c2ecf20Sopenharmony_ci } 11468c2ecf20Sopenharmony_ci 11478c2ecf20Sopenharmony_ci pdd->qpd.sh_hidden_private_base = args->va_addr; 11488c2ecf20Sopenharmony_ci 11498c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 11508c2ecf20Sopenharmony_ci 11518c2ecf20Sopenharmony_ci if (dev->dqm->sched_policy == KFD_SCHED_POLICY_NO_HWS && 11528c2ecf20Sopenharmony_ci pdd->qpd.vmid != 0 && dev->kfd2kgd->set_scratch_backing_va) 11538c2ecf20Sopenharmony_ci dev->kfd2kgd->set_scratch_backing_va( 11548c2ecf20Sopenharmony_ci dev->kgd, args->va_addr, pdd->qpd.vmid); 11558c2ecf20Sopenharmony_ci 11568c2ecf20Sopenharmony_ci return 0; 11578c2ecf20Sopenharmony_ci 11588c2ecf20Sopenharmony_cibind_process_to_device_fail: 11598c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 11608c2ecf20Sopenharmony_ci return err; 11618c2ecf20Sopenharmony_ci} 11628c2ecf20Sopenharmony_ci 11638c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_tile_config(struct file *filep, 11648c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 11658c2ecf20Sopenharmony_ci{ 11668c2ecf20Sopenharmony_ci struct kfd_ioctl_get_tile_config_args *args = data; 11678c2ecf20Sopenharmony_ci struct kfd_dev *dev; 11688c2ecf20Sopenharmony_ci struct tile_config config; 11698c2ecf20Sopenharmony_ci int err = 0; 11708c2ecf20Sopenharmony_ci 11718c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 11728c2ecf20Sopenharmony_ci if (!dev) 11738c2ecf20Sopenharmony_ci return -EINVAL; 11748c2ecf20Sopenharmony_ci 11758c2ecf20Sopenharmony_ci amdgpu_amdkfd_get_tile_config(dev->kgd, &config); 11768c2ecf20Sopenharmony_ci 11778c2ecf20Sopenharmony_ci args->gb_addr_config = config.gb_addr_config; 11788c2ecf20Sopenharmony_ci args->num_banks = config.num_banks; 11798c2ecf20Sopenharmony_ci args->num_ranks = config.num_ranks; 11808c2ecf20Sopenharmony_ci 11818c2ecf20Sopenharmony_ci if (args->num_tile_configs > config.num_tile_configs) 11828c2ecf20Sopenharmony_ci args->num_tile_configs = config.num_tile_configs; 11838c2ecf20Sopenharmony_ci err = copy_to_user((void __user *)args->tile_config_ptr, 11848c2ecf20Sopenharmony_ci config.tile_config_ptr, 11858c2ecf20Sopenharmony_ci args->num_tile_configs * sizeof(uint32_t)); 11868c2ecf20Sopenharmony_ci if (err) { 11878c2ecf20Sopenharmony_ci args->num_tile_configs = 0; 11888c2ecf20Sopenharmony_ci return -EFAULT; 11898c2ecf20Sopenharmony_ci } 11908c2ecf20Sopenharmony_ci 11918c2ecf20Sopenharmony_ci if (args->num_macro_tile_configs > config.num_macro_tile_configs) 11928c2ecf20Sopenharmony_ci args->num_macro_tile_configs = 11938c2ecf20Sopenharmony_ci config.num_macro_tile_configs; 11948c2ecf20Sopenharmony_ci err = copy_to_user((void __user *)args->macro_tile_config_ptr, 11958c2ecf20Sopenharmony_ci config.macro_tile_config_ptr, 11968c2ecf20Sopenharmony_ci args->num_macro_tile_configs * sizeof(uint32_t)); 11978c2ecf20Sopenharmony_ci if (err) { 11988c2ecf20Sopenharmony_ci args->num_macro_tile_configs = 0; 11998c2ecf20Sopenharmony_ci return -EFAULT; 12008c2ecf20Sopenharmony_ci } 12018c2ecf20Sopenharmony_ci 12028c2ecf20Sopenharmony_ci return 0; 12038c2ecf20Sopenharmony_ci} 12048c2ecf20Sopenharmony_ci 12058c2ecf20Sopenharmony_cistatic int kfd_ioctl_acquire_vm(struct file *filep, struct kfd_process *p, 12068c2ecf20Sopenharmony_ci void *data) 12078c2ecf20Sopenharmony_ci{ 12088c2ecf20Sopenharmony_ci struct kfd_ioctl_acquire_vm_args *args = data; 12098c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 12108c2ecf20Sopenharmony_ci struct kfd_dev *dev; 12118c2ecf20Sopenharmony_ci struct file *drm_file; 12128c2ecf20Sopenharmony_ci int ret; 12138c2ecf20Sopenharmony_ci 12148c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 12158c2ecf20Sopenharmony_ci if (!dev) 12168c2ecf20Sopenharmony_ci return -EINVAL; 12178c2ecf20Sopenharmony_ci 12188c2ecf20Sopenharmony_ci drm_file = fget(args->drm_fd); 12198c2ecf20Sopenharmony_ci if (!drm_file) 12208c2ecf20Sopenharmony_ci return -EINVAL; 12218c2ecf20Sopenharmony_ci 12228c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 12238c2ecf20Sopenharmony_ci 12248c2ecf20Sopenharmony_ci pdd = kfd_get_process_device_data(dev, p); 12258c2ecf20Sopenharmony_ci if (!pdd) { 12268c2ecf20Sopenharmony_ci ret = -EINVAL; 12278c2ecf20Sopenharmony_ci goto err_unlock; 12288c2ecf20Sopenharmony_ci } 12298c2ecf20Sopenharmony_ci 12308c2ecf20Sopenharmony_ci if (pdd->drm_file) { 12318c2ecf20Sopenharmony_ci ret = pdd->drm_file == drm_file ? 0 : -EBUSY; 12328c2ecf20Sopenharmony_ci goto err_unlock; 12338c2ecf20Sopenharmony_ci } 12348c2ecf20Sopenharmony_ci 12358c2ecf20Sopenharmony_ci ret = kfd_process_device_init_vm(pdd, drm_file); 12368c2ecf20Sopenharmony_ci if (ret) 12378c2ecf20Sopenharmony_ci goto err_unlock; 12388c2ecf20Sopenharmony_ci /* On success, the PDD keeps the drm_file reference */ 12398c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 12408c2ecf20Sopenharmony_ci 12418c2ecf20Sopenharmony_ci return 0; 12428c2ecf20Sopenharmony_ci 12438c2ecf20Sopenharmony_cierr_unlock: 12448c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 12458c2ecf20Sopenharmony_ci fput(drm_file); 12468c2ecf20Sopenharmony_ci return ret; 12478c2ecf20Sopenharmony_ci} 12488c2ecf20Sopenharmony_ci 12498c2ecf20Sopenharmony_cibool kfd_dev_is_large_bar(struct kfd_dev *dev) 12508c2ecf20Sopenharmony_ci{ 12518c2ecf20Sopenharmony_ci struct kfd_local_mem_info mem_info; 12528c2ecf20Sopenharmony_ci 12538c2ecf20Sopenharmony_ci if (debug_largebar) { 12548c2ecf20Sopenharmony_ci pr_debug("Simulate large-bar allocation on non large-bar machine\n"); 12558c2ecf20Sopenharmony_ci return true; 12568c2ecf20Sopenharmony_ci } 12578c2ecf20Sopenharmony_ci 12588c2ecf20Sopenharmony_ci if (dev->use_iommu_v2) 12598c2ecf20Sopenharmony_ci return false; 12608c2ecf20Sopenharmony_ci 12618c2ecf20Sopenharmony_ci amdgpu_amdkfd_get_local_mem_info(dev->kgd, &mem_info); 12628c2ecf20Sopenharmony_ci if (mem_info.local_mem_size_private == 0 && 12638c2ecf20Sopenharmony_ci mem_info.local_mem_size_public > 0) 12648c2ecf20Sopenharmony_ci return true; 12658c2ecf20Sopenharmony_ci return false; 12668c2ecf20Sopenharmony_ci} 12678c2ecf20Sopenharmony_ci 12688c2ecf20Sopenharmony_cistatic int kfd_ioctl_alloc_memory_of_gpu(struct file *filep, 12698c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 12708c2ecf20Sopenharmony_ci{ 12718c2ecf20Sopenharmony_ci struct kfd_ioctl_alloc_memory_of_gpu_args *args = data; 12728c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 12738c2ecf20Sopenharmony_ci void *mem; 12748c2ecf20Sopenharmony_ci struct kfd_dev *dev; 12758c2ecf20Sopenharmony_ci int idr_handle; 12768c2ecf20Sopenharmony_ci long err; 12778c2ecf20Sopenharmony_ci uint64_t offset = args->mmap_offset; 12788c2ecf20Sopenharmony_ci uint32_t flags = args->flags; 12798c2ecf20Sopenharmony_ci 12808c2ecf20Sopenharmony_ci if (args->size == 0) 12818c2ecf20Sopenharmony_ci return -EINVAL; 12828c2ecf20Sopenharmony_ci 12838c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 12848c2ecf20Sopenharmony_ci if (!dev) 12858c2ecf20Sopenharmony_ci return -EINVAL; 12868c2ecf20Sopenharmony_ci 12878c2ecf20Sopenharmony_ci if ((flags & KFD_IOC_ALLOC_MEM_FLAGS_PUBLIC) && 12888c2ecf20Sopenharmony_ci (flags & KFD_IOC_ALLOC_MEM_FLAGS_VRAM) && 12898c2ecf20Sopenharmony_ci !kfd_dev_is_large_bar(dev)) { 12908c2ecf20Sopenharmony_ci pr_err("Alloc host visible vram on small bar is not allowed\n"); 12918c2ecf20Sopenharmony_ci return -EINVAL; 12928c2ecf20Sopenharmony_ci } 12938c2ecf20Sopenharmony_ci 12948c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 12958c2ecf20Sopenharmony_ci 12968c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(dev, p); 12978c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 12988c2ecf20Sopenharmony_ci err = PTR_ERR(pdd); 12998c2ecf20Sopenharmony_ci goto err_unlock; 13008c2ecf20Sopenharmony_ci } 13018c2ecf20Sopenharmony_ci 13028c2ecf20Sopenharmony_ci if (flags & KFD_IOC_ALLOC_MEM_FLAGS_DOORBELL) { 13038c2ecf20Sopenharmony_ci if (args->size != kfd_doorbell_process_slice(dev)) { 13048c2ecf20Sopenharmony_ci err = -EINVAL; 13058c2ecf20Sopenharmony_ci goto err_unlock; 13068c2ecf20Sopenharmony_ci } 13078c2ecf20Sopenharmony_ci offset = kfd_get_process_doorbells(pdd); 13088c2ecf20Sopenharmony_ci } else if (flags & KFD_IOC_ALLOC_MEM_FLAGS_MMIO_REMAP) { 13098c2ecf20Sopenharmony_ci if (args->size != PAGE_SIZE) { 13108c2ecf20Sopenharmony_ci err = -EINVAL; 13118c2ecf20Sopenharmony_ci goto err_unlock; 13128c2ecf20Sopenharmony_ci } 13138c2ecf20Sopenharmony_ci offset = amdgpu_amdkfd_get_mmio_remap_phys_addr(dev->kgd); 13148c2ecf20Sopenharmony_ci if (!offset) { 13158c2ecf20Sopenharmony_ci err = -ENOMEM; 13168c2ecf20Sopenharmony_ci goto err_unlock; 13178c2ecf20Sopenharmony_ci } 13188c2ecf20Sopenharmony_ci } 13198c2ecf20Sopenharmony_ci 13208c2ecf20Sopenharmony_ci err = amdgpu_amdkfd_gpuvm_alloc_memory_of_gpu( 13218c2ecf20Sopenharmony_ci dev->kgd, args->va_addr, args->size, 13228c2ecf20Sopenharmony_ci pdd->vm, (struct kgd_mem **) &mem, &offset, 13238c2ecf20Sopenharmony_ci flags); 13248c2ecf20Sopenharmony_ci 13258c2ecf20Sopenharmony_ci if (err) 13268c2ecf20Sopenharmony_ci goto err_unlock; 13278c2ecf20Sopenharmony_ci 13288c2ecf20Sopenharmony_ci idr_handle = kfd_process_device_create_obj_handle(pdd, mem); 13298c2ecf20Sopenharmony_ci if (idr_handle < 0) { 13308c2ecf20Sopenharmony_ci err = -EFAULT; 13318c2ecf20Sopenharmony_ci goto err_free; 13328c2ecf20Sopenharmony_ci } 13338c2ecf20Sopenharmony_ci 13348c2ecf20Sopenharmony_ci /* Update the VRAM usage count */ 13358c2ecf20Sopenharmony_ci if (flags & KFD_IOC_ALLOC_MEM_FLAGS_VRAM) 13368c2ecf20Sopenharmony_ci WRITE_ONCE(pdd->vram_usage, pdd->vram_usage + args->size); 13378c2ecf20Sopenharmony_ci 13388c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 13398c2ecf20Sopenharmony_ci 13408c2ecf20Sopenharmony_ci args->handle = MAKE_HANDLE(args->gpu_id, idr_handle); 13418c2ecf20Sopenharmony_ci args->mmap_offset = offset; 13428c2ecf20Sopenharmony_ci 13438c2ecf20Sopenharmony_ci /* MMIO is mapped through kfd device 13448c2ecf20Sopenharmony_ci * Generate a kfd mmap offset 13458c2ecf20Sopenharmony_ci */ 13468c2ecf20Sopenharmony_ci if (flags & KFD_IOC_ALLOC_MEM_FLAGS_MMIO_REMAP) 13478c2ecf20Sopenharmony_ci args->mmap_offset = KFD_MMAP_TYPE_MMIO 13488c2ecf20Sopenharmony_ci | KFD_MMAP_GPU_ID(args->gpu_id); 13498c2ecf20Sopenharmony_ci 13508c2ecf20Sopenharmony_ci return 0; 13518c2ecf20Sopenharmony_ci 13528c2ecf20Sopenharmony_cierr_free: 13538c2ecf20Sopenharmony_ci amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd, (struct kgd_mem *)mem, NULL); 13548c2ecf20Sopenharmony_cierr_unlock: 13558c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 13568c2ecf20Sopenharmony_ci return err; 13578c2ecf20Sopenharmony_ci} 13588c2ecf20Sopenharmony_ci 13598c2ecf20Sopenharmony_cistatic int kfd_ioctl_free_memory_of_gpu(struct file *filep, 13608c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 13618c2ecf20Sopenharmony_ci{ 13628c2ecf20Sopenharmony_ci struct kfd_ioctl_free_memory_of_gpu_args *args = data; 13638c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 13648c2ecf20Sopenharmony_ci void *mem; 13658c2ecf20Sopenharmony_ci struct kfd_dev *dev; 13668c2ecf20Sopenharmony_ci int ret; 13678c2ecf20Sopenharmony_ci uint64_t size = 0; 13688c2ecf20Sopenharmony_ci 13698c2ecf20Sopenharmony_ci dev = kfd_device_by_id(GET_GPU_ID(args->handle)); 13708c2ecf20Sopenharmony_ci if (!dev) 13718c2ecf20Sopenharmony_ci return -EINVAL; 13728c2ecf20Sopenharmony_ci 13738c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 13748c2ecf20Sopenharmony_ci 13758c2ecf20Sopenharmony_ci pdd = kfd_get_process_device_data(dev, p); 13768c2ecf20Sopenharmony_ci if (!pdd) { 13778c2ecf20Sopenharmony_ci pr_err("Process device data doesn't exist\n"); 13788c2ecf20Sopenharmony_ci ret = -EINVAL; 13798c2ecf20Sopenharmony_ci goto err_unlock; 13808c2ecf20Sopenharmony_ci } 13818c2ecf20Sopenharmony_ci 13828c2ecf20Sopenharmony_ci mem = kfd_process_device_translate_handle( 13838c2ecf20Sopenharmony_ci pdd, GET_IDR_HANDLE(args->handle)); 13848c2ecf20Sopenharmony_ci if (!mem) { 13858c2ecf20Sopenharmony_ci ret = -EINVAL; 13868c2ecf20Sopenharmony_ci goto err_unlock; 13878c2ecf20Sopenharmony_ci } 13888c2ecf20Sopenharmony_ci 13898c2ecf20Sopenharmony_ci ret = amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd, 13908c2ecf20Sopenharmony_ci (struct kgd_mem *)mem, &size); 13918c2ecf20Sopenharmony_ci 13928c2ecf20Sopenharmony_ci /* If freeing the buffer failed, leave the handle in place for 13938c2ecf20Sopenharmony_ci * clean-up during process tear-down. 13948c2ecf20Sopenharmony_ci */ 13958c2ecf20Sopenharmony_ci if (!ret) 13968c2ecf20Sopenharmony_ci kfd_process_device_remove_obj_handle( 13978c2ecf20Sopenharmony_ci pdd, GET_IDR_HANDLE(args->handle)); 13988c2ecf20Sopenharmony_ci 13998c2ecf20Sopenharmony_ci WRITE_ONCE(pdd->vram_usage, pdd->vram_usage - size); 14008c2ecf20Sopenharmony_ci 14018c2ecf20Sopenharmony_cierr_unlock: 14028c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 14038c2ecf20Sopenharmony_ci return ret; 14048c2ecf20Sopenharmony_ci} 14058c2ecf20Sopenharmony_ci 14068c2ecf20Sopenharmony_cistatic int kfd_ioctl_map_memory_to_gpu(struct file *filep, 14078c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 14088c2ecf20Sopenharmony_ci{ 14098c2ecf20Sopenharmony_ci struct kfd_ioctl_map_memory_to_gpu_args *args = data; 14108c2ecf20Sopenharmony_ci struct kfd_process_device *pdd, *peer_pdd; 14118c2ecf20Sopenharmony_ci void *mem; 14128c2ecf20Sopenharmony_ci struct kfd_dev *dev, *peer; 14138c2ecf20Sopenharmony_ci long err = 0; 14148c2ecf20Sopenharmony_ci int i; 14158c2ecf20Sopenharmony_ci uint32_t *devices_arr = NULL; 14168c2ecf20Sopenharmony_ci 14178c2ecf20Sopenharmony_ci dev = kfd_device_by_id(GET_GPU_ID(args->handle)); 14188c2ecf20Sopenharmony_ci if (!dev) 14198c2ecf20Sopenharmony_ci return -EINVAL; 14208c2ecf20Sopenharmony_ci 14218c2ecf20Sopenharmony_ci if (!args->n_devices) { 14228c2ecf20Sopenharmony_ci pr_debug("Device IDs array empty\n"); 14238c2ecf20Sopenharmony_ci return -EINVAL; 14248c2ecf20Sopenharmony_ci } 14258c2ecf20Sopenharmony_ci if (args->n_success > args->n_devices) { 14268c2ecf20Sopenharmony_ci pr_debug("n_success exceeds n_devices\n"); 14278c2ecf20Sopenharmony_ci return -EINVAL; 14288c2ecf20Sopenharmony_ci } 14298c2ecf20Sopenharmony_ci 14308c2ecf20Sopenharmony_ci devices_arr = kmalloc_array(args->n_devices, sizeof(*devices_arr), 14318c2ecf20Sopenharmony_ci GFP_KERNEL); 14328c2ecf20Sopenharmony_ci if (!devices_arr) 14338c2ecf20Sopenharmony_ci return -ENOMEM; 14348c2ecf20Sopenharmony_ci 14358c2ecf20Sopenharmony_ci err = copy_from_user(devices_arr, 14368c2ecf20Sopenharmony_ci (void __user *)args->device_ids_array_ptr, 14378c2ecf20Sopenharmony_ci args->n_devices * sizeof(*devices_arr)); 14388c2ecf20Sopenharmony_ci if (err != 0) { 14398c2ecf20Sopenharmony_ci err = -EFAULT; 14408c2ecf20Sopenharmony_ci goto copy_from_user_failed; 14418c2ecf20Sopenharmony_ci } 14428c2ecf20Sopenharmony_ci 14438c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 14448c2ecf20Sopenharmony_ci 14458c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(dev, p); 14468c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 14478c2ecf20Sopenharmony_ci err = PTR_ERR(pdd); 14488c2ecf20Sopenharmony_ci goto bind_process_to_device_failed; 14498c2ecf20Sopenharmony_ci } 14508c2ecf20Sopenharmony_ci 14518c2ecf20Sopenharmony_ci mem = kfd_process_device_translate_handle(pdd, 14528c2ecf20Sopenharmony_ci GET_IDR_HANDLE(args->handle)); 14538c2ecf20Sopenharmony_ci if (!mem) { 14548c2ecf20Sopenharmony_ci err = -ENOMEM; 14558c2ecf20Sopenharmony_ci goto get_mem_obj_from_handle_failed; 14568c2ecf20Sopenharmony_ci } 14578c2ecf20Sopenharmony_ci 14588c2ecf20Sopenharmony_ci for (i = args->n_success; i < args->n_devices; i++) { 14598c2ecf20Sopenharmony_ci peer = kfd_device_by_id(devices_arr[i]); 14608c2ecf20Sopenharmony_ci if (!peer) { 14618c2ecf20Sopenharmony_ci pr_debug("Getting device by id failed for 0x%x\n", 14628c2ecf20Sopenharmony_ci devices_arr[i]); 14638c2ecf20Sopenharmony_ci err = -EINVAL; 14648c2ecf20Sopenharmony_ci goto get_mem_obj_from_handle_failed; 14658c2ecf20Sopenharmony_ci } 14668c2ecf20Sopenharmony_ci 14678c2ecf20Sopenharmony_ci peer_pdd = kfd_bind_process_to_device(peer, p); 14688c2ecf20Sopenharmony_ci if (IS_ERR(peer_pdd)) { 14698c2ecf20Sopenharmony_ci err = PTR_ERR(peer_pdd); 14708c2ecf20Sopenharmony_ci goto get_mem_obj_from_handle_failed; 14718c2ecf20Sopenharmony_ci } 14728c2ecf20Sopenharmony_ci err = amdgpu_amdkfd_gpuvm_map_memory_to_gpu( 14738c2ecf20Sopenharmony_ci peer->kgd, (struct kgd_mem *)mem, peer_pdd->vm); 14748c2ecf20Sopenharmony_ci if (err) { 14758c2ecf20Sopenharmony_ci pr_err("Failed to map to gpu %d/%d\n", 14768c2ecf20Sopenharmony_ci i, args->n_devices); 14778c2ecf20Sopenharmony_ci goto map_memory_to_gpu_failed; 14788c2ecf20Sopenharmony_ci } 14798c2ecf20Sopenharmony_ci args->n_success = i+1; 14808c2ecf20Sopenharmony_ci } 14818c2ecf20Sopenharmony_ci 14828c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 14838c2ecf20Sopenharmony_ci 14848c2ecf20Sopenharmony_ci err = amdgpu_amdkfd_gpuvm_sync_memory(dev->kgd, (struct kgd_mem *) mem, true); 14858c2ecf20Sopenharmony_ci if (err) { 14868c2ecf20Sopenharmony_ci pr_debug("Sync memory failed, wait interrupted by user signal\n"); 14878c2ecf20Sopenharmony_ci goto sync_memory_failed; 14888c2ecf20Sopenharmony_ci } 14898c2ecf20Sopenharmony_ci 14908c2ecf20Sopenharmony_ci /* Flush TLBs after waiting for the page table updates to complete */ 14918c2ecf20Sopenharmony_ci for (i = 0; i < args->n_devices; i++) { 14928c2ecf20Sopenharmony_ci peer = kfd_device_by_id(devices_arr[i]); 14938c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(!peer)) 14948c2ecf20Sopenharmony_ci continue; 14958c2ecf20Sopenharmony_ci peer_pdd = kfd_get_process_device_data(peer, p); 14968c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(!peer_pdd)) 14978c2ecf20Sopenharmony_ci continue; 14988c2ecf20Sopenharmony_ci kfd_flush_tlb(peer_pdd); 14998c2ecf20Sopenharmony_ci } 15008c2ecf20Sopenharmony_ci 15018c2ecf20Sopenharmony_ci kfree(devices_arr); 15028c2ecf20Sopenharmony_ci 15038c2ecf20Sopenharmony_ci return err; 15048c2ecf20Sopenharmony_ci 15058c2ecf20Sopenharmony_cibind_process_to_device_failed: 15068c2ecf20Sopenharmony_ciget_mem_obj_from_handle_failed: 15078c2ecf20Sopenharmony_cimap_memory_to_gpu_failed: 15088c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 15098c2ecf20Sopenharmony_cicopy_from_user_failed: 15108c2ecf20Sopenharmony_cisync_memory_failed: 15118c2ecf20Sopenharmony_ci kfree(devices_arr); 15128c2ecf20Sopenharmony_ci 15138c2ecf20Sopenharmony_ci return err; 15148c2ecf20Sopenharmony_ci} 15158c2ecf20Sopenharmony_ci 15168c2ecf20Sopenharmony_cistatic int kfd_ioctl_unmap_memory_from_gpu(struct file *filep, 15178c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 15188c2ecf20Sopenharmony_ci{ 15198c2ecf20Sopenharmony_ci struct kfd_ioctl_unmap_memory_from_gpu_args *args = data; 15208c2ecf20Sopenharmony_ci struct kfd_process_device *pdd, *peer_pdd; 15218c2ecf20Sopenharmony_ci void *mem; 15228c2ecf20Sopenharmony_ci struct kfd_dev *dev, *peer; 15238c2ecf20Sopenharmony_ci long err = 0; 15248c2ecf20Sopenharmony_ci uint32_t *devices_arr = NULL, i; 15258c2ecf20Sopenharmony_ci 15268c2ecf20Sopenharmony_ci dev = kfd_device_by_id(GET_GPU_ID(args->handle)); 15278c2ecf20Sopenharmony_ci if (!dev) 15288c2ecf20Sopenharmony_ci return -EINVAL; 15298c2ecf20Sopenharmony_ci 15308c2ecf20Sopenharmony_ci if (!args->n_devices) { 15318c2ecf20Sopenharmony_ci pr_debug("Device IDs array empty\n"); 15328c2ecf20Sopenharmony_ci return -EINVAL; 15338c2ecf20Sopenharmony_ci } 15348c2ecf20Sopenharmony_ci if (args->n_success > args->n_devices) { 15358c2ecf20Sopenharmony_ci pr_debug("n_success exceeds n_devices\n"); 15368c2ecf20Sopenharmony_ci return -EINVAL; 15378c2ecf20Sopenharmony_ci } 15388c2ecf20Sopenharmony_ci 15398c2ecf20Sopenharmony_ci devices_arr = kmalloc_array(args->n_devices, sizeof(*devices_arr), 15408c2ecf20Sopenharmony_ci GFP_KERNEL); 15418c2ecf20Sopenharmony_ci if (!devices_arr) 15428c2ecf20Sopenharmony_ci return -ENOMEM; 15438c2ecf20Sopenharmony_ci 15448c2ecf20Sopenharmony_ci err = copy_from_user(devices_arr, 15458c2ecf20Sopenharmony_ci (void __user *)args->device_ids_array_ptr, 15468c2ecf20Sopenharmony_ci args->n_devices * sizeof(*devices_arr)); 15478c2ecf20Sopenharmony_ci if (err != 0) { 15488c2ecf20Sopenharmony_ci err = -EFAULT; 15498c2ecf20Sopenharmony_ci goto copy_from_user_failed; 15508c2ecf20Sopenharmony_ci } 15518c2ecf20Sopenharmony_ci 15528c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 15538c2ecf20Sopenharmony_ci 15548c2ecf20Sopenharmony_ci pdd = kfd_get_process_device_data(dev, p); 15558c2ecf20Sopenharmony_ci if (!pdd) { 15568c2ecf20Sopenharmony_ci err = -EINVAL; 15578c2ecf20Sopenharmony_ci goto bind_process_to_device_failed; 15588c2ecf20Sopenharmony_ci } 15598c2ecf20Sopenharmony_ci 15608c2ecf20Sopenharmony_ci mem = kfd_process_device_translate_handle(pdd, 15618c2ecf20Sopenharmony_ci GET_IDR_HANDLE(args->handle)); 15628c2ecf20Sopenharmony_ci if (!mem) { 15638c2ecf20Sopenharmony_ci err = -ENOMEM; 15648c2ecf20Sopenharmony_ci goto get_mem_obj_from_handle_failed; 15658c2ecf20Sopenharmony_ci } 15668c2ecf20Sopenharmony_ci 15678c2ecf20Sopenharmony_ci for (i = args->n_success; i < args->n_devices; i++) { 15688c2ecf20Sopenharmony_ci peer = kfd_device_by_id(devices_arr[i]); 15698c2ecf20Sopenharmony_ci if (!peer) { 15708c2ecf20Sopenharmony_ci err = -EINVAL; 15718c2ecf20Sopenharmony_ci goto get_mem_obj_from_handle_failed; 15728c2ecf20Sopenharmony_ci } 15738c2ecf20Sopenharmony_ci 15748c2ecf20Sopenharmony_ci peer_pdd = kfd_get_process_device_data(peer, p); 15758c2ecf20Sopenharmony_ci if (!peer_pdd) { 15768c2ecf20Sopenharmony_ci err = -ENODEV; 15778c2ecf20Sopenharmony_ci goto get_mem_obj_from_handle_failed; 15788c2ecf20Sopenharmony_ci } 15798c2ecf20Sopenharmony_ci err = amdgpu_amdkfd_gpuvm_unmap_memory_from_gpu( 15808c2ecf20Sopenharmony_ci peer->kgd, (struct kgd_mem *)mem, peer_pdd->vm); 15818c2ecf20Sopenharmony_ci if (err) { 15828c2ecf20Sopenharmony_ci pr_err("Failed to unmap from gpu %d/%d\n", 15838c2ecf20Sopenharmony_ci i, args->n_devices); 15848c2ecf20Sopenharmony_ci goto unmap_memory_from_gpu_failed; 15858c2ecf20Sopenharmony_ci } 15868c2ecf20Sopenharmony_ci args->n_success = i+1; 15878c2ecf20Sopenharmony_ci } 15888c2ecf20Sopenharmony_ci kfree(devices_arr); 15898c2ecf20Sopenharmony_ci 15908c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 15918c2ecf20Sopenharmony_ci 15928c2ecf20Sopenharmony_ci return 0; 15938c2ecf20Sopenharmony_ci 15948c2ecf20Sopenharmony_cibind_process_to_device_failed: 15958c2ecf20Sopenharmony_ciget_mem_obj_from_handle_failed: 15968c2ecf20Sopenharmony_ciunmap_memory_from_gpu_failed: 15978c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 15988c2ecf20Sopenharmony_cicopy_from_user_failed: 15998c2ecf20Sopenharmony_ci kfree(devices_arr); 16008c2ecf20Sopenharmony_ci return err; 16018c2ecf20Sopenharmony_ci} 16028c2ecf20Sopenharmony_ci 16038c2ecf20Sopenharmony_cistatic int kfd_ioctl_alloc_queue_gws(struct file *filep, 16048c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 16058c2ecf20Sopenharmony_ci{ 16068c2ecf20Sopenharmony_ci int retval; 16078c2ecf20Sopenharmony_ci struct kfd_ioctl_alloc_queue_gws_args *args = data; 16088c2ecf20Sopenharmony_ci struct queue *q; 16098c2ecf20Sopenharmony_ci struct kfd_dev *dev; 16108c2ecf20Sopenharmony_ci 16118c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 16128c2ecf20Sopenharmony_ci q = pqm_get_user_queue(&p->pqm, args->queue_id); 16138c2ecf20Sopenharmony_ci 16148c2ecf20Sopenharmony_ci if (q) { 16158c2ecf20Sopenharmony_ci dev = q->device; 16168c2ecf20Sopenharmony_ci } else { 16178c2ecf20Sopenharmony_ci retval = -EINVAL; 16188c2ecf20Sopenharmony_ci goto out_unlock; 16198c2ecf20Sopenharmony_ci } 16208c2ecf20Sopenharmony_ci 16218c2ecf20Sopenharmony_ci if (!dev->gws) { 16228c2ecf20Sopenharmony_ci retval = -ENODEV; 16238c2ecf20Sopenharmony_ci goto out_unlock; 16248c2ecf20Sopenharmony_ci } 16258c2ecf20Sopenharmony_ci 16268c2ecf20Sopenharmony_ci if (dev->dqm->sched_policy == KFD_SCHED_POLICY_NO_HWS) { 16278c2ecf20Sopenharmony_ci retval = -ENODEV; 16288c2ecf20Sopenharmony_ci goto out_unlock; 16298c2ecf20Sopenharmony_ci } 16308c2ecf20Sopenharmony_ci 16318c2ecf20Sopenharmony_ci retval = pqm_set_gws(&p->pqm, args->queue_id, args->num_gws ? dev->gws : NULL); 16328c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 16338c2ecf20Sopenharmony_ci 16348c2ecf20Sopenharmony_ci args->first_gws = 0; 16358c2ecf20Sopenharmony_ci return retval; 16368c2ecf20Sopenharmony_ci 16378c2ecf20Sopenharmony_ciout_unlock: 16388c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 16398c2ecf20Sopenharmony_ci return retval; 16408c2ecf20Sopenharmony_ci} 16418c2ecf20Sopenharmony_ci 16428c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_dmabuf_info(struct file *filep, 16438c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 16448c2ecf20Sopenharmony_ci{ 16458c2ecf20Sopenharmony_ci struct kfd_ioctl_get_dmabuf_info_args *args = data; 16468c2ecf20Sopenharmony_ci struct kfd_dev *dev = NULL; 16478c2ecf20Sopenharmony_ci struct kgd_dev *dma_buf_kgd; 16488c2ecf20Sopenharmony_ci void *metadata_buffer = NULL; 16498c2ecf20Sopenharmony_ci uint32_t flags; 16508c2ecf20Sopenharmony_ci unsigned int i; 16518c2ecf20Sopenharmony_ci int r; 16528c2ecf20Sopenharmony_ci 16538c2ecf20Sopenharmony_ci /* Find a KFD GPU device that supports the get_dmabuf_info query */ 16548c2ecf20Sopenharmony_ci for (i = 0; kfd_topology_enum_kfd_devices(i, &dev) == 0; i++) 16558c2ecf20Sopenharmony_ci if (dev) 16568c2ecf20Sopenharmony_ci break; 16578c2ecf20Sopenharmony_ci if (!dev) 16588c2ecf20Sopenharmony_ci return -EINVAL; 16598c2ecf20Sopenharmony_ci 16608c2ecf20Sopenharmony_ci if (args->metadata_ptr) { 16618c2ecf20Sopenharmony_ci metadata_buffer = kzalloc(args->metadata_size, GFP_KERNEL); 16628c2ecf20Sopenharmony_ci if (!metadata_buffer) 16638c2ecf20Sopenharmony_ci return -ENOMEM; 16648c2ecf20Sopenharmony_ci } 16658c2ecf20Sopenharmony_ci 16668c2ecf20Sopenharmony_ci /* Get dmabuf info from KGD */ 16678c2ecf20Sopenharmony_ci r = amdgpu_amdkfd_get_dmabuf_info(dev->kgd, args->dmabuf_fd, 16688c2ecf20Sopenharmony_ci &dma_buf_kgd, &args->size, 16698c2ecf20Sopenharmony_ci metadata_buffer, args->metadata_size, 16708c2ecf20Sopenharmony_ci &args->metadata_size, &flags); 16718c2ecf20Sopenharmony_ci if (r) 16728c2ecf20Sopenharmony_ci goto exit; 16738c2ecf20Sopenharmony_ci 16748c2ecf20Sopenharmony_ci /* Reverse-lookup gpu_id from kgd pointer */ 16758c2ecf20Sopenharmony_ci dev = kfd_device_by_kgd(dma_buf_kgd); 16768c2ecf20Sopenharmony_ci if (!dev) { 16778c2ecf20Sopenharmony_ci r = -EINVAL; 16788c2ecf20Sopenharmony_ci goto exit; 16798c2ecf20Sopenharmony_ci } 16808c2ecf20Sopenharmony_ci args->gpu_id = dev->id; 16818c2ecf20Sopenharmony_ci args->flags = flags; 16828c2ecf20Sopenharmony_ci 16838c2ecf20Sopenharmony_ci /* Copy metadata buffer to user mode */ 16848c2ecf20Sopenharmony_ci if (metadata_buffer) { 16858c2ecf20Sopenharmony_ci r = copy_to_user((void __user *)args->metadata_ptr, 16868c2ecf20Sopenharmony_ci metadata_buffer, args->metadata_size); 16878c2ecf20Sopenharmony_ci if (r != 0) 16888c2ecf20Sopenharmony_ci r = -EFAULT; 16898c2ecf20Sopenharmony_ci } 16908c2ecf20Sopenharmony_ci 16918c2ecf20Sopenharmony_ciexit: 16928c2ecf20Sopenharmony_ci kfree(metadata_buffer); 16938c2ecf20Sopenharmony_ci 16948c2ecf20Sopenharmony_ci return r; 16958c2ecf20Sopenharmony_ci} 16968c2ecf20Sopenharmony_ci 16978c2ecf20Sopenharmony_cistatic int kfd_ioctl_import_dmabuf(struct file *filep, 16988c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 16998c2ecf20Sopenharmony_ci{ 17008c2ecf20Sopenharmony_ci struct kfd_ioctl_import_dmabuf_args *args = data; 17018c2ecf20Sopenharmony_ci struct kfd_process_device *pdd; 17028c2ecf20Sopenharmony_ci struct dma_buf *dmabuf; 17038c2ecf20Sopenharmony_ci struct kfd_dev *dev; 17048c2ecf20Sopenharmony_ci int idr_handle; 17058c2ecf20Sopenharmony_ci uint64_t size; 17068c2ecf20Sopenharmony_ci void *mem; 17078c2ecf20Sopenharmony_ci int r; 17088c2ecf20Sopenharmony_ci 17098c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpu_id); 17108c2ecf20Sopenharmony_ci if (!dev) 17118c2ecf20Sopenharmony_ci return -EINVAL; 17128c2ecf20Sopenharmony_ci 17138c2ecf20Sopenharmony_ci dmabuf = dma_buf_get(args->dmabuf_fd); 17148c2ecf20Sopenharmony_ci if (IS_ERR(dmabuf)) 17158c2ecf20Sopenharmony_ci return PTR_ERR(dmabuf); 17168c2ecf20Sopenharmony_ci 17178c2ecf20Sopenharmony_ci mutex_lock(&p->mutex); 17188c2ecf20Sopenharmony_ci 17198c2ecf20Sopenharmony_ci pdd = kfd_bind_process_to_device(dev, p); 17208c2ecf20Sopenharmony_ci if (IS_ERR(pdd)) { 17218c2ecf20Sopenharmony_ci r = PTR_ERR(pdd); 17228c2ecf20Sopenharmony_ci goto err_unlock; 17238c2ecf20Sopenharmony_ci } 17248c2ecf20Sopenharmony_ci 17258c2ecf20Sopenharmony_ci r = amdgpu_amdkfd_gpuvm_import_dmabuf(dev->kgd, dmabuf, 17268c2ecf20Sopenharmony_ci args->va_addr, pdd->vm, 17278c2ecf20Sopenharmony_ci (struct kgd_mem **)&mem, &size, 17288c2ecf20Sopenharmony_ci NULL); 17298c2ecf20Sopenharmony_ci if (r) 17308c2ecf20Sopenharmony_ci goto err_unlock; 17318c2ecf20Sopenharmony_ci 17328c2ecf20Sopenharmony_ci idr_handle = kfd_process_device_create_obj_handle(pdd, mem); 17338c2ecf20Sopenharmony_ci if (idr_handle < 0) { 17348c2ecf20Sopenharmony_ci r = -EFAULT; 17358c2ecf20Sopenharmony_ci goto err_free; 17368c2ecf20Sopenharmony_ci } 17378c2ecf20Sopenharmony_ci 17388c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 17398c2ecf20Sopenharmony_ci dma_buf_put(dmabuf); 17408c2ecf20Sopenharmony_ci 17418c2ecf20Sopenharmony_ci args->handle = MAKE_HANDLE(args->gpu_id, idr_handle); 17428c2ecf20Sopenharmony_ci 17438c2ecf20Sopenharmony_ci return 0; 17448c2ecf20Sopenharmony_ci 17458c2ecf20Sopenharmony_cierr_free: 17468c2ecf20Sopenharmony_ci amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd, (struct kgd_mem *)mem, NULL); 17478c2ecf20Sopenharmony_cierr_unlock: 17488c2ecf20Sopenharmony_ci mutex_unlock(&p->mutex); 17498c2ecf20Sopenharmony_ci dma_buf_put(dmabuf); 17508c2ecf20Sopenharmony_ci return r; 17518c2ecf20Sopenharmony_ci} 17528c2ecf20Sopenharmony_ci 17538c2ecf20Sopenharmony_ci/* Handle requests for watching SMI events */ 17548c2ecf20Sopenharmony_cistatic int kfd_ioctl_smi_events(struct file *filep, 17558c2ecf20Sopenharmony_ci struct kfd_process *p, void *data) 17568c2ecf20Sopenharmony_ci{ 17578c2ecf20Sopenharmony_ci struct kfd_ioctl_smi_events_args *args = data; 17588c2ecf20Sopenharmony_ci struct kfd_dev *dev; 17598c2ecf20Sopenharmony_ci 17608c2ecf20Sopenharmony_ci dev = kfd_device_by_id(args->gpuid); 17618c2ecf20Sopenharmony_ci if (!dev) 17628c2ecf20Sopenharmony_ci return -EINVAL; 17638c2ecf20Sopenharmony_ci 17648c2ecf20Sopenharmony_ci return kfd_smi_event_open(dev, &args->anon_fd); 17658c2ecf20Sopenharmony_ci} 17668c2ecf20Sopenharmony_ci 17678c2ecf20Sopenharmony_ci#define AMDKFD_IOCTL_DEF(ioctl, _func, _flags) \ 17688c2ecf20Sopenharmony_ci [_IOC_NR(ioctl)] = {.cmd = ioctl, .func = _func, .flags = _flags, \ 17698c2ecf20Sopenharmony_ci .cmd_drv = 0, .name = #ioctl} 17708c2ecf20Sopenharmony_ci 17718c2ecf20Sopenharmony_ci/** Ioctl table */ 17728c2ecf20Sopenharmony_cistatic const struct amdkfd_ioctl_desc amdkfd_ioctls[] = { 17738c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_VERSION, 17748c2ecf20Sopenharmony_ci kfd_ioctl_get_version, 0), 17758c2ecf20Sopenharmony_ci 17768c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_CREATE_QUEUE, 17778c2ecf20Sopenharmony_ci kfd_ioctl_create_queue, 0), 17788c2ecf20Sopenharmony_ci 17798c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_DESTROY_QUEUE, 17808c2ecf20Sopenharmony_ci kfd_ioctl_destroy_queue, 0), 17818c2ecf20Sopenharmony_ci 17828c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_MEMORY_POLICY, 17838c2ecf20Sopenharmony_ci kfd_ioctl_set_memory_policy, 0), 17848c2ecf20Sopenharmony_ci 17858c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_CLOCK_COUNTERS, 17868c2ecf20Sopenharmony_ci kfd_ioctl_get_clock_counters, 0), 17878c2ecf20Sopenharmony_ci 17888c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_PROCESS_APERTURES, 17898c2ecf20Sopenharmony_ci kfd_ioctl_get_process_apertures, 0), 17908c2ecf20Sopenharmony_ci 17918c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_UPDATE_QUEUE, 17928c2ecf20Sopenharmony_ci kfd_ioctl_update_queue, 0), 17938c2ecf20Sopenharmony_ci 17948c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_CREATE_EVENT, 17958c2ecf20Sopenharmony_ci kfd_ioctl_create_event, 0), 17968c2ecf20Sopenharmony_ci 17978c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_DESTROY_EVENT, 17988c2ecf20Sopenharmony_ci kfd_ioctl_destroy_event, 0), 17998c2ecf20Sopenharmony_ci 18008c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_EVENT, 18018c2ecf20Sopenharmony_ci kfd_ioctl_set_event, 0), 18028c2ecf20Sopenharmony_ci 18038c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_RESET_EVENT, 18048c2ecf20Sopenharmony_ci kfd_ioctl_reset_event, 0), 18058c2ecf20Sopenharmony_ci 18068c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_WAIT_EVENTS, 18078c2ecf20Sopenharmony_ci kfd_ioctl_wait_events, 0), 18088c2ecf20Sopenharmony_ci 18098c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_DBG_REGISTER, 18108c2ecf20Sopenharmony_ci kfd_ioctl_dbg_register, 0), 18118c2ecf20Sopenharmony_ci 18128c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_DBG_UNREGISTER, 18138c2ecf20Sopenharmony_ci kfd_ioctl_dbg_unregister, 0), 18148c2ecf20Sopenharmony_ci 18158c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_DBG_ADDRESS_WATCH, 18168c2ecf20Sopenharmony_ci kfd_ioctl_dbg_address_watch, 0), 18178c2ecf20Sopenharmony_ci 18188c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_DBG_WAVE_CONTROL, 18198c2ecf20Sopenharmony_ci kfd_ioctl_dbg_wave_control, 0), 18208c2ecf20Sopenharmony_ci 18218c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_SCRATCH_BACKING_VA, 18228c2ecf20Sopenharmony_ci kfd_ioctl_set_scratch_backing_va, 0), 18238c2ecf20Sopenharmony_ci 18248c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_TILE_CONFIG, 18258c2ecf20Sopenharmony_ci kfd_ioctl_get_tile_config, 0), 18268c2ecf20Sopenharmony_ci 18278c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_TRAP_HANDLER, 18288c2ecf20Sopenharmony_ci kfd_ioctl_set_trap_handler, 0), 18298c2ecf20Sopenharmony_ci 18308c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_PROCESS_APERTURES_NEW, 18318c2ecf20Sopenharmony_ci kfd_ioctl_get_process_apertures_new, 0), 18328c2ecf20Sopenharmony_ci 18338c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_ACQUIRE_VM, 18348c2ecf20Sopenharmony_ci kfd_ioctl_acquire_vm, 0), 18358c2ecf20Sopenharmony_ci 18368c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_ALLOC_MEMORY_OF_GPU, 18378c2ecf20Sopenharmony_ci kfd_ioctl_alloc_memory_of_gpu, 0), 18388c2ecf20Sopenharmony_ci 18398c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_FREE_MEMORY_OF_GPU, 18408c2ecf20Sopenharmony_ci kfd_ioctl_free_memory_of_gpu, 0), 18418c2ecf20Sopenharmony_ci 18428c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_MAP_MEMORY_TO_GPU, 18438c2ecf20Sopenharmony_ci kfd_ioctl_map_memory_to_gpu, 0), 18448c2ecf20Sopenharmony_ci 18458c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_UNMAP_MEMORY_FROM_GPU, 18468c2ecf20Sopenharmony_ci kfd_ioctl_unmap_memory_from_gpu, 0), 18478c2ecf20Sopenharmony_ci 18488c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_CU_MASK, 18498c2ecf20Sopenharmony_ci kfd_ioctl_set_cu_mask, 0), 18508c2ecf20Sopenharmony_ci 18518c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_QUEUE_WAVE_STATE, 18528c2ecf20Sopenharmony_ci kfd_ioctl_get_queue_wave_state, 0), 18538c2ecf20Sopenharmony_ci 18548c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_DMABUF_INFO, 18558c2ecf20Sopenharmony_ci kfd_ioctl_get_dmabuf_info, 0), 18568c2ecf20Sopenharmony_ci 18578c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_IMPORT_DMABUF, 18588c2ecf20Sopenharmony_ci kfd_ioctl_import_dmabuf, 0), 18598c2ecf20Sopenharmony_ci 18608c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_ALLOC_QUEUE_GWS, 18618c2ecf20Sopenharmony_ci kfd_ioctl_alloc_queue_gws, 0), 18628c2ecf20Sopenharmony_ci 18638c2ecf20Sopenharmony_ci AMDKFD_IOCTL_DEF(AMDKFD_IOC_SMI_EVENTS, 18648c2ecf20Sopenharmony_ci kfd_ioctl_smi_events, 0), 18658c2ecf20Sopenharmony_ci}; 18668c2ecf20Sopenharmony_ci 18678c2ecf20Sopenharmony_ci#define AMDKFD_CORE_IOCTL_COUNT ARRAY_SIZE(amdkfd_ioctls) 18688c2ecf20Sopenharmony_ci 18698c2ecf20Sopenharmony_cistatic long kfd_ioctl(struct file *filep, unsigned int cmd, unsigned long arg) 18708c2ecf20Sopenharmony_ci{ 18718c2ecf20Sopenharmony_ci struct kfd_process *process; 18728c2ecf20Sopenharmony_ci amdkfd_ioctl_t *func; 18738c2ecf20Sopenharmony_ci const struct amdkfd_ioctl_desc *ioctl = NULL; 18748c2ecf20Sopenharmony_ci unsigned int nr = _IOC_NR(cmd); 18758c2ecf20Sopenharmony_ci char stack_kdata[128]; 18768c2ecf20Sopenharmony_ci char *kdata = NULL; 18778c2ecf20Sopenharmony_ci unsigned int usize, asize; 18788c2ecf20Sopenharmony_ci int retcode = -EINVAL; 18798c2ecf20Sopenharmony_ci 18808c2ecf20Sopenharmony_ci if (nr >= AMDKFD_CORE_IOCTL_COUNT) 18818c2ecf20Sopenharmony_ci goto err_i1; 18828c2ecf20Sopenharmony_ci 18838c2ecf20Sopenharmony_ci if ((nr >= AMDKFD_COMMAND_START) && (nr < AMDKFD_COMMAND_END)) { 18848c2ecf20Sopenharmony_ci u32 amdkfd_size; 18858c2ecf20Sopenharmony_ci 18868c2ecf20Sopenharmony_ci ioctl = &amdkfd_ioctls[nr]; 18878c2ecf20Sopenharmony_ci 18888c2ecf20Sopenharmony_ci amdkfd_size = _IOC_SIZE(ioctl->cmd); 18898c2ecf20Sopenharmony_ci usize = asize = _IOC_SIZE(cmd); 18908c2ecf20Sopenharmony_ci if (amdkfd_size > asize) 18918c2ecf20Sopenharmony_ci asize = amdkfd_size; 18928c2ecf20Sopenharmony_ci 18938c2ecf20Sopenharmony_ci cmd = ioctl->cmd; 18948c2ecf20Sopenharmony_ci } else 18958c2ecf20Sopenharmony_ci goto err_i1; 18968c2ecf20Sopenharmony_ci 18978c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "ioctl cmd 0x%x (#0x%x), arg 0x%lx\n", cmd, nr, arg); 18988c2ecf20Sopenharmony_ci 18998c2ecf20Sopenharmony_ci /* Get the process struct from the filep. Only the process 19008c2ecf20Sopenharmony_ci * that opened /dev/kfd can use the file descriptor. Child 19018c2ecf20Sopenharmony_ci * processes need to create their own KFD device context. 19028c2ecf20Sopenharmony_ci */ 19038c2ecf20Sopenharmony_ci process = filep->private_data; 19048c2ecf20Sopenharmony_ci if (process->lead_thread != current->group_leader) { 19058c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "Using KFD FD in wrong process\n"); 19068c2ecf20Sopenharmony_ci retcode = -EBADF; 19078c2ecf20Sopenharmony_ci goto err_i1; 19088c2ecf20Sopenharmony_ci } 19098c2ecf20Sopenharmony_ci 19108c2ecf20Sopenharmony_ci /* Do not trust userspace, use our own definition */ 19118c2ecf20Sopenharmony_ci func = ioctl->func; 19128c2ecf20Sopenharmony_ci 19138c2ecf20Sopenharmony_ci if (unlikely(!func)) { 19148c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "no function\n"); 19158c2ecf20Sopenharmony_ci retcode = -EINVAL; 19168c2ecf20Sopenharmony_ci goto err_i1; 19178c2ecf20Sopenharmony_ci } 19188c2ecf20Sopenharmony_ci 19198c2ecf20Sopenharmony_ci if (cmd & (IOC_IN | IOC_OUT)) { 19208c2ecf20Sopenharmony_ci if (asize <= sizeof(stack_kdata)) { 19218c2ecf20Sopenharmony_ci kdata = stack_kdata; 19228c2ecf20Sopenharmony_ci } else { 19238c2ecf20Sopenharmony_ci kdata = kmalloc(asize, GFP_KERNEL); 19248c2ecf20Sopenharmony_ci if (!kdata) { 19258c2ecf20Sopenharmony_ci retcode = -ENOMEM; 19268c2ecf20Sopenharmony_ci goto err_i1; 19278c2ecf20Sopenharmony_ci } 19288c2ecf20Sopenharmony_ci } 19298c2ecf20Sopenharmony_ci if (asize > usize) 19308c2ecf20Sopenharmony_ci memset(kdata + usize, 0, asize - usize); 19318c2ecf20Sopenharmony_ci } 19328c2ecf20Sopenharmony_ci 19338c2ecf20Sopenharmony_ci if (cmd & IOC_IN) { 19348c2ecf20Sopenharmony_ci if (copy_from_user(kdata, (void __user *)arg, usize) != 0) { 19358c2ecf20Sopenharmony_ci retcode = -EFAULT; 19368c2ecf20Sopenharmony_ci goto err_i1; 19378c2ecf20Sopenharmony_ci } 19388c2ecf20Sopenharmony_ci } else if (cmd & IOC_OUT) { 19398c2ecf20Sopenharmony_ci memset(kdata, 0, usize); 19408c2ecf20Sopenharmony_ci } 19418c2ecf20Sopenharmony_ci 19428c2ecf20Sopenharmony_ci retcode = func(filep, process, kdata); 19438c2ecf20Sopenharmony_ci 19448c2ecf20Sopenharmony_ci if (cmd & IOC_OUT) 19458c2ecf20Sopenharmony_ci if (copy_to_user((void __user *)arg, kdata, usize) != 0) 19468c2ecf20Sopenharmony_ci retcode = -EFAULT; 19478c2ecf20Sopenharmony_ci 19488c2ecf20Sopenharmony_cierr_i1: 19498c2ecf20Sopenharmony_ci if (!ioctl) 19508c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "invalid ioctl: pid=%d, cmd=0x%02x, nr=0x%02x\n", 19518c2ecf20Sopenharmony_ci task_pid_nr(current), cmd, nr); 19528c2ecf20Sopenharmony_ci 19538c2ecf20Sopenharmony_ci if (kdata != stack_kdata) 19548c2ecf20Sopenharmony_ci kfree(kdata); 19558c2ecf20Sopenharmony_ci 19568c2ecf20Sopenharmony_ci if (retcode) 19578c2ecf20Sopenharmony_ci dev_dbg(kfd_device, "ioctl cmd (#0x%x), arg 0x%lx, ret = %d\n", 19588c2ecf20Sopenharmony_ci nr, arg, retcode); 19598c2ecf20Sopenharmony_ci 19608c2ecf20Sopenharmony_ci return retcode; 19618c2ecf20Sopenharmony_ci} 19628c2ecf20Sopenharmony_ci 19638c2ecf20Sopenharmony_cistatic int kfd_mmio_mmap(struct kfd_dev *dev, struct kfd_process *process, 19648c2ecf20Sopenharmony_ci struct vm_area_struct *vma) 19658c2ecf20Sopenharmony_ci{ 19668c2ecf20Sopenharmony_ci phys_addr_t address; 19678c2ecf20Sopenharmony_ci int ret; 19688c2ecf20Sopenharmony_ci 19698c2ecf20Sopenharmony_ci if (vma->vm_end - vma->vm_start != PAGE_SIZE) 19708c2ecf20Sopenharmony_ci return -EINVAL; 19718c2ecf20Sopenharmony_ci 19728c2ecf20Sopenharmony_ci address = amdgpu_amdkfd_get_mmio_remap_phys_addr(dev->kgd); 19738c2ecf20Sopenharmony_ci 19748c2ecf20Sopenharmony_ci vma->vm_flags |= VM_IO | VM_DONTCOPY | VM_DONTEXPAND | VM_NORESERVE | 19758c2ecf20Sopenharmony_ci VM_DONTDUMP | VM_PFNMAP; 19768c2ecf20Sopenharmony_ci 19778c2ecf20Sopenharmony_ci vma->vm_page_prot = pgprot_noncached(vma->vm_page_prot); 19788c2ecf20Sopenharmony_ci 19798c2ecf20Sopenharmony_ci pr_debug("pasid 0x%x mapping mmio page\n" 19808c2ecf20Sopenharmony_ci " target user address == 0x%08llX\n" 19818c2ecf20Sopenharmony_ci " physical address == 0x%08llX\n" 19828c2ecf20Sopenharmony_ci " vm_flags == 0x%04lX\n" 19838c2ecf20Sopenharmony_ci " size == 0x%04lX\n", 19848c2ecf20Sopenharmony_ci process->pasid, (unsigned long long) vma->vm_start, 19858c2ecf20Sopenharmony_ci address, vma->vm_flags, PAGE_SIZE); 19868c2ecf20Sopenharmony_ci 19878c2ecf20Sopenharmony_ci ret = io_remap_pfn_range(vma, 19888c2ecf20Sopenharmony_ci vma->vm_start, 19898c2ecf20Sopenharmony_ci address >> PAGE_SHIFT, 19908c2ecf20Sopenharmony_ci PAGE_SIZE, 19918c2ecf20Sopenharmony_ci vma->vm_page_prot); 19928c2ecf20Sopenharmony_ci return ret; 19938c2ecf20Sopenharmony_ci} 19948c2ecf20Sopenharmony_ci 19958c2ecf20Sopenharmony_ci 19968c2ecf20Sopenharmony_cistatic int kfd_mmap(struct file *filp, struct vm_area_struct *vma) 19978c2ecf20Sopenharmony_ci{ 19988c2ecf20Sopenharmony_ci struct kfd_process *process; 19998c2ecf20Sopenharmony_ci struct kfd_dev *dev = NULL; 20008c2ecf20Sopenharmony_ci unsigned long mmap_offset; 20018c2ecf20Sopenharmony_ci unsigned int gpu_id; 20028c2ecf20Sopenharmony_ci 20038c2ecf20Sopenharmony_ci process = kfd_get_process(current); 20048c2ecf20Sopenharmony_ci if (IS_ERR(process)) 20058c2ecf20Sopenharmony_ci return PTR_ERR(process); 20068c2ecf20Sopenharmony_ci 20078c2ecf20Sopenharmony_ci mmap_offset = vma->vm_pgoff << PAGE_SHIFT; 20088c2ecf20Sopenharmony_ci gpu_id = KFD_MMAP_GET_GPU_ID(mmap_offset); 20098c2ecf20Sopenharmony_ci if (gpu_id) 20108c2ecf20Sopenharmony_ci dev = kfd_device_by_id(gpu_id); 20118c2ecf20Sopenharmony_ci 20128c2ecf20Sopenharmony_ci switch (mmap_offset & KFD_MMAP_TYPE_MASK) { 20138c2ecf20Sopenharmony_ci case KFD_MMAP_TYPE_DOORBELL: 20148c2ecf20Sopenharmony_ci if (!dev) 20158c2ecf20Sopenharmony_ci return -ENODEV; 20168c2ecf20Sopenharmony_ci return kfd_doorbell_mmap(dev, process, vma); 20178c2ecf20Sopenharmony_ci 20188c2ecf20Sopenharmony_ci case KFD_MMAP_TYPE_EVENTS: 20198c2ecf20Sopenharmony_ci return kfd_event_mmap(process, vma); 20208c2ecf20Sopenharmony_ci 20218c2ecf20Sopenharmony_ci case KFD_MMAP_TYPE_RESERVED_MEM: 20228c2ecf20Sopenharmony_ci if (!dev) 20238c2ecf20Sopenharmony_ci return -ENODEV; 20248c2ecf20Sopenharmony_ci return kfd_reserved_mem_mmap(dev, process, vma); 20258c2ecf20Sopenharmony_ci case KFD_MMAP_TYPE_MMIO: 20268c2ecf20Sopenharmony_ci if (!dev) 20278c2ecf20Sopenharmony_ci return -ENODEV; 20288c2ecf20Sopenharmony_ci return kfd_mmio_mmap(dev, process, vma); 20298c2ecf20Sopenharmony_ci } 20308c2ecf20Sopenharmony_ci 20318c2ecf20Sopenharmony_ci return -EFAULT; 20328c2ecf20Sopenharmony_ci} 2033