/*
 * Copyright 2014 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
228c2ecf20Sopenharmony_ci
238c2ecf20Sopenharmony_ci#include <linux/device.h>
248c2ecf20Sopenharmony_ci#include <linux/export.h>
258c2ecf20Sopenharmony_ci#include <linux/err.h>
268c2ecf20Sopenharmony_ci#include <linux/fs.h>
278c2ecf20Sopenharmony_ci#include <linux/file.h>
288c2ecf20Sopenharmony_ci#include <linux/sched.h>
298c2ecf20Sopenharmony_ci#include <linux/slab.h>
308c2ecf20Sopenharmony_ci#include <linux/uaccess.h>
318c2ecf20Sopenharmony_ci#include <linux/compat.h>
328c2ecf20Sopenharmony_ci#include <uapi/linux/kfd_ioctl.h>
338c2ecf20Sopenharmony_ci#include <linux/time.h>
348c2ecf20Sopenharmony_ci#include <linux/mm.h>
358c2ecf20Sopenharmony_ci#include <linux/mman.h>
368c2ecf20Sopenharmony_ci#include <linux/dma-buf.h>
378c2ecf20Sopenharmony_ci#include <asm/processor.h>
388c2ecf20Sopenharmony_ci#include "kfd_priv.h"
398c2ecf20Sopenharmony_ci#include "kfd_device_queue_manager.h"
408c2ecf20Sopenharmony_ci#include "kfd_dbgmgr.h"
418c2ecf20Sopenharmony_ci#include "amdgpu_amdkfd.h"
428c2ecf20Sopenharmony_ci#include "kfd_smi_events.h"
438c2ecf20Sopenharmony_ci
448c2ecf20Sopenharmony_cistatic long kfd_ioctl(struct file *, unsigned int, unsigned long);
458c2ecf20Sopenharmony_cistatic int kfd_open(struct inode *, struct file *);
468c2ecf20Sopenharmony_cistatic int kfd_release(struct inode *, struct file *);
478c2ecf20Sopenharmony_cistatic int kfd_mmap(struct file *, struct vm_area_struct *);
488c2ecf20Sopenharmony_ci
498c2ecf20Sopenharmony_cistatic const char kfd_dev_name[] = "kfd";
508c2ecf20Sopenharmony_ci
518c2ecf20Sopenharmony_cistatic const struct file_operations kfd_fops = {
528c2ecf20Sopenharmony_ci	.owner = THIS_MODULE,
538c2ecf20Sopenharmony_ci	.unlocked_ioctl = kfd_ioctl,
548c2ecf20Sopenharmony_ci	.compat_ioctl = compat_ptr_ioctl,
558c2ecf20Sopenharmony_ci	.open = kfd_open,
568c2ecf20Sopenharmony_ci	.release = kfd_release,
578c2ecf20Sopenharmony_ci	.mmap = kfd_mmap,
588c2ecf20Sopenharmony_ci};
598c2ecf20Sopenharmony_ci
608c2ecf20Sopenharmony_cistatic int kfd_char_dev_major = -1;
618c2ecf20Sopenharmony_cistatic struct class *kfd_class;
628c2ecf20Sopenharmony_cistruct device *kfd_device;
638c2ecf20Sopenharmony_ci
648c2ecf20Sopenharmony_ciint kfd_chardev_init(void)
658c2ecf20Sopenharmony_ci{
668c2ecf20Sopenharmony_ci	int err = 0;
678c2ecf20Sopenharmony_ci
688c2ecf20Sopenharmony_ci	kfd_char_dev_major = register_chrdev(0, kfd_dev_name, &kfd_fops);
698c2ecf20Sopenharmony_ci	err = kfd_char_dev_major;
708c2ecf20Sopenharmony_ci	if (err < 0)
718c2ecf20Sopenharmony_ci		goto err_register_chrdev;
728c2ecf20Sopenharmony_ci
738c2ecf20Sopenharmony_ci	kfd_class = class_create(THIS_MODULE, kfd_dev_name);
748c2ecf20Sopenharmony_ci	err = PTR_ERR(kfd_class);
758c2ecf20Sopenharmony_ci	if (IS_ERR(kfd_class))
768c2ecf20Sopenharmony_ci		goto err_class_create;
778c2ecf20Sopenharmony_ci
788c2ecf20Sopenharmony_ci	kfd_device = device_create(kfd_class, NULL,
798c2ecf20Sopenharmony_ci					MKDEV(kfd_char_dev_major, 0),
808c2ecf20Sopenharmony_ci					NULL, kfd_dev_name);
818c2ecf20Sopenharmony_ci	err = PTR_ERR(kfd_device);
828c2ecf20Sopenharmony_ci	if (IS_ERR(kfd_device))
838c2ecf20Sopenharmony_ci		goto err_device_create;
848c2ecf20Sopenharmony_ci
858c2ecf20Sopenharmony_ci	return 0;
868c2ecf20Sopenharmony_ci
878c2ecf20Sopenharmony_cierr_device_create:
888c2ecf20Sopenharmony_ci	class_destroy(kfd_class);
898c2ecf20Sopenharmony_cierr_class_create:
908c2ecf20Sopenharmony_ci	unregister_chrdev(kfd_char_dev_major, kfd_dev_name);
918c2ecf20Sopenharmony_cierr_register_chrdev:
928c2ecf20Sopenharmony_ci	return err;
938c2ecf20Sopenharmony_ci}
948c2ecf20Sopenharmony_ci
958c2ecf20Sopenharmony_civoid kfd_chardev_exit(void)
968c2ecf20Sopenharmony_ci{
978c2ecf20Sopenharmony_ci	device_destroy(kfd_class, MKDEV(kfd_char_dev_major, 0));
988c2ecf20Sopenharmony_ci	class_destroy(kfd_class);
998c2ecf20Sopenharmony_ci	unregister_chrdev(kfd_char_dev_major, kfd_dev_name);
1008c2ecf20Sopenharmony_ci	kfd_device = NULL;
1018c2ecf20Sopenharmony_ci}
1028c2ecf20Sopenharmony_ci
1038c2ecf20Sopenharmony_cistruct device *kfd_chardev(void)
1048c2ecf20Sopenharmony_ci{
1058c2ecf20Sopenharmony_ci	return kfd_device;
1068c2ecf20Sopenharmony_ci}
1078c2ecf20Sopenharmony_ci
1088c2ecf20Sopenharmony_ci
1098c2ecf20Sopenharmony_cistatic int kfd_open(struct inode *inode, struct file *filep)
1108c2ecf20Sopenharmony_ci{
1118c2ecf20Sopenharmony_ci	struct kfd_process *process;
1128c2ecf20Sopenharmony_ci	bool is_32bit_user_mode;
1138c2ecf20Sopenharmony_ci
1148c2ecf20Sopenharmony_ci	if (iminor(inode) != 0)
1158c2ecf20Sopenharmony_ci		return -ENODEV;
1168c2ecf20Sopenharmony_ci
1178c2ecf20Sopenharmony_ci	is_32bit_user_mode = in_compat_syscall();
1188c2ecf20Sopenharmony_ci
1198c2ecf20Sopenharmony_ci	if (is_32bit_user_mode) {
1208c2ecf20Sopenharmony_ci		dev_warn(kfd_device,
1218c2ecf20Sopenharmony_ci			"Process %d (32-bit) failed to open /dev/kfd\n"
1228c2ecf20Sopenharmony_ci			"32-bit processes are not supported by amdkfd\n",
1238c2ecf20Sopenharmony_ci			current->pid);
1248c2ecf20Sopenharmony_ci		return -EPERM;
1258c2ecf20Sopenharmony_ci	}
1268c2ecf20Sopenharmony_ci
1278c2ecf20Sopenharmony_ci	process = kfd_create_process(filep);
1288c2ecf20Sopenharmony_ci	if (IS_ERR(process))
1298c2ecf20Sopenharmony_ci		return PTR_ERR(process);
1308c2ecf20Sopenharmony_ci
1318c2ecf20Sopenharmony_ci	if (kfd_is_locked()) {
1328c2ecf20Sopenharmony_ci		dev_dbg(kfd_device, "kfd is locked!\n"
1338c2ecf20Sopenharmony_ci				"process %d unreferenced", process->pasid);
1348c2ecf20Sopenharmony_ci		kfd_unref_process(process);
1358c2ecf20Sopenharmony_ci		return -EAGAIN;
1368c2ecf20Sopenharmony_ci	}
1378c2ecf20Sopenharmony_ci
1388c2ecf20Sopenharmony_ci	/* filep now owns the reference returned by kfd_create_process */
1398c2ecf20Sopenharmony_ci	filep->private_data = process;
1408c2ecf20Sopenharmony_ci
1418c2ecf20Sopenharmony_ci	dev_dbg(kfd_device, "process %d opened, compat mode (32 bit) - %d\n",
1428c2ecf20Sopenharmony_ci		process->pasid, process->is_32bit_user_mode);
1438c2ecf20Sopenharmony_ci
1448c2ecf20Sopenharmony_ci	return 0;
1458c2ecf20Sopenharmony_ci}
1468c2ecf20Sopenharmony_ci
1478c2ecf20Sopenharmony_cistatic int kfd_release(struct inode *inode, struct file *filep)
1488c2ecf20Sopenharmony_ci{
1498c2ecf20Sopenharmony_ci	struct kfd_process *process = filep->private_data;
1508c2ecf20Sopenharmony_ci
1518c2ecf20Sopenharmony_ci	if (process)
1528c2ecf20Sopenharmony_ci		kfd_unref_process(process);
1538c2ecf20Sopenharmony_ci
1548c2ecf20Sopenharmony_ci	return 0;
1558c2ecf20Sopenharmony_ci}
1568c2ecf20Sopenharmony_ci
1578c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_version(struct file *filep, struct kfd_process *p,
1588c2ecf20Sopenharmony_ci					void *data)
1598c2ecf20Sopenharmony_ci{
1608c2ecf20Sopenharmony_ci	struct kfd_ioctl_get_version_args *args = data;
1618c2ecf20Sopenharmony_ci
1628c2ecf20Sopenharmony_ci	args->major_version = KFD_IOCTL_MAJOR_VERSION;
1638c2ecf20Sopenharmony_ci	args->minor_version = KFD_IOCTL_MINOR_VERSION;
1648c2ecf20Sopenharmony_ci
1658c2ecf20Sopenharmony_ci	return 0;
1668c2ecf20Sopenharmony_ci}
1678c2ecf20Sopenharmony_ci
1688c2ecf20Sopenharmony_cistatic int set_queue_properties_from_user(struct queue_properties *q_properties,
1698c2ecf20Sopenharmony_ci				struct kfd_ioctl_create_queue_args *args)
1708c2ecf20Sopenharmony_ci{
1718c2ecf20Sopenharmony_ci	if (args->queue_percentage > KFD_MAX_QUEUE_PERCENTAGE) {
1728c2ecf20Sopenharmony_ci		pr_err("Queue percentage must be between 0 to KFD_MAX_QUEUE_PERCENTAGE\n");
1738c2ecf20Sopenharmony_ci		return -EINVAL;
1748c2ecf20Sopenharmony_ci	}
1758c2ecf20Sopenharmony_ci
1768c2ecf20Sopenharmony_ci	if (args->queue_priority > KFD_MAX_QUEUE_PRIORITY) {
1778c2ecf20Sopenharmony_ci		pr_err("Queue priority must be between 0 to KFD_MAX_QUEUE_PRIORITY\n");
1788c2ecf20Sopenharmony_ci		return -EINVAL;
1798c2ecf20Sopenharmony_ci	}
1808c2ecf20Sopenharmony_ci
1818c2ecf20Sopenharmony_ci	if ((args->ring_base_address) &&
1828c2ecf20Sopenharmony_ci		(!access_ok((const void __user *) args->ring_base_address,
1838c2ecf20Sopenharmony_ci			sizeof(uint64_t)))) {
1848c2ecf20Sopenharmony_ci		pr_err("Can't access ring base address\n");
1858c2ecf20Sopenharmony_ci		return -EFAULT;
1868c2ecf20Sopenharmony_ci	}
1878c2ecf20Sopenharmony_ci
1888c2ecf20Sopenharmony_ci	if (!is_power_of_2(args->ring_size) && (args->ring_size != 0)) {
1898c2ecf20Sopenharmony_ci		pr_err("Ring size must be a power of 2 or 0\n");
1908c2ecf20Sopenharmony_ci		return -EINVAL;
1918c2ecf20Sopenharmony_ci	}
1928c2ecf20Sopenharmony_ci
1938c2ecf20Sopenharmony_ci	if (!access_ok((const void __user *) args->read_pointer_address,
1948c2ecf20Sopenharmony_ci			sizeof(uint32_t))) {
1958c2ecf20Sopenharmony_ci		pr_err("Can't access read pointer\n");
1968c2ecf20Sopenharmony_ci		return -EFAULT;
1978c2ecf20Sopenharmony_ci	}
1988c2ecf20Sopenharmony_ci
1998c2ecf20Sopenharmony_ci	if (!access_ok((const void __user *) args->write_pointer_address,
2008c2ecf20Sopenharmony_ci			sizeof(uint32_t))) {
2018c2ecf20Sopenharmony_ci		pr_err("Can't access write pointer\n");
2028c2ecf20Sopenharmony_ci		return -EFAULT;
2038c2ecf20Sopenharmony_ci	}
2048c2ecf20Sopenharmony_ci
2058c2ecf20Sopenharmony_ci	if (args->eop_buffer_address &&
2068c2ecf20Sopenharmony_ci		!access_ok((const void __user *) args->eop_buffer_address,
2078c2ecf20Sopenharmony_ci			sizeof(uint32_t))) {
2088c2ecf20Sopenharmony_ci		pr_debug("Can't access eop buffer");
2098c2ecf20Sopenharmony_ci		return -EFAULT;
2108c2ecf20Sopenharmony_ci	}
2118c2ecf20Sopenharmony_ci
2128c2ecf20Sopenharmony_ci	if (args->ctx_save_restore_address &&
2138c2ecf20Sopenharmony_ci		!access_ok((const void __user *) args->ctx_save_restore_address,
2148c2ecf20Sopenharmony_ci			sizeof(uint32_t))) {
2158c2ecf20Sopenharmony_ci		pr_debug("Can't access ctx save restore buffer");
2168c2ecf20Sopenharmony_ci		return -EFAULT;
2178c2ecf20Sopenharmony_ci	}
2188c2ecf20Sopenharmony_ci
2198c2ecf20Sopenharmony_ci	q_properties->is_interop = false;
2208c2ecf20Sopenharmony_ci	q_properties->is_gws = false;
2218c2ecf20Sopenharmony_ci	q_properties->queue_percent = args->queue_percentage;
2228c2ecf20Sopenharmony_ci	q_properties->priority = args->queue_priority;
2238c2ecf20Sopenharmony_ci	q_properties->queue_address = args->ring_base_address;
2248c2ecf20Sopenharmony_ci	q_properties->queue_size = args->ring_size;
2258c2ecf20Sopenharmony_ci	q_properties->read_ptr = (uint32_t *) args->read_pointer_address;
2268c2ecf20Sopenharmony_ci	q_properties->write_ptr = (uint32_t *) args->write_pointer_address;
2278c2ecf20Sopenharmony_ci	q_properties->eop_ring_buffer_address = args->eop_buffer_address;
2288c2ecf20Sopenharmony_ci	q_properties->eop_ring_buffer_size = args->eop_buffer_size;
2298c2ecf20Sopenharmony_ci	q_properties->ctx_save_restore_area_address =
2308c2ecf20Sopenharmony_ci			args->ctx_save_restore_address;
2318c2ecf20Sopenharmony_ci	q_properties->ctx_save_restore_area_size = args->ctx_save_restore_size;
2328c2ecf20Sopenharmony_ci	q_properties->ctl_stack_size = args->ctl_stack_size;
2338c2ecf20Sopenharmony_ci	if (args->queue_type == KFD_IOC_QUEUE_TYPE_COMPUTE ||
2348c2ecf20Sopenharmony_ci		args->queue_type == KFD_IOC_QUEUE_TYPE_COMPUTE_AQL)
2358c2ecf20Sopenharmony_ci		q_properties->type = KFD_QUEUE_TYPE_COMPUTE;
2368c2ecf20Sopenharmony_ci	else if (args->queue_type == KFD_IOC_QUEUE_TYPE_SDMA)
2378c2ecf20Sopenharmony_ci		q_properties->type = KFD_QUEUE_TYPE_SDMA;
2388c2ecf20Sopenharmony_ci	else if (args->queue_type == KFD_IOC_QUEUE_TYPE_SDMA_XGMI)
2398c2ecf20Sopenharmony_ci		q_properties->type = KFD_QUEUE_TYPE_SDMA_XGMI;
2408c2ecf20Sopenharmony_ci	else
2418c2ecf20Sopenharmony_ci		return -ENOTSUPP;
2428c2ecf20Sopenharmony_ci
2438c2ecf20Sopenharmony_ci	if (args->queue_type == KFD_IOC_QUEUE_TYPE_COMPUTE_AQL)
2448c2ecf20Sopenharmony_ci		q_properties->format = KFD_QUEUE_FORMAT_AQL;
2458c2ecf20Sopenharmony_ci	else
2468c2ecf20Sopenharmony_ci		q_properties->format = KFD_QUEUE_FORMAT_PM4;
2478c2ecf20Sopenharmony_ci
2488c2ecf20Sopenharmony_ci	pr_debug("Queue Percentage: %d, %d\n",
2498c2ecf20Sopenharmony_ci			q_properties->queue_percent, args->queue_percentage);
2508c2ecf20Sopenharmony_ci
2518c2ecf20Sopenharmony_ci	pr_debug("Queue Priority: %d, %d\n",
2528c2ecf20Sopenharmony_ci			q_properties->priority, args->queue_priority);
2538c2ecf20Sopenharmony_ci
2548c2ecf20Sopenharmony_ci	pr_debug("Queue Address: 0x%llX, 0x%llX\n",
2558c2ecf20Sopenharmony_ci			q_properties->queue_address, args->ring_base_address);
2568c2ecf20Sopenharmony_ci
2578c2ecf20Sopenharmony_ci	pr_debug("Queue Size: 0x%llX, %u\n",
2588c2ecf20Sopenharmony_ci			q_properties->queue_size, args->ring_size);
2598c2ecf20Sopenharmony_ci
2608c2ecf20Sopenharmony_ci	pr_debug("Queue r/w Pointers: %px, %px\n",
2618c2ecf20Sopenharmony_ci			q_properties->read_ptr,
2628c2ecf20Sopenharmony_ci			q_properties->write_ptr);
2638c2ecf20Sopenharmony_ci
2648c2ecf20Sopenharmony_ci	pr_debug("Queue Format: %d\n", q_properties->format);
2658c2ecf20Sopenharmony_ci
2668c2ecf20Sopenharmony_ci	pr_debug("Queue EOP: 0x%llX\n", q_properties->eop_ring_buffer_address);
2678c2ecf20Sopenharmony_ci
2688c2ecf20Sopenharmony_ci	pr_debug("Queue CTX save area: 0x%llX\n",
2698c2ecf20Sopenharmony_ci			q_properties->ctx_save_restore_area_address);
2708c2ecf20Sopenharmony_ci
2718c2ecf20Sopenharmony_ci	return 0;
2728c2ecf20Sopenharmony_ci}
2738c2ecf20Sopenharmony_ci
2748c2ecf20Sopenharmony_cistatic int kfd_ioctl_create_queue(struct file *filep, struct kfd_process *p,
2758c2ecf20Sopenharmony_ci					void *data)
2768c2ecf20Sopenharmony_ci{
2778c2ecf20Sopenharmony_ci	struct kfd_ioctl_create_queue_args *args = data;
2788c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
2798c2ecf20Sopenharmony_ci	int err = 0;
2808c2ecf20Sopenharmony_ci	unsigned int queue_id;
2818c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
2828c2ecf20Sopenharmony_ci	struct queue_properties q_properties;
2838c2ecf20Sopenharmony_ci	uint32_t doorbell_offset_in_process = 0;
2848c2ecf20Sopenharmony_ci
2858c2ecf20Sopenharmony_ci	memset(&q_properties, 0, sizeof(struct queue_properties));
2868c2ecf20Sopenharmony_ci
2878c2ecf20Sopenharmony_ci	pr_debug("Creating queue ioctl\n");
2888c2ecf20Sopenharmony_ci
2898c2ecf20Sopenharmony_ci	err = set_queue_properties_from_user(&q_properties, args);
2908c2ecf20Sopenharmony_ci	if (err)
2918c2ecf20Sopenharmony_ci		return err;
2928c2ecf20Sopenharmony_ci
2938c2ecf20Sopenharmony_ci	pr_debug("Looking for gpu id 0x%x\n", args->gpu_id);
2948c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
2958c2ecf20Sopenharmony_ci	if (!dev) {
2968c2ecf20Sopenharmony_ci		pr_debug("Could not find gpu id 0x%x\n", args->gpu_id);
2978c2ecf20Sopenharmony_ci		return -EINVAL;
2988c2ecf20Sopenharmony_ci	}
2998c2ecf20Sopenharmony_ci
3008c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
3018c2ecf20Sopenharmony_ci
3028c2ecf20Sopenharmony_ci	pdd = kfd_bind_process_to_device(dev, p);
3038c2ecf20Sopenharmony_ci	if (IS_ERR(pdd)) {
3048c2ecf20Sopenharmony_ci		err = -ESRCH;
3058c2ecf20Sopenharmony_ci		goto err_bind_process;
3068c2ecf20Sopenharmony_ci	}
3078c2ecf20Sopenharmony_ci
3088c2ecf20Sopenharmony_ci	pr_debug("Creating queue for PASID 0x%x on gpu 0x%x\n",
3098c2ecf20Sopenharmony_ci			p->pasid,
3108c2ecf20Sopenharmony_ci			dev->id);
3118c2ecf20Sopenharmony_ci
3128c2ecf20Sopenharmony_ci	err = pqm_create_queue(&p->pqm, dev, filep, &q_properties, &queue_id,
3138c2ecf20Sopenharmony_ci			&doorbell_offset_in_process);
3148c2ecf20Sopenharmony_ci	if (err != 0)
3158c2ecf20Sopenharmony_ci		goto err_create_queue;
3168c2ecf20Sopenharmony_ci
3178c2ecf20Sopenharmony_ci	args->queue_id = queue_id;
3188c2ecf20Sopenharmony_ci
3198c2ecf20Sopenharmony_ci
3208c2ecf20Sopenharmony_ci	/* Return gpu_id as doorbell offset for mmap usage */
3218c2ecf20Sopenharmony_ci	args->doorbell_offset = KFD_MMAP_TYPE_DOORBELL;
3228c2ecf20Sopenharmony_ci	args->doorbell_offset |= KFD_MMAP_GPU_ID(args->gpu_id);
3238c2ecf20Sopenharmony_ci	if (KFD_IS_SOC15(dev->device_info->asic_family))
3248c2ecf20Sopenharmony_ci		/* On SOC15 ASICs, include the doorbell offset within the
3258c2ecf20Sopenharmony_ci		 * process doorbell frame, which is 2 pages.
3268c2ecf20Sopenharmony_ci		 */
3278c2ecf20Sopenharmony_ci		args->doorbell_offset |= doorbell_offset_in_process;
3288c2ecf20Sopenharmony_ci
3298c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
3308c2ecf20Sopenharmony_ci
3318c2ecf20Sopenharmony_ci	pr_debug("Queue id %d was created successfully\n", args->queue_id);
3328c2ecf20Sopenharmony_ci
3338c2ecf20Sopenharmony_ci	pr_debug("Ring buffer address == 0x%016llX\n",
3348c2ecf20Sopenharmony_ci			args->ring_base_address);
3358c2ecf20Sopenharmony_ci
3368c2ecf20Sopenharmony_ci	pr_debug("Read ptr address    == 0x%016llX\n",
3378c2ecf20Sopenharmony_ci			args->read_pointer_address);
3388c2ecf20Sopenharmony_ci
3398c2ecf20Sopenharmony_ci	pr_debug("Write ptr address   == 0x%016llX\n",
3408c2ecf20Sopenharmony_ci			args->write_pointer_address);
3418c2ecf20Sopenharmony_ci
3428c2ecf20Sopenharmony_ci	return 0;
3438c2ecf20Sopenharmony_ci
3448c2ecf20Sopenharmony_cierr_create_queue:
3458c2ecf20Sopenharmony_cierr_bind_process:
3468c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
3478c2ecf20Sopenharmony_ci	return err;
3488c2ecf20Sopenharmony_ci}
3498c2ecf20Sopenharmony_ci
3508c2ecf20Sopenharmony_cistatic int kfd_ioctl_destroy_queue(struct file *filp, struct kfd_process *p,
3518c2ecf20Sopenharmony_ci					void *data)
3528c2ecf20Sopenharmony_ci{
3538c2ecf20Sopenharmony_ci	int retval;
3548c2ecf20Sopenharmony_ci	struct kfd_ioctl_destroy_queue_args *args = data;
3558c2ecf20Sopenharmony_ci
3568c2ecf20Sopenharmony_ci	pr_debug("Destroying queue id %d for pasid 0x%x\n",
3578c2ecf20Sopenharmony_ci				args->queue_id,
3588c2ecf20Sopenharmony_ci				p->pasid);
3598c2ecf20Sopenharmony_ci
3608c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
3618c2ecf20Sopenharmony_ci
3628c2ecf20Sopenharmony_ci	retval = pqm_destroy_queue(&p->pqm, args->queue_id);
3638c2ecf20Sopenharmony_ci
3648c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
3658c2ecf20Sopenharmony_ci	return retval;
3668c2ecf20Sopenharmony_ci}
3678c2ecf20Sopenharmony_ci
3688c2ecf20Sopenharmony_cistatic int kfd_ioctl_update_queue(struct file *filp, struct kfd_process *p,
3698c2ecf20Sopenharmony_ci					void *data)
3708c2ecf20Sopenharmony_ci{
3718c2ecf20Sopenharmony_ci	int retval;
3728c2ecf20Sopenharmony_ci	struct kfd_ioctl_update_queue_args *args = data;
3738c2ecf20Sopenharmony_ci	struct queue_properties properties;
3748c2ecf20Sopenharmony_ci
3758c2ecf20Sopenharmony_ci	if (args->queue_percentage > KFD_MAX_QUEUE_PERCENTAGE) {
3768c2ecf20Sopenharmony_ci		pr_err("Queue percentage must be between 0 to KFD_MAX_QUEUE_PERCENTAGE\n");
3778c2ecf20Sopenharmony_ci		return -EINVAL;
3788c2ecf20Sopenharmony_ci	}
3798c2ecf20Sopenharmony_ci
3808c2ecf20Sopenharmony_ci	if (args->queue_priority > KFD_MAX_QUEUE_PRIORITY) {
3818c2ecf20Sopenharmony_ci		pr_err("Queue priority must be between 0 to KFD_MAX_QUEUE_PRIORITY\n");
3828c2ecf20Sopenharmony_ci		return -EINVAL;
3838c2ecf20Sopenharmony_ci	}
3848c2ecf20Sopenharmony_ci
3858c2ecf20Sopenharmony_ci	if ((args->ring_base_address) &&
3868c2ecf20Sopenharmony_ci		(!access_ok((const void __user *) args->ring_base_address,
3878c2ecf20Sopenharmony_ci			sizeof(uint64_t)))) {
3888c2ecf20Sopenharmony_ci		pr_err("Can't access ring base address\n");
3898c2ecf20Sopenharmony_ci		return -EFAULT;
3908c2ecf20Sopenharmony_ci	}
3918c2ecf20Sopenharmony_ci
3928c2ecf20Sopenharmony_ci	if (!is_power_of_2(args->ring_size) && (args->ring_size != 0)) {
3938c2ecf20Sopenharmony_ci		pr_err("Ring size must be a power of 2 or 0\n");
3948c2ecf20Sopenharmony_ci		return -EINVAL;
3958c2ecf20Sopenharmony_ci	}
3968c2ecf20Sopenharmony_ci
3978c2ecf20Sopenharmony_ci	properties.queue_address = args->ring_base_address;
3988c2ecf20Sopenharmony_ci	properties.queue_size = args->ring_size;
3998c2ecf20Sopenharmony_ci	properties.queue_percent = args->queue_percentage;
4008c2ecf20Sopenharmony_ci	properties.priority = args->queue_priority;
4018c2ecf20Sopenharmony_ci
4028c2ecf20Sopenharmony_ci	pr_debug("Updating queue id %d for pasid 0x%x\n",
4038c2ecf20Sopenharmony_ci			args->queue_id, p->pasid);
4048c2ecf20Sopenharmony_ci
4058c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
4068c2ecf20Sopenharmony_ci
4078c2ecf20Sopenharmony_ci	retval = pqm_update_queue(&p->pqm, args->queue_id, &properties);
4088c2ecf20Sopenharmony_ci
4098c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
4108c2ecf20Sopenharmony_ci
4118c2ecf20Sopenharmony_ci	return retval;
4128c2ecf20Sopenharmony_ci}
4138c2ecf20Sopenharmony_ci
4148c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_cu_mask(struct file *filp, struct kfd_process *p,
4158c2ecf20Sopenharmony_ci					void *data)
4168c2ecf20Sopenharmony_ci{
4178c2ecf20Sopenharmony_ci	int retval;
4188c2ecf20Sopenharmony_ci	const int max_num_cus = 1024;
4198c2ecf20Sopenharmony_ci	struct kfd_ioctl_set_cu_mask_args *args = data;
4208c2ecf20Sopenharmony_ci	struct queue_properties properties;
4218c2ecf20Sopenharmony_ci	uint32_t __user *cu_mask_ptr = (uint32_t __user *)args->cu_mask_ptr;
4228c2ecf20Sopenharmony_ci	size_t cu_mask_size = sizeof(uint32_t) * (args->num_cu_mask / 32);
4238c2ecf20Sopenharmony_ci
4248c2ecf20Sopenharmony_ci	if ((args->num_cu_mask % 32) != 0) {
4258c2ecf20Sopenharmony_ci		pr_debug("num_cu_mask 0x%x must be a multiple of 32",
4268c2ecf20Sopenharmony_ci				args->num_cu_mask);
4278c2ecf20Sopenharmony_ci		return -EINVAL;
4288c2ecf20Sopenharmony_ci	}
4298c2ecf20Sopenharmony_ci
4308c2ecf20Sopenharmony_ci	properties.cu_mask_count = args->num_cu_mask;
4318c2ecf20Sopenharmony_ci	if (properties.cu_mask_count == 0) {
4328c2ecf20Sopenharmony_ci		pr_debug("CU mask cannot be 0");
4338c2ecf20Sopenharmony_ci		return -EINVAL;
4348c2ecf20Sopenharmony_ci	}
4358c2ecf20Sopenharmony_ci
4368c2ecf20Sopenharmony_ci	/* To prevent an unreasonably large CU mask size, set an arbitrary
4378c2ecf20Sopenharmony_ci	 * limit of max_num_cus bits.  We can then just drop any CU mask bits
4388c2ecf20Sopenharmony_ci	 * past max_num_cus bits and just use the first max_num_cus bits.
4398c2ecf20Sopenharmony_ci	 */
4408c2ecf20Sopenharmony_ci	if (properties.cu_mask_count > max_num_cus) {
4418c2ecf20Sopenharmony_ci		pr_debug("CU mask cannot be greater than 1024 bits");
4428c2ecf20Sopenharmony_ci		properties.cu_mask_count = max_num_cus;
4438c2ecf20Sopenharmony_ci		cu_mask_size = sizeof(uint32_t) * (max_num_cus/32);
4448c2ecf20Sopenharmony_ci	}
4458c2ecf20Sopenharmony_ci
4468c2ecf20Sopenharmony_ci	properties.cu_mask = kzalloc(cu_mask_size, GFP_KERNEL);
4478c2ecf20Sopenharmony_ci	if (!properties.cu_mask)
4488c2ecf20Sopenharmony_ci		return -ENOMEM;
4498c2ecf20Sopenharmony_ci
4508c2ecf20Sopenharmony_ci	retval = copy_from_user(properties.cu_mask, cu_mask_ptr, cu_mask_size);
4518c2ecf20Sopenharmony_ci	if (retval) {
4528c2ecf20Sopenharmony_ci		pr_debug("Could not copy CU mask from userspace");
4538c2ecf20Sopenharmony_ci		kfree(properties.cu_mask);
4548c2ecf20Sopenharmony_ci		return -EFAULT;
4558c2ecf20Sopenharmony_ci	}
4568c2ecf20Sopenharmony_ci
4578c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
4588c2ecf20Sopenharmony_ci
4598c2ecf20Sopenharmony_ci	retval = pqm_set_cu_mask(&p->pqm, args->queue_id, &properties);
4608c2ecf20Sopenharmony_ci
4618c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
4628c2ecf20Sopenharmony_ci
4638c2ecf20Sopenharmony_ci	if (retval)
4648c2ecf20Sopenharmony_ci		kfree(properties.cu_mask);
4658c2ecf20Sopenharmony_ci
4668c2ecf20Sopenharmony_ci	return retval;
4678c2ecf20Sopenharmony_ci}
4688c2ecf20Sopenharmony_ci
4698c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_queue_wave_state(struct file *filep,
4708c2ecf20Sopenharmony_ci					  struct kfd_process *p, void *data)
4718c2ecf20Sopenharmony_ci{
4728c2ecf20Sopenharmony_ci	struct kfd_ioctl_get_queue_wave_state_args *args = data;
4738c2ecf20Sopenharmony_ci	int r;
4748c2ecf20Sopenharmony_ci
4758c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
4768c2ecf20Sopenharmony_ci
4778c2ecf20Sopenharmony_ci	r = pqm_get_wave_state(&p->pqm, args->queue_id,
4788c2ecf20Sopenharmony_ci			       (void __user *)args->ctl_stack_address,
4798c2ecf20Sopenharmony_ci			       &args->ctl_stack_used_size,
4808c2ecf20Sopenharmony_ci			       &args->save_area_used_size);
4818c2ecf20Sopenharmony_ci
4828c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
4838c2ecf20Sopenharmony_ci
4848c2ecf20Sopenharmony_ci	return r;
4858c2ecf20Sopenharmony_ci}
4868c2ecf20Sopenharmony_ci
4878c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_memory_policy(struct file *filep,
4888c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
4898c2ecf20Sopenharmony_ci{
4908c2ecf20Sopenharmony_ci	struct kfd_ioctl_set_memory_policy_args *args = data;
4918c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
4928c2ecf20Sopenharmony_ci	int err = 0;
4938c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
4948c2ecf20Sopenharmony_ci	enum cache_policy default_policy, alternate_policy;
4958c2ecf20Sopenharmony_ci
4968c2ecf20Sopenharmony_ci	if (args->default_policy != KFD_IOC_CACHE_POLICY_COHERENT
4978c2ecf20Sopenharmony_ci	    && args->default_policy != KFD_IOC_CACHE_POLICY_NONCOHERENT) {
4988c2ecf20Sopenharmony_ci		return -EINVAL;
4998c2ecf20Sopenharmony_ci	}
5008c2ecf20Sopenharmony_ci
5018c2ecf20Sopenharmony_ci	if (args->alternate_policy != KFD_IOC_CACHE_POLICY_COHERENT
5028c2ecf20Sopenharmony_ci	    && args->alternate_policy != KFD_IOC_CACHE_POLICY_NONCOHERENT) {
5038c2ecf20Sopenharmony_ci		return -EINVAL;
5048c2ecf20Sopenharmony_ci	}
5058c2ecf20Sopenharmony_ci
5068c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
5078c2ecf20Sopenharmony_ci	if (!dev)
5088c2ecf20Sopenharmony_ci		return -EINVAL;
5098c2ecf20Sopenharmony_ci
5108c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
5118c2ecf20Sopenharmony_ci
5128c2ecf20Sopenharmony_ci	pdd = kfd_bind_process_to_device(dev, p);
5138c2ecf20Sopenharmony_ci	if (IS_ERR(pdd)) {
5148c2ecf20Sopenharmony_ci		err = -ESRCH;
5158c2ecf20Sopenharmony_ci		goto out;
5168c2ecf20Sopenharmony_ci	}
5178c2ecf20Sopenharmony_ci
5188c2ecf20Sopenharmony_ci	default_policy = (args->default_policy == KFD_IOC_CACHE_POLICY_COHERENT)
5198c2ecf20Sopenharmony_ci			 ? cache_policy_coherent : cache_policy_noncoherent;
5208c2ecf20Sopenharmony_ci
5218c2ecf20Sopenharmony_ci	alternate_policy =
5228c2ecf20Sopenharmony_ci		(args->alternate_policy == KFD_IOC_CACHE_POLICY_COHERENT)
5238c2ecf20Sopenharmony_ci		   ? cache_policy_coherent : cache_policy_noncoherent;
5248c2ecf20Sopenharmony_ci
5258c2ecf20Sopenharmony_ci	if (!dev->dqm->ops.set_cache_memory_policy(dev->dqm,
5268c2ecf20Sopenharmony_ci				&pdd->qpd,
5278c2ecf20Sopenharmony_ci				default_policy,
5288c2ecf20Sopenharmony_ci				alternate_policy,
5298c2ecf20Sopenharmony_ci				(void __user *)args->alternate_aperture_base,
5308c2ecf20Sopenharmony_ci				args->alternate_aperture_size))
5318c2ecf20Sopenharmony_ci		err = -EINVAL;
5328c2ecf20Sopenharmony_ci
5338c2ecf20Sopenharmony_ciout:
5348c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
5358c2ecf20Sopenharmony_ci
5368c2ecf20Sopenharmony_ci	return err;
5378c2ecf20Sopenharmony_ci}
5388c2ecf20Sopenharmony_ci
5398c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_trap_handler(struct file *filep,
5408c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
5418c2ecf20Sopenharmony_ci{
5428c2ecf20Sopenharmony_ci	struct kfd_ioctl_set_trap_handler_args *args = data;
5438c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
5448c2ecf20Sopenharmony_ci	int err = 0;
5458c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
5468c2ecf20Sopenharmony_ci
5478c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
5488c2ecf20Sopenharmony_ci	if (!dev)
5498c2ecf20Sopenharmony_ci		return -EINVAL;
5508c2ecf20Sopenharmony_ci
5518c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
5528c2ecf20Sopenharmony_ci
5538c2ecf20Sopenharmony_ci	pdd = kfd_bind_process_to_device(dev, p);
5548c2ecf20Sopenharmony_ci	if (IS_ERR(pdd)) {
5558c2ecf20Sopenharmony_ci		err = -ESRCH;
5568c2ecf20Sopenharmony_ci		goto out;
5578c2ecf20Sopenharmony_ci	}
5588c2ecf20Sopenharmony_ci
5598c2ecf20Sopenharmony_ci	if (dev->dqm->ops.set_trap_handler(dev->dqm,
5608c2ecf20Sopenharmony_ci					&pdd->qpd,
5618c2ecf20Sopenharmony_ci					args->tba_addr,
5628c2ecf20Sopenharmony_ci					args->tma_addr))
5638c2ecf20Sopenharmony_ci		err = -EINVAL;
5648c2ecf20Sopenharmony_ci
5658c2ecf20Sopenharmony_ciout:
5668c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
5678c2ecf20Sopenharmony_ci
5688c2ecf20Sopenharmony_ci	return err;
5698c2ecf20Sopenharmony_ci}
5708c2ecf20Sopenharmony_ci
5718c2ecf20Sopenharmony_cistatic int kfd_ioctl_dbg_register(struct file *filep,
5728c2ecf20Sopenharmony_ci				struct kfd_process *p, void *data)
5738c2ecf20Sopenharmony_ci{
5748c2ecf20Sopenharmony_ci	struct kfd_ioctl_dbg_register_args *args = data;
5758c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
5768c2ecf20Sopenharmony_ci	struct kfd_dbgmgr *dbgmgr_ptr;
5778c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
5788c2ecf20Sopenharmony_ci	bool create_ok;
5798c2ecf20Sopenharmony_ci	long status = 0;
5808c2ecf20Sopenharmony_ci
5818c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
5828c2ecf20Sopenharmony_ci	if (!dev)
5838c2ecf20Sopenharmony_ci		return -EINVAL;
5848c2ecf20Sopenharmony_ci
5858c2ecf20Sopenharmony_ci	if (dev->device_info->asic_family == CHIP_CARRIZO) {
5868c2ecf20Sopenharmony_ci		pr_debug("kfd_ioctl_dbg_register not supported on CZ\n");
5878c2ecf20Sopenharmony_ci		return -EINVAL;
5888c2ecf20Sopenharmony_ci	}
5898c2ecf20Sopenharmony_ci
5908c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
5918c2ecf20Sopenharmony_ci	mutex_lock(kfd_get_dbgmgr_mutex());
5928c2ecf20Sopenharmony_ci
5938c2ecf20Sopenharmony_ci	/*
5948c2ecf20Sopenharmony_ci	 * make sure that we have pdd, if this the first queue created for
5958c2ecf20Sopenharmony_ci	 * this process
5968c2ecf20Sopenharmony_ci	 */
5978c2ecf20Sopenharmony_ci	pdd = kfd_bind_process_to_device(dev, p);
5988c2ecf20Sopenharmony_ci	if (IS_ERR(pdd)) {
5998c2ecf20Sopenharmony_ci		status = PTR_ERR(pdd);
6008c2ecf20Sopenharmony_ci		goto out;
6018c2ecf20Sopenharmony_ci	}
6028c2ecf20Sopenharmony_ci
6038c2ecf20Sopenharmony_ci	if (!dev->dbgmgr) {
6048c2ecf20Sopenharmony_ci		/* In case of a legal call, we have no dbgmgr yet */
6058c2ecf20Sopenharmony_ci		create_ok = kfd_dbgmgr_create(&dbgmgr_ptr, dev);
6068c2ecf20Sopenharmony_ci		if (create_ok) {
6078c2ecf20Sopenharmony_ci			status = kfd_dbgmgr_register(dbgmgr_ptr, p);
6088c2ecf20Sopenharmony_ci			if (status != 0)
6098c2ecf20Sopenharmony_ci				kfd_dbgmgr_destroy(dbgmgr_ptr);
6108c2ecf20Sopenharmony_ci			else
6118c2ecf20Sopenharmony_ci				dev->dbgmgr = dbgmgr_ptr;
6128c2ecf20Sopenharmony_ci		}
6138c2ecf20Sopenharmony_ci	} else {
6148c2ecf20Sopenharmony_ci		pr_debug("debugger already registered\n");
6158c2ecf20Sopenharmony_ci		status = -EINVAL;
6168c2ecf20Sopenharmony_ci	}
6178c2ecf20Sopenharmony_ci
6188c2ecf20Sopenharmony_ciout:
6198c2ecf20Sopenharmony_ci	mutex_unlock(kfd_get_dbgmgr_mutex());
6208c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
6218c2ecf20Sopenharmony_ci
6228c2ecf20Sopenharmony_ci	return status;
6238c2ecf20Sopenharmony_ci}
6248c2ecf20Sopenharmony_ci
6258c2ecf20Sopenharmony_cistatic int kfd_ioctl_dbg_unregister(struct file *filep,
6268c2ecf20Sopenharmony_ci				struct kfd_process *p, void *data)
6278c2ecf20Sopenharmony_ci{
6288c2ecf20Sopenharmony_ci	struct kfd_ioctl_dbg_unregister_args *args = data;
6298c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
6308c2ecf20Sopenharmony_ci	long status;
6318c2ecf20Sopenharmony_ci
6328c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
6338c2ecf20Sopenharmony_ci	if (!dev || !dev->dbgmgr)
6348c2ecf20Sopenharmony_ci		return -EINVAL;
6358c2ecf20Sopenharmony_ci
6368c2ecf20Sopenharmony_ci	if (dev->device_info->asic_family == CHIP_CARRIZO) {
6378c2ecf20Sopenharmony_ci		pr_debug("kfd_ioctl_dbg_unregister not supported on CZ\n");
6388c2ecf20Sopenharmony_ci		return -EINVAL;
6398c2ecf20Sopenharmony_ci	}
6408c2ecf20Sopenharmony_ci
6418c2ecf20Sopenharmony_ci	mutex_lock(kfd_get_dbgmgr_mutex());
6428c2ecf20Sopenharmony_ci
6438c2ecf20Sopenharmony_ci	status = kfd_dbgmgr_unregister(dev->dbgmgr, p);
6448c2ecf20Sopenharmony_ci	if (!status) {
6458c2ecf20Sopenharmony_ci		kfd_dbgmgr_destroy(dev->dbgmgr);
6468c2ecf20Sopenharmony_ci		dev->dbgmgr = NULL;
6478c2ecf20Sopenharmony_ci	}
6488c2ecf20Sopenharmony_ci
6498c2ecf20Sopenharmony_ci	mutex_unlock(kfd_get_dbgmgr_mutex());
6508c2ecf20Sopenharmony_ci
6518c2ecf20Sopenharmony_ci	return status;
6528c2ecf20Sopenharmony_ci}
6538c2ecf20Sopenharmony_ci
6548c2ecf20Sopenharmony_ci/*
6558c2ecf20Sopenharmony_ci * Parse and generate variable size data structure for address watch.
6568c2ecf20Sopenharmony_ci * Total size of the buffer and # watch points is limited in order
6578c2ecf20Sopenharmony_ci * to prevent kernel abuse. (no bearing to the much smaller HW limitation
6588c2ecf20Sopenharmony_ci * which is enforced by dbgdev module)
6598c2ecf20Sopenharmony_ci * please also note that the watch address itself are not "copied from user",
6608c2ecf20Sopenharmony_ci * since it be set into the HW in user mode values.
6618c2ecf20Sopenharmony_ci *
6628c2ecf20Sopenharmony_ci */
6638c2ecf20Sopenharmony_cistatic int kfd_ioctl_dbg_address_watch(struct file *filep,
6648c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
6658c2ecf20Sopenharmony_ci{
6668c2ecf20Sopenharmony_ci	struct kfd_ioctl_dbg_address_watch_args *args = data;
6678c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
6688c2ecf20Sopenharmony_ci	struct dbg_address_watch_info aw_info;
6698c2ecf20Sopenharmony_ci	unsigned char *args_buff;
6708c2ecf20Sopenharmony_ci	long status;
6718c2ecf20Sopenharmony_ci	void __user *cmd_from_user;
6728c2ecf20Sopenharmony_ci	uint64_t watch_mask_value = 0;
6738c2ecf20Sopenharmony_ci	unsigned int args_idx = 0;
6748c2ecf20Sopenharmony_ci
6758c2ecf20Sopenharmony_ci	memset((void *) &aw_info, 0, sizeof(struct dbg_address_watch_info));
6768c2ecf20Sopenharmony_ci
6778c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
6788c2ecf20Sopenharmony_ci	if (!dev)
6798c2ecf20Sopenharmony_ci		return -EINVAL;
6808c2ecf20Sopenharmony_ci
6818c2ecf20Sopenharmony_ci	if (dev->device_info->asic_family == CHIP_CARRIZO) {
6828c2ecf20Sopenharmony_ci		pr_debug("kfd_ioctl_dbg_wave_control not supported on CZ\n");
6838c2ecf20Sopenharmony_ci		return -EINVAL;
6848c2ecf20Sopenharmony_ci	}
6858c2ecf20Sopenharmony_ci
6868c2ecf20Sopenharmony_ci	cmd_from_user = (void __user *) args->content_ptr;
6878c2ecf20Sopenharmony_ci
6888c2ecf20Sopenharmony_ci	/* Validate arguments */
6898c2ecf20Sopenharmony_ci
6908c2ecf20Sopenharmony_ci	if ((args->buf_size_in_bytes > MAX_ALLOWED_AW_BUFF_SIZE) ||
6918c2ecf20Sopenharmony_ci		(args->buf_size_in_bytes <= sizeof(*args) + sizeof(int) * 2) ||
6928c2ecf20Sopenharmony_ci		(cmd_from_user == NULL))
6938c2ecf20Sopenharmony_ci		return -EINVAL;
6948c2ecf20Sopenharmony_ci
6958c2ecf20Sopenharmony_ci	/* this is the actual buffer to work with */
6968c2ecf20Sopenharmony_ci	args_buff = memdup_user(cmd_from_user,
6978c2ecf20Sopenharmony_ci				args->buf_size_in_bytes - sizeof(*args));
6988c2ecf20Sopenharmony_ci	if (IS_ERR(args_buff))
6998c2ecf20Sopenharmony_ci		return PTR_ERR(args_buff);
7008c2ecf20Sopenharmony_ci
7018c2ecf20Sopenharmony_ci	aw_info.process = p;
7028c2ecf20Sopenharmony_ci
7038c2ecf20Sopenharmony_ci	aw_info.num_watch_points = *((uint32_t *)(&args_buff[args_idx]));
7048c2ecf20Sopenharmony_ci	args_idx += sizeof(aw_info.num_watch_points);
7058c2ecf20Sopenharmony_ci
7068c2ecf20Sopenharmony_ci	aw_info.watch_mode = (enum HSA_DBG_WATCH_MODE *) &args_buff[args_idx];
7078c2ecf20Sopenharmony_ci	args_idx += sizeof(enum HSA_DBG_WATCH_MODE) * aw_info.num_watch_points;
7088c2ecf20Sopenharmony_ci
7098c2ecf20Sopenharmony_ci	/*
7108c2ecf20Sopenharmony_ci	 * set watch address base pointer to point on the array base
7118c2ecf20Sopenharmony_ci	 * within args_buff
7128c2ecf20Sopenharmony_ci	 */
7138c2ecf20Sopenharmony_ci	aw_info.watch_address = (uint64_t *) &args_buff[args_idx];
7148c2ecf20Sopenharmony_ci
7158c2ecf20Sopenharmony_ci	/* skip over the addresses buffer */
7168c2ecf20Sopenharmony_ci	args_idx += sizeof(aw_info.watch_address) * aw_info.num_watch_points;
7178c2ecf20Sopenharmony_ci
7188c2ecf20Sopenharmony_ci	if (args_idx >= args->buf_size_in_bytes - sizeof(*args)) {
7198c2ecf20Sopenharmony_ci		status = -EINVAL;
7208c2ecf20Sopenharmony_ci		goto out;
7218c2ecf20Sopenharmony_ci	}
7228c2ecf20Sopenharmony_ci
7238c2ecf20Sopenharmony_ci	watch_mask_value = (uint64_t) args_buff[args_idx];
7248c2ecf20Sopenharmony_ci
7258c2ecf20Sopenharmony_ci	if (watch_mask_value > 0) {
7268c2ecf20Sopenharmony_ci		/*
7278c2ecf20Sopenharmony_ci		 * There is an array of masks.
7288c2ecf20Sopenharmony_ci		 * set watch mask base pointer to point on the array base
7298c2ecf20Sopenharmony_ci		 * within args_buff
7308c2ecf20Sopenharmony_ci		 */
7318c2ecf20Sopenharmony_ci		aw_info.watch_mask = (uint64_t *) &args_buff[args_idx];
7328c2ecf20Sopenharmony_ci
7338c2ecf20Sopenharmony_ci		/* skip over the masks buffer */
7348c2ecf20Sopenharmony_ci		args_idx += sizeof(aw_info.watch_mask) *
7358c2ecf20Sopenharmony_ci				aw_info.num_watch_points;
7368c2ecf20Sopenharmony_ci	} else {
7378c2ecf20Sopenharmony_ci		/* just the NULL mask, set to NULL and skip over it */
7388c2ecf20Sopenharmony_ci		aw_info.watch_mask = NULL;
7398c2ecf20Sopenharmony_ci		args_idx += sizeof(aw_info.watch_mask);
7408c2ecf20Sopenharmony_ci	}
7418c2ecf20Sopenharmony_ci
7428c2ecf20Sopenharmony_ci	if (args_idx >= args->buf_size_in_bytes - sizeof(args)) {
7438c2ecf20Sopenharmony_ci		status = -EINVAL;
7448c2ecf20Sopenharmony_ci		goto out;
7458c2ecf20Sopenharmony_ci	}
7468c2ecf20Sopenharmony_ci
7478c2ecf20Sopenharmony_ci	/* Currently HSA Event is not supported for DBG */
7488c2ecf20Sopenharmony_ci	aw_info.watch_event = NULL;
7498c2ecf20Sopenharmony_ci
7508c2ecf20Sopenharmony_ci	mutex_lock(kfd_get_dbgmgr_mutex());
7518c2ecf20Sopenharmony_ci
7528c2ecf20Sopenharmony_ci	status = kfd_dbgmgr_address_watch(dev->dbgmgr, &aw_info);
7538c2ecf20Sopenharmony_ci
7548c2ecf20Sopenharmony_ci	mutex_unlock(kfd_get_dbgmgr_mutex());
7558c2ecf20Sopenharmony_ci
7568c2ecf20Sopenharmony_ciout:
7578c2ecf20Sopenharmony_ci	kfree(args_buff);
7588c2ecf20Sopenharmony_ci
7598c2ecf20Sopenharmony_ci	return status;
7608c2ecf20Sopenharmony_ci}
7618c2ecf20Sopenharmony_ci
7628c2ecf20Sopenharmony_ci/* Parse and generate fixed size data structure for wave control */
7638c2ecf20Sopenharmony_cistatic int kfd_ioctl_dbg_wave_control(struct file *filep,
7648c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
7658c2ecf20Sopenharmony_ci{
7668c2ecf20Sopenharmony_ci	struct kfd_ioctl_dbg_wave_control_args *args = data;
7678c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
7688c2ecf20Sopenharmony_ci	struct dbg_wave_control_info wac_info;
7698c2ecf20Sopenharmony_ci	unsigned char *args_buff;
7708c2ecf20Sopenharmony_ci	uint32_t computed_buff_size;
7718c2ecf20Sopenharmony_ci	long status;
7728c2ecf20Sopenharmony_ci	void __user *cmd_from_user;
7738c2ecf20Sopenharmony_ci	unsigned int args_idx = 0;
7748c2ecf20Sopenharmony_ci
7758c2ecf20Sopenharmony_ci	memset((void *) &wac_info, 0, sizeof(struct dbg_wave_control_info));
7768c2ecf20Sopenharmony_ci
7778c2ecf20Sopenharmony_ci	/* we use compact form, independent of the packing attribute value */
7788c2ecf20Sopenharmony_ci	computed_buff_size = sizeof(*args) +
7798c2ecf20Sopenharmony_ci				sizeof(wac_info.mode) +
7808c2ecf20Sopenharmony_ci				sizeof(wac_info.operand) +
7818c2ecf20Sopenharmony_ci				sizeof(wac_info.dbgWave_msg.DbgWaveMsg) +
7828c2ecf20Sopenharmony_ci				sizeof(wac_info.dbgWave_msg.MemoryVA) +
7838c2ecf20Sopenharmony_ci				sizeof(wac_info.trapId);
7848c2ecf20Sopenharmony_ci
7858c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
7868c2ecf20Sopenharmony_ci	if (!dev)
7878c2ecf20Sopenharmony_ci		return -EINVAL;
7888c2ecf20Sopenharmony_ci
7898c2ecf20Sopenharmony_ci	if (dev->device_info->asic_family == CHIP_CARRIZO) {
7908c2ecf20Sopenharmony_ci		pr_debug("kfd_ioctl_dbg_wave_control not supported on CZ\n");
7918c2ecf20Sopenharmony_ci		return -EINVAL;
7928c2ecf20Sopenharmony_ci	}
7938c2ecf20Sopenharmony_ci
7948c2ecf20Sopenharmony_ci	/* input size must match the computed "compact" size */
7958c2ecf20Sopenharmony_ci	if (args->buf_size_in_bytes != computed_buff_size) {
7968c2ecf20Sopenharmony_ci		pr_debug("size mismatch, computed : actual %u : %u\n",
7978c2ecf20Sopenharmony_ci				args->buf_size_in_bytes, computed_buff_size);
7988c2ecf20Sopenharmony_ci		return -EINVAL;
7998c2ecf20Sopenharmony_ci	}
8008c2ecf20Sopenharmony_ci
8018c2ecf20Sopenharmony_ci	cmd_from_user = (void __user *) args->content_ptr;
8028c2ecf20Sopenharmony_ci
8038c2ecf20Sopenharmony_ci	if (cmd_from_user == NULL)
8048c2ecf20Sopenharmony_ci		return -EINVAL;
8058c2ecf20Sopenharmony_ci
8068c2ecf20Sopenharmony_ci	/* copy the entire buffer from user */
8078c2ecf20Sopenharmony_ci
8088c2ecf20Sopenharmony_ci	args_buff = memdup_user(cmd_from_user,
8098c2ecf20Sopenharmony_ci				args->buf_size_in_bytes - sizeof(*args));
8108c2ecf20Sopenharmony_ci	if (IS_ERR(args_buff))
8118c2ecf20Sopenharmony_ci		return PTR_ERR(args_buff);
8128c2ecf20Sopenharmony_ci
8138c2ecf20Sopenharmony_ci	/* move ptr to the start of the "pay-load" area */
8148c2ecf20Sopenharmony_ci	wac_info.process = p;
8158c2ecf20Sopenharmony_ci
8168c2ecf20Sopenharmony_ci	wac_info.operand = *((enum HSA_DBG_WAVEOP *)(&args_buff[args_idx]));
8178c2ecf20Sopenharmony_ci	args_idx += sizeof(wac_info.operand);
8188c2ecf20Sopenharmony_ci
8198c2ecf20Sopenharmony_ci	wac_info.mode = *((enum HSA_DBG_WAVEMODE *)(&args_buff[args_idx]));
8208c2ecf20Sopenharmony_ci	args_idx += sizeof(wac_info.mode);
8218c2ecf20Sopenharmony_ci
8228c2ecf20Sopenharmony_ci	wac_info.trapId = *((uint32_t *)(&args_buff[args_idx]));
8238c2ecf20Sopenharmony_ci	args_idx += sizeof(wac_info.trapId);
8248c2ecf20Sopenharmony_ci
8258c2ecf20Sopenharmony_ci	wac_info.dbgWave_msg.DbgWaveMsg.WaveMsgInfoGen2.Value =
8268c2ecf20Sopenharmony_ci					*((uint32_t *)(&args_buff[args_idx]));
8278c2ecf20Sopenharmony_ci	wac_info.dbgWave_msg.MemoryVA = NULL;
8288c2ecf20Sopenharmony_ci
8298c2ecf20Sopenharmony_ci	mutex_lock(kfd_get_dbgmgr_mutex());
8308c2ecf20Sopenharmony_ci
8318c2ecf20Sopenharmony_ci	pr_debug("Calling dbg manager process %p, operand %u, mode %u, trapId %u, message %u\n",
8328c2ecf20Sopenharmony_ci			wac_info.process, wac_info.operand,
8338c2ecf20Sopenharmony_ci			wac_info.mode, wac_info.trapId,
8348c2ecf20Sopenharmony_ci			wac_info.dbgWave_msg.DbgWaveMsg.WaveMsgInfoGen2.Value);
8358c2ecf20Sopenharmony_ci
8368c2ecf20Sopenharmony_ci	status = kfd_dbgmgr_wave_control(dev->dbgmgr, &wac_info);
8378c2ecf20Sopenharmony_ci
8388c2ecf20Sopenharmony_ci	pr_debug("Returned status of dbg manager is %ld\n", status);
8398c2ecf20Sopenharmony_ci
8408c2ecf20Sopenharmony_ci	mutex_unlock(kfd_get_dbgmgr_mutex());
8418c2ecf20Sopenharmony_ci
8428c2ecf20Sopenharmony_ci	kfree(args_buff);
8438c2ecf20Sopenharmony_ci
8448c2ecf20Sopenharmony_ci	return status;
8458c2ecf20Sopenharmony_ci}
8468c2ecf20Sopenharmony_ci
8478c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_clock_counters(struct file *filep,
8488c2ecf20Sopenharmony_ci				struct kfd_process *p, void *data)
8498c2ecf20Sopenharmony_ci{
8508c2ecf20Sopenharmony_ci	struct kfd_ioctl_get_clock_counters_args *args = data;
8518c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
8528c2ecf20Sopenharmony_ci
8538c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
8548c2ecf20Sopenharmony_ci	if (dev)
8558c2ecf20Sopenharmony_ci		/* Reading GPU clock counter from KGD */
8568c2ecf20Sopenharmony_ci		args->gpu_clock_counter = amdgpu_amdkfd_get_gpu_clock_counter(dev->kgd);
8578c2ecf20Sopenharmony_ci	else
8588c2ecf20Sopenharmony_ci		/* Node without GPU resource */
8598c2ecf20Sopenharmony_ci		args->gpu_clock_counter = 0;
8608c2ecf20Sopenharmony_ci
8618c2ecf20Sopenharmony_ci	/* No access to rdtsc. Using raw monotonic time */
8628c2ecf20Sopenharmony_ci	args->cpu_clock_counter = ktime_get_raw_ns();
8638c2ecf20Sopenharmony_ci	args->system_clock_counter = ktime_get_boottime_ns();
8648c2ecf20Sopenharmony_ci
8658c2ecf20Sopenharmony_ci	/* Since the counter is in nano-seconds we use 1GHz frequency */
8668c2ecf20Sopenharmony_ci	args->system_clock_freq = 1000000000;
8678c2ecf20Sopenharmony_ci
8688c2ecf20Sopenharmony_ci	return 0;
8698c2ecf20Sopenharmony_ci}
8708c2ecf20Sopenharmony_ci
8718c2ecf20Sopenharmony_ci
8728c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_process_apertures(struct file *filp,
8738c2ecf20Sopenharmony_ci				struct kfd_process *p, void *data)
8748c2ecf20Sopenharmony_ci{
8758c2ecf20Sopenharmony_ci	struct kfd_ioctl_get_process_apertures_args *args = data;
8768c2ecf20Sopenharmony_ci	struct kfd_process_device_apertures *pAperture;
8778c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
8788c2ecf20Sopenharmony_ci
8798c2ecf20Sopenharmony_ci	dev_dbg(kfd_device, "get apertures for PASID 0x%x", p->pasid);
8808c2ecf20Sopenharmony_ci
8818c2ecf20Sopenharmony_ci	args->num_of_nodes = 0;
8828c2ecf20Sopenharmony_ci
8838c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
8848c2ecf20Sopenharmony_ci
8858c2ecf20Sopenharmony_ci	/*if the process-device list isn't empty*/
8868c2ecf20Sopenharmony_ci	if (kfd_has_process_device_data(p)) {
8878c2ecf20Sopenharmony_ci		/* Run over all pdd of the process */
8888c2ecf20Sopenharmony_ci		pdd = kfd_get_first_process_device_data(p);
8898c2ecf20Sopenharmony_ci		do {
8908c2ecf20Sopenharmony_ci			pAperture =
8918c2ecf20Sopenharmony_ci				&args->process_apertures[args->num_of_nodes];
8928c2ecf20Sopenharmony_ci			pAperture->gpu_id = pdd->dev->id;
8938c2ecf20Sopenharmony_ci			pAperture->lds_base = pdd->lds_base;
8948c2ecf20Sopenharmony_ci			pAperture->lds_limit = pdd->lds_limit;
8958c2ecf20Sopenharmony_ci			pAperture->gpuvm_base = pdd->gpuvm_base;
8968c2ecf20Sopenharmony_ci			pAperture->gpuvm_limit = pdd->gpuvm_limit;
8978c2ecf20Sopenharmony_ci			pAperture->scratch_base = pdd->scratch_base;
8988c2ecf20Sopenharmony_ci			pAperture->scratch_limit = pdd->scratch_limit;
8998c2ecf20Sopenharmony_ci
9008c2ecf20Sopenharmony_ci			dev_dbg(kfd_device,
9018c2ecf20Sopenharmony_ci				"node id %u\n", args->num_of_nodes);
9028c2ecf20Sopenharmony_ci			dev_dbg(kfd_device,
9038c2ecf20Sopenharmony_ci				"gpu id %u\n", pdd->dev->id);
9048c2ecf20Sopenharmony_ci			dev_dbg(kfd_device,
9058c2ecf20Sopenharmony_ci				"lds_base %llX\n", pdd->lds_base);
9068c2ecf20Sopenharmony_ci			dev_dbg(kfd_device,
9078c2ecf20Sopenharmony_ci				"lds_limit %llX\n", pdd->lds_limit);
9088c2ecf20Sopenharmony_ci			dev_dbg(kfd_device,
9098c2ecf20Sopenharmony_ci				"gpuvm_base %llX\n", pdd->gpuvm_base);
9108c2ecf20Sopenharmony_ci			dev_dbg(kfd_device,
9118c2ecf20Sopenharmony_ci				"gpuvm_limit %llX\n", pdd->gpuvm_limit);
9128c2ecf20Sopenharmony_ci			dev_dbg(kfd_device,
9138c2ecf20Sopenharmony_ci				"scratch_base %llX\n", pdd->scratch_base);
9148c2ecf20Sopenharmony_ci			dev_dbg(kfd_device,
9158c2ecf20Sopenharmony_ci				"scratch_limit %llX\n", pdd->scratch_limit);
9168c2ecf20Sopenharmony_ci
9178c2ecf20Sopenharmony_ci			args->num_of_nodes++;
9188c2ecf20Sopenharmony_ci
9198c2ecf20Sopenharmony_ci			pdd = kfd_get_next_process_device_data(p, pdd);
9208c2ecf20Sopenharmony_ci		} while (pdd && (args->num_of_nodes < NUM_OF_SUPPORTED_GPUS));
9218c2ecf20Sopenharmony_ci	}
9228c2ecf20Sopenharmony_ci
9238c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
9248c2ecf20Sopenharmony_ci
9258c2ecf20Sopenharmony_ci	return 0;
9268c2ecf20Sopenharmony_ci}
9278c2ecf20Sopenharmony_ci
9288c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_process_apertures_new(struct file *filp,
9298c2ecf20Sopenharmony_ci				struct kfd_process *p, void *data)
9308c2ecf20Sopenharmony_ci{
9318c2ecf20Sopenharmony_ci	struct kfd_ioctl_get_process_apertures_new_args *args = data;
9328c2ecf20Sopenharmony_ci	struct kfd_process_device_apertures *pa;
9338c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
9348c2ecf20Sopenharmony_ci	uint32_t nodes = 0;
9358c2ecf20Sopenharmony_ci	int ret;
9368c2ecf20Sopenharmony_ci
9378c2ecf20Sopenharmony_ci	dev_dbg(kfd_device, "get apertures for PASID 0x%x", p->pasid);
9388c2ecf20Sopenharmony_ci
9398c2ecf20Sopenharmony_ci	if (args->num_of_nodes == 0) {
9408c2ecf20Sopenharmony_ci		/* Return number of nodes, so that user space can alloacate
9418c2ecf20Sopenharmony_ci		 * sufficient memory
9428c2ecf20Sopenharmony_ci		 */
9438c2ecf20Sopenharmony_ci		mutex_lock(&p->mutex);
9448c2ecf20Sopenharmony_ci
9458c2ecf20Sopenharmony_ci		if (!kfd_has_process_device_data(p))
9468c2ecf20Sopenharmony_ci			goto out_unlock;
9478c2ecf20Sopenharmony_ci
9488c2ecf20Sopenharmony_ci		/* Run over all pdd of the process */
9498c2ecf20Sopenharmony_ci		pdd = kfd_get_first_process_device_data(p);
9508c2ecf20Sopenharmony_ci		do {
9518c2ecf20Sopenharmony_ci			args->num_of_nodes++;
9528c2ecf20Sopenharmony_ci			pdd = kfd_get_next_process_device_data(p, pdd);
9538c2ecf20Sopenharmony_ci		} while (pdd);
9548c2ecf20Sopenharmony_ci
9558c2ecf20Sopenharmony_ci		goto out_unlock;
9568c2ecf20Sopenharmony_ci	}
9578c2ecf20Sopenharmony_ci
9588c2ecf20Sopenharmony_ci	/* Fill in process-aperture information for all available
9598c2ecf20Sopenharmony_ci	 * nodes, but not more than args->num_of_nodes as that is
9608c2ecf20Sopenharmony_ci	 * the amount of memory allocated by user
9618c2ecf20Sopenharmony_ci	 */
9628c2ecf20Sopenharmony_ci	pa = kzalloc((sizeof(struct kfd_process_device_apertures) *
9638c2ecf20Sopenharmony_ci				args->num_of_nodes), GFP_KERNEL);
9648c2ecf20Sopenharmony_ci	if (!pa)
9658c2ecf20Sopenharmony_ci		return -ENOMEM;
9668c2ecf20Sopenharmony_ci
9678c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
9688c2ecf20Sopenharmony_ci
9698c2ecf20Sopenharmony_ci	if (!kfd_has_process_device_data(p)) {
9708c2ecf20Sopenharmony_ci		args->num_of_nodes = 0;
9718c2ecf20Sopenharmony_ci		kfree(pa);
9728c2ecf20Sopenharmony_ci		goto out_unlock;
9738c2ecf20Sopenharmony_ci	}
9748c2ecf20Sopenharmony_ci
9758c2ecf20Sopenharmony_ci	/* Run over all pdd of the process */
9768c2ecf20Sopenharmony_ci	pdd = kfd_get_first_process_device_data(p);
9778c2ecf20Sopenharmony_ci	do {
9788c2ecf20Sopenharmony_ci		pa[nodes].gpu_id = pdd->dev->id;
9798c2ecf20Sopenharmony_ci		pa[nodes].lds_base = pdd->lds_base;
9808c2ecf20Sopenharmony_ci		pa[nodes].lds_limit = pdd->lds_limit;
9818c2ecf20Sopenharmony_ci		pa[nodes].gpuvm_base = pdd->gpuvm_base;
9828c2ecf20Sopenharmony_ci		pa[nodes].gpuvm_limit = pdd->gpuvm_limit;
9838c2ecf20Sopenharmony_ci		pa[nodes].scratch_base = pdd->scratch_base;
9848c2ecf20Sopenharmony_ci		pa[nodes].scratch_limit = pdd->scratch_limit;
9858c2ecf20Sopenharmony_ci
9868c2ecf20Sopenharmony_ci		dev_dbg(kfd_device,
9878c2ecf20Sopenharmony_ci			"gpu id %u\n", pdd->dev->id);
9888c2ecf20Sopenharmony_ci		dev_dbg(kfd_device,
9898c2ecf20Sopenharmony_ci			"lds_base %llX\n", pdd->lds_base);
9908c2ecf20Sopenharmony_ci		dev_dbg(kfd_device,
9918c2ecf20Sopenharmony_ci			"lds_limit %llX\n", pdd->lds_limit);
9928c2ecf20Sopenharmony_ci		dev_dbg(kfd_device,
9938c2ecf20Sopenharmony_ci			"gpuvm_base %llX\n", pdd->gpuvm_base);
9948c2ecf20Sopenharmony_ci		dev_dbg(kfd_device,
9958c2ecf20Sopenharmony_ci			"gpuvm_limit %llX\n", pdd->gpuvm_limit);
9968c2ecf20Sopenharmony_ci		dev_dbg(kfd_device,
9978c2ecf20Sopenharmony_ci			"scratch_base %llX\n", pdd->scratch_base);
9988c2ecf20Sopenharmony_ci		dev_dbg(kfd_device,
9998c2ecf20Sopenharmony_ci			"scratch_limit %llX\n", pdd->scratch_limit);
10008c2ecf20Sopenharmony_ci		nodes++;
10018c2ecf20Sopenharmony_ci
10028c2ecf20Sopenharmony_ci		pdd = kfd_get_next_process_device_data(p, pdd);
10038c2ecf20Sopenharmony_ci	} while (pdd && (nodes < args->num_of_nodes));
10048c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
10058c2ecf20Sopenharmony_ci
10068c2ecf20Sopenharmony_ci	args->num_of_nodes = nodes;
10078c2ecf20Sopenharmony_ci	ret = copy_to_user(
10088c2ecf20Sopenharmony_ci			(void __user *)args->kfd_process_device_apertures_ptr,
10098c2ecf20Sopenharmony_ci			pa,
10108c2ecf20Sopenharmony_ci			(nodes * sizeof(struct kfd_process_device_apertures)));
10118c2ecf20Sopenharmony_ci	kfree(pa);
10128c2ecf20Sopenharmony_ci	return ret ? -EFAULT : 0;
10138c2ecf20Sopenharmony_ci
10148c2ecf20Sopenharmony_ciout_unlock:
10158c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
10168c2ecf20Sopenharmony_ci	return 0;
10178c2ecf20Sopenharmony_ci}
10188c2ecf20Sopenharmony_ci
10198c2ecf20Sopenharmony_cistatic int kfd_ioctl_create_event(struct file *filp, struct kfd_process *p,
10208c2ecf20Sopenharmony_ci					void *data)
10218c2ecf20Sopenharmony_ci{
10228c2ecf20Sopenharmony_ci	struct kfd_ioctl_create_event_args *args = data;
10238c2ecf20Sopenharmony_ci	int err;
10248c2ecf20Sopenharmony_ci
10258c2ecf20Sopenharmony_ci	/* For dGPUs the event page is allocated in user mode. The
10268c2ecf20Sopenharmony_ci	 * handle is passed to KFD with the first call to this IOCTL
10278c2ecf20Sopenharmony_ci	 * through the event_page_offset field.
10288c2ecf20Sopenharmony_ci	 */
10298c2ecf20Sopenharmony_ci	if (args->event_page_offset) {
10308c2ecf20Sopenharmony_ci		struct kfd_dev *kfd;
10318c2ecf20Sopenharmony_ci		struct kfd_process_device *pdd;
10328c2ecf20Sopenharmony_ci		void *mem, *kern_addr;
10338c2ecf20Sopenharmony_ci		uint64_t size;
10348c2ecf20Sopenharmony_ci
10358c2ecf20Sopenharmony_ci		if (p->signal_page) {
10368c2ecf20Sopenharmony_ci			pr_err("Event page is already set\n");
10378c2ecf20Sopenharmony_ci			return -EINVAL;
10388c2ecf20Sopenharmony_ci		}
10398c2ecf20Sopenharmony_ci
10408c2ecf20Sopenharmony_ci		kfd = kfd_device_by_id(GET_GPU_ID(args->event_page_offset));
10418c2ecf20Sopenharmony_ci		if (!kfd) {
10428c2ecf20Sopenharmony_ci			pr_err("Getting device by id failed in %s\n", __func__);
10438c2ecf20Sopenharmony_ci			return -EINVAL;
10448c2ecf20Sopenharmony_ci		}
10458c2ecf20Sopenharmony_ci
10468c2ecf20Sopenharmony_ci		mutex_lock(&p->mutex);
10478c2ecf20Sopenharmony_ci		pdd = kfd_bind_process_to_device(kfd, p);
10488c2ecf20Sopenharmony_ci		if (IS_ERR(pdd)) {
10498c2ecf20Sopenharmony_ci			err = PTR_ERR(pdd);
10508c2ecf20Sopenharmony_ci			goto out_unlock;
10518c2ecf20Sopenharmony_ci		}
10528c2ecf20Sopenharmony_ci
10538c2ecf20Sopenharmony_ci		mem = kfd_process_device_translate_handle(pdd,
10548c2ecf20Sopenharmony_ci				GET_IDR_HANDLE(args->event_page_offset));
10558c2ecf20Sopenharmony_ci		if (!mem) {
10568c2ecf20Sopenharmony_ci			pr_err("Can't find BO, offset is 0x%llx\n",
10578c2ecf20Sopenharmony_ci			       args->event_page_offset);
10588c2ecf20Sopenharmony_ci			err = -EINVAL;
10598c2ecf20Sopenharmony_ci			goto out_unlock;
10608c2ecf20Sopenharmony_ci		}
10618c2ecf20Sopenharmony_ci		mutex_unlock(&p->mutex);
10628c2ecf20Sopenharmony_ci
10638c2ecf20Sopenharmony_ci		err = amdgpu_amdkfd_gpuvm_map_gtt_bo_to_kernel(kfd->kgd,
10648c2ecf20Sopenharmony_ci						mem, &kern_addr, &size);
10658c2ecf20Sopenharmony_ci		if (err) {
10668c2ecf20Sopenharmony_ci			pr_err("Failed to map event page to kernel\n");
10678c2ecf20Sopenharmony_ci			return err;
10688c2ecf20Sopenharmony_ci		}
10698c2ecf20Sopenharmony_ci
10708c2ecf20Sopenharmony_ci		err = kfd_event_page_set(p, kern_addr, size);
10718c2ecf20Sopenharmony_ci		if (err) {
10728c2ecf20Sopenharmony_ci			pr_err("Failed to set event page\n");
10738c2ecf20Sopenharmony_ci			return err;
10748c2ecf20Sopenharmony_ci		}
10758c2ecf20Sopenharmony_ci	}
10768c2ecf20Sopenharmony_ci
10778c2ecf20Sopenharmony_ci	err = kfd_event_create(filp, p, args->event_type,
10788c2ecf20Sopenharmony_ci				args->auto_reset != 0, args->node_id,
10798c2ecf20Sopenharmony_ci				&args->event_id, &args->event_trigger_data,
10808c2ecf20Sopenharmony_ci				&args->event_page_offset,
10818c2ecf20Sopenharmony_ci				&args->event_slot_index);
10828c2ecf20Sopenharmony_ci
10838c2ecf20Sopenharmony_ci	return err;
10848c2ecf20Sopenharmony_ci
10858c2ecf20Sopenharmony_ciout_unlock:
10868c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
10878c2ecf20Sopenharmony_ci	return err;
10888c2ecf20Sopenharmony_ci}
10898c2ecf20Sopenharmony_ci
10908c2ecf20Sopenharmony_cistatic int kfd_ioctl_destroy_event(struct file *filp, struct kfd_process *p,
10918c2ecf20Sopenharmony_ci					void *data)
10928c2ecf20Sopenharmony_ci{
10938c2ecf20Sopenharmony_ci	struct kfd_ioctl_destroy_event_args *args = data;
10948c2ecf20Sopenharmony_ci
10958c2ecf20Sopenharmony_ci	return kfd_event_destroy(p, args->event_id);
10968c2ecf20Sopenharmony_ci}
10978c2ecf20Sopenharmony_ci
10988c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_event(struct file *filp, struct kfd_process *p,
10998c2ecf20Sopenharmony_ci				void *data)
11008c2ecf20Sopenharmony_ci{
11018c2ecf20Sopenharmony_ci	struct kfd_ioctl_set_event_args *args = data;
11028c2ecf20Sopenharmony_ci
11038c2ecf20Sopenharmony_ci	return kfd_set_event(p, args->event_id);
11048c2ecf20Sopenharmony_ci}
11058c2ecf20Sopenharmony_ci
11068c2ecf20Sopenharmony_cistatic int kfd_ioctl_reset_event(struct file *filp, struct kfd_process *p,
11078c2ecf20Sopenharmony_ci				void *data)
11088c2ecf20Sopenharmony_ci{
11098c2ecf20Sopenharmony_ci	struct kfd_ioctl_reset_event_args *args = data;
11108c2ecf20Sopenharmony_ci
11118c2ecf20Sopenharmony_ci	return kfd_reset_event(p, args->event_id);
11128c2ecf20Sopenharmony_ci}
11138c2ecf20Sopenharmony_ci
11148c2ecf20Sopenharmony_cistatic int kfd_ioctl_wait_events(struct file *filp, struct kfd_process *p,
11158c2ecf20Sopenharmony_ci				void *data)
11168c2ecf20Sopenharmony_ci{
11178c2ecf20Sopenharmony_ci	struct kfd_ioctl_wait_events_args *args = data;
11188c2ecf20Sopenharmony_ci	int err;
11198c2ecf20Sopenharmony_ci
11208c2ecf20Sopenharmony_ci	err = kfd_wait_on_events(p, args->num_events,
11218c2ecf20Sopenharmony_ci			(void __user *)args->events_ptr,
11228c2ecf20Sopenharmony_ci			(args->wait_for_all != 0),
11238c2ecf20Sopenharmony_ci			args->timeout, &args->wait_result);
11248c2ecf20Sopenharmony_ci
11258c2ecf20Sopenharmony_ci	return err;
11268c2ecf20Sopenharmony_ci}
11278c2ecf20Sopenharmony_cistatic int kfd_ioctl_set_scratch_backing_va(struct file *filep,
11288c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
11298c2ecf20Sopenharmony_ci{
11308c2ecf20Sopenharmony_ci	struct kfd_ioctl_set_scratch_backing_va_args *args = data;
11318c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
11328c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
11338c2ecf20Sopenharmony_ci	long err;
11348c2ecf20Sopenharmony_ci
11358c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
11368c2ecf20Sopenharmony_ci	if (!dev)
11378c2ecf20Sopenharmony_ci		return -EINVAL;
11388c2ecf20Sopenharmony_ci
11398c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
11408c2ecf20Sopenharmony_ci
11418c2ecf20Sopenharmony_ci	pdd = kfd_bind_process_to_device(dev, p);
11428c2ecf20Sopenharmony_ci	if (IS_ERR(pdd)) {
11438c2ecf20Sopenharmony_ci		err = PTR_ERR(pdd);
11448c2ecf20Sopenharmony_ci		goto bind_process_to_device_fail;
11458c2ecf20Sopenharmony_ci	}
11468c2ecf20Sopenharmony_ci
11478c2ecf20Sopenharmony_ci	pdd->qpd.sh_hidden_private_base = args->va_addr;
11488c2ecf20Sopenharmony_ci
11498c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
11508c2ecf20Sopenharmony_ci
11518c2ecf20Sopenharmony_ci	if (dev->dqm->sched_policy == KFD_SCHED_POLICY_NO_HWS &&
11528c2ecf20Sopenharmony_ci	    pdd->qpd.vmid != 0 && dev->kfd2kgd->set_scratch_backing_va)
11538c2ecf20Sopenharmony_ci		dev->kfd2kgd->set_scratch_backing_va(
11548c2ecf20Sopenharmony_ci			dev->kgd, args->va_addr, pdd->qpd.vmid);
11558c2ecf20Sopenharmony_ci
11568c2ecf20Sopenharmony_ci	return 0;
11578c2ecf20Sopenharmony_ci
11588c2ecf20Sopenharmony_cibind_process_to_device_fail:
11598c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
11608c2ecf20Sopenharmony_ci	return err;
11618c2ecf20Sopenharmony_ci}
11628c2ecf20Sopenharmony_ci
11638c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_tile_config(struct file *filep,
11648c2ecf20Sopenharmony_ci		struct kfd_process *p, void *data)
11658c2ecf20Sopenharmony_ci{
11668c2ecf20Sopenharmony_ci	struct kfd_ioctl_get_tile_config_args *args = data;
11678c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
11688c2ecf20Sopenharmony_ci	struct tile_config config;
11698c2ecf20Sopenharmony_ci	int err = 0;
11708c2ecf20Sopenharmony_ci
11718c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
11728c2ecf20Sopenharmony_ci	if (!dev)
11738c2ecf20Sopenharmony_ci		return -EINVAL;
11748c2ecf20Sopenharmony_ci
11758c2ecf20Sopenharmony_ci	amdgpu_amdkfd_get_tile_config(dev->kgd, &config);
11768c2ecf20Sopenharmony_ci
11778c2ecf20Sopenharmony_ci	args->gb_addr_config = config.gb_addr_config;
11788c2ecf20Sopenharmony_ci	args->num_banks = config.num_banks;
11798c2ecf20Sopenharmony_ci	args->num_ranks = config.num_ranks;
11808c2ecf20Sopenharmony_ci
11818c2ecf20Sopenharmony_ci	if (args->num_tile_configs > config.num_tile_configs)
11828c2ecf20Sopenharmony_ci		args->num_tile_configs = config.num_tile_configs;
11838c2ecf20Sopenharmony_ci	err = copy_to_user((void __user *)args->tile_config_ptr,
11848c2ecf20Sopenharmony_ci			config.tile_config_ptr,
11858c2ecf20Sopenharmony_ci			args->num_tile_configs * sizeof(uint32_t));
11868c2ecf20Sopenharmony_ci	if (err) {
11878c2ecf20Sopenharmony_ci		args->num_tile_configs = 0;
11888c2ecf20Sopenharmony_ci		return -EFAULT;
11898c2ecf20Sopenharmony_ci	}
11908c2ecf20Sopenharmony_ci
11918c2ecf20Sopenharmony_ci	if (args->num_macro_tile_configs > config.num_macro_tile_configs)
11928c2ecf20Sopenharmony_ci		args->num_macro_tile_configs =
11938c2ecf20Sopenharmony_ci				config.num_macro_tile_configs;
11948c2ecf20Sopenharmony_ci	err = copy_to_user((void __user *)args->macro_tile_config_ptr,
11958c2ecf20Sopenharmony_ci			config.macro_tile_config_ptr,
11968c2ecf20Sopenharmony_ci			args->num_macro_tile_configs * sizeof(uint32_t));
11978c2ecf20Sopenharmony_ci	if (err) {
11988c2ecf20Sopenharmony_ci		args->num_macro_tile_configs = 0;
11998c2ecf20Sopenharmony_ci		return -EFAULT;
12008c2ecf20Sopenharmony_ci	}
12018c2ecf20Sopenharmony_ci
12028c2ecf20Sopenharmony_ci	return 0;
12038c2ecf20Sopenharmony_ci}
12048c2ecf20Sopenharmony_ci
12058c2ecf20Sopenharmony_cistatic int kfd_ioctl_acquire_vm(struct file *filep, struct kfd_process *p,
12068c2ecf20Sopenharmony_ci				void *data)
12078c2ecf20Sopenharmony_ci{
12088c2ecf20Sopenharmony_ci	struct kfd_ioctl_acquire_vm_args *args = data;
12098c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
12108c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
12118c2ecf20Sopenharmony_ci	struct file *drm_file;
12128c2ecf20Sopenharmony_ci	int ret;
12138c2ecf20Sopenharmony_ci
12148c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
12158c2ecf20Sopenharmony_ci	if (!dev)
12168c2ecf20Sopenharmony_ci		return -EINVAL;
12178c2ecf20Sopenharmony_ci
12188c2ecf20Sopenharmony_ci	drm_file = fget(args->drm_fd);
12198c2ecf20Sopenharmony_ci	if (!drm_file)
12208c2ecf20Sopenharmony_ci		return -EINVAL;
12218c2ecf20Sopenharmony_ci
12228c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
12238c2ecf20Sopenharmony_ci
12248c2ecf20Sopenharmony_ci	pdd = kfd_get_process_device_data(dev, p);
12258c2ecf20Sopenharmony_ci	if (!pdd) {
12268c2ecf20Sopenharmony_ci		ret = -EINVAL;
12278c2ecf20Sopenharmony_ci		goto err_unlock;
12288c2ecf20Sopenharmony_ci	}
12298c2ecf20Sopenharmony_ci
12308c2ecf20Sopenharmony_ci	if (pdd->drm_file) {
12318c2ecf20Sopenharmony_ci		ret = pdd->drm_file == drm_file ? 0 : -EBUSY;
12328c2ecf20Sopenharmony_ci		goto err_unlock;
12338c2ecf20Sopenharmony_ci	}
12348c2ecf20Sopenharmony_ci
12358c2ecf20Sopenharmony_ci	ret = kfd_process_device_init_vm(pdd, drm_file);
12368c2ecf20Sopenharmony_ci	if (ret)
12378c2ecf20Sopenharmony_ci		goto err_unlock;
12388c2ecf20Sopenharmony_ci	/* On success, the PDD keeps the drm_file reference */
12398c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
12408c2ecf20Sopenharmony_ci
12418c2ecf20Sopenharmony_ci	return 0;
12428c2ecf20Sopenharmony_ci
12438c2ecf20Sopenharmony_cierr_unlock:
12448c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
12458c2ecf20Sopenharmony_ci	fput(drm_file);
12468c2ecf20Sopenharmony_ci	return ret;
12478c2ecf20Sopenharmony_ci}
12488c2ecf20Sopenharmony_ci
12498c2ecf20Sopenharmony_cibool kfd_dev_is_large_bar(struct kfd_dev *dev)
12508c2ecf20Sopenharmony_ci{
12518c2ecf20Sopenharmony_ci	struct kfd_local_mem_info mem_info;
12528c2ecf20Sopenharmony_ci
12538c2ecf20Sopenharmony_ci	if (debug_largebar) {
12548c2ecf20Sopenharmony_ci		pr_debug("Simulate large-bar allocation on non large-bar machine\n");
12558c2ecf20Sopenharmony_ci		return true;
12568c2ecf20Sopenharmony_ci	}
12578c2ecf20Sopenharmony_ci
12588c2ecf20Sopenharmony_ci	if (dev->use_iommu_v2)
12598c2ecf20Sopenharmony_ci		return false;
12608c2ecf20Sopenharmony_ci
12618c2ecf20Sopenharmony_ci	amdgpu_amdkfd_get_local_mem_info(dev->kgd, &mem_info);
12628c2ecf20Sopenharmony_ci	if (mem_info.local_mem_size_private == 0 &&
12638c2ecf20Sopenharmony_ci			mem_info.local_mem_size_public > 0)
12648c2ecf20Sopenharmony_ci		return true;
12658c2ecf20Sopenharmony_ci	return false;
12668c2ecf20Sopenharmony_ci}
12678c2ecf20Sopenharmony_ci
12688c2ecf20Sopenharmony_cistatic int kfd_ioctl_alloc_memory_of_gpu(struct file *filep,
12698c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
12708c2ecf20Sopenharmony_ci{
12718c2ecf20Sopenharmony_ci	struct kfd_ioctl_alloc_memory_of_gpu_args *args = data;
12728c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
12738c2ecf20Sopenharmony_ci	void *mem;
12748c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
12758c2ecf20Sopenharmony_ci	int idr_handle;
12768c2ecf20Sopenharmony_ci	long err;
12778c2ecf20Sopenharmony_ci	uint64_t offset = args->mmap_offset;
12788c2ecf20Sopenharmony_ci	uint32_t flags = args->flags;
12798c2ecf20Sopenharmony_ci
12808c2ecf20Sopenharmony_ci	if (args->size == 0)
12818c2ecf20Sopenharmony_ci		return -EINVAL;
12828c2ecf20Sopenharmony_ci
12838c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
12848c2ecf20Sopenharmony_ci	if (!dev)
12858c2ecf20Sopenharmony_ci		return -EINVAL;
12868c2ecf20Sopenharmony_ci
12878c2ecf20Sopenharmony_ci	if ((flags & KFD_IOC_ALLOC_MEM_FLAGS_PUBLIC) &&
12888c2ecf20Sopenharmony_ci		(flags & KFD_IOC_ALLOC_MEM_FLAGS_VRAM) &&
12898c2ecf20Sopenharmony_ci		!kfd_dev_is_large_bar(dev)) {
12908c2ecf20Sopenharmony_ci		pr_err("Alloc host visible vram on small bar is not allowed\n");
12918c2ecf20Sopenharmony_ci		return -EINVAL;
12928c2ecf20Sopenharmony_ci	}
12938c2ecf20Sopenharmony_ci
12948c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
12958c2ecf20Sopenharmony_ci
12968c2ecf20Sopenharmony_ci	pdd = kfd_bind_process_to_device(dev, p);
12978c2ecf20Sopenharmony_ci	if (IS_ERR(pdd)) {
12988c2ecf20Sopenharmony_ci		err = PTR_ERR(pdd);
12998c2ecf20Sopenharmony_ci		goto err_unlock;
13008c2ecf20Sopenharmony_ci	}
13018c2ecf20Sopenharmony_ci
13028c2ecf20Sopenharmony_ci	if (flags & KFD_IOC_ALLOC_MEM_FLAGS_DOORBELL) {
13038c2ecf20Sopenharmony_ci		if (args->size != kfd_doorbell_process_slice(dev)) {
13048c2ecf20Sopenharmony_ci			err = -EINVAL;
13058c2ecf20Sopenharmony_ci			goto err_unlock;
13068c2ecf20Sopenharmony_ci		}
13078c2ecf20Sopenharmony_ci		offset = kfd_get_process_doorbells(pdd);
13088c2ecf20Sopenharmony_ci	} else if (flags & KFD_IOC_ALLOC_MEM_FLAGS_MMIO_REMAP) {
13098c2ecf20Sopenharmony_ci		if (args->size != PAGE_SIZE) {
13108c2ecf20Sopenharmony_ci			err = -EINVAL;
13118c2ecf20Sopenharmony_ci			goto err_unlock;
13128c2ecf20Sopenharmony_ci		}
13138c2ecf20Sopenharmony_ci		offset = amdgpu_amdkfd_get_mmio_remap_phys_addr(dev->kgd);
13148c2ecf20Sopenharmony_ci		if (!offset) {
13158c2ecf20Sopenharmony_ci			err = -ENOMEM;
13168c2ecf20Sopenharmony_ci			goto err_unlock;
13178c2ecf20Sopenharmony_ci		}
13188c2ecf20Sopenharmony_ci	}
13198c2ecf20Sopenharmony_ci
13208c2ecf20Sopenharmony_ci	err = amdgpu_amdkfd_gpuvm_alloc_memory_of_gpu(
13218c2ecf20Sopenharmony_ci		dev->kgd, args->va_addr, args->size,
13228c2ecf20Sopenharmony_ci		pdd->vm, (struct kgd_mem **) &mem, &offset,
13238c2ecf20Sopenharmony_ci		flags);
13248c2ecf20Sopenharmony_ci
13258c2ecf20Sopenharmony_ci	if (err)
13268c2ecf20Sopenharmony_ci		goto err_unlock;
13278c2ecf20Sopenharmony_ci
13288c2ecf20Sopenharmony_ci	idr_handle = kfd_process_device_create_obj_handle(pdd, mem);
13298c2ecf20Sopenharmony_ci	if (idr_handle < 0) {
13308c2ecf20Sopenharmony_ci		err = -EFAULT;
13318c2ecf20Sopenharmony_ci		goto err_free;
13328c2ecf20Sopenharmony_ci	}
13338c2ecf20Sopenharmony_ci
13348c2ecf20Sopenharmony_ci	/* Update the VRAM usage count */
13358c2ecf20Sopenharmony_ci	if (flags & KFD_IOC_ALLOC_MEM_FLAGS_VRAM)
13368c2ecf20Sopenharmony_ci		WRITE_ONCE(pdd->vram_usage, pdd->vram_usage + args->size);
13378c2ecf20Sopenharmony_ci
13388c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
13398c2ecf20Sopenharmony_ci
13408c2ecf20Sopenharmony_ci	args->handle = MAKE_HANDLE(args->gpu_id, idr_handle);
13418c2ecf20Sopenharmony_ci	args->mmap_offset = offset;
13428c2ecf20Sopenharmony_ci
13438c2ecf20Sopenharmony_ci	/* MMIO is mapped through kfd device
13448c2ecf20Sopenharmony_ci	 * Generate a kfd mmap offset
13458c2ecf20Sopenharmony_ci	 */
13468c2ecf20Sopenharmony_ci	if (flags & KFD_IOC_ALLOC_MEM_FLAGS_MMIO_REMAP)
13478c2ecf20Sopenharmony_ci		args->mmap_offset = KFD_MMAP_TYPE_MMIO
13488c2ecf20Sopenharmony_ci					| KFD_MMAP_GPU_ID(args->gpu_id);
13498c2ecf20Sopenharmony_ci
13508c2ecf20Sopenharmony_ci	return 0;
13518c2ecf20Sopenharmony_ci
13528c2ecf20Sopenharmony_cierr_free:
13538c2ecf20Sopenharmony_ci	amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd, (struct kgd_mem *)mem, NULL);
13548c2ecf20Sopenharmony_cierr_unlock:
13558c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
13568c2ecf20Sopenharmony_ci	return err;
13578c2ecf20Sopenharmony_ci}
13588c2ecf20Sopenharmony_ci
13598c2ecf20Sopenharmony_cistatic int kfd_ioctl_free_memory_of_gpu(struct file *filep,
13608c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
13618c2ecf20Sopenharmony_ci{
13628c2ecf20Sopenharmony_ci	struct kfd_ioctl_free_memory_of_gpu_args *args = data;
13638c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
13648c2ecf20Sopenharmony_ci	void *mem;
13658c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
13668c2ecf20Sopenharmony_ci	int ret;
13678c2ecf20Sopenharmony_ci	uint64_t size = 0;
13688c2ecf20Sopenharmony_ci
13698c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(GET_GPU_ID(args->handle));
13708c2ecf20Sopenharmony_ci	if (!dev)
13718c2ecf20Sopenharmony_ci		return -EINVAL;
13728c2ecf20Sopenharmony_ci
13738c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
13748c2ecf20Sopenharmony_ci
13758c2ecf20Sopenharmony_ci	pdd = kfd_get_process_device_data(dev, p);
13768c2ecf20Sopenharmony_ci	if (!pdd) {
13778c2ecf20Sopenharmony_ci		pr_err("Process device data doesn't exist\n");
13788c2ecf20Sopenharmony_ci		ret = -EINVAL;
13798c2ecf20Sopenharmony_ci		goto err_unlock;
13808c2ecf20Sopenharmony_ci	}
13818c2ecf20Sopenharmony_ci
13828c2ecf20Sopenharmony_ci	mem = kfd_process_device_translate_handle(
13838c2ecf20Sopenharmony_ci		pdd, GET_IDR_HANDLE(args->handle));
13848c2ecf20Sopenharmony_ci	if (!mem) {
13858c2ecf20Sopenharmony_ci		ret = -EINVAL;
13868c2ecf20Sopenharmony_ci		goto err_unlock;
13878c2ecf20Sopenharmony_ci	}
13888c2ecf20Sopenharmony_ci
13898c2ecf20Sopenharmony_ci	ret = amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd,
13908c2ecf20Sopenharmony_ci						(struct kgd_mem *)mem, &size);
13918c2ecf20Sopenharmony_ci
13928c2ecf20Sopenharmony_ci	/* If freeing the buffer failed, leave the handle in place for
13938c2ecf20Sopenharmony_ci	 * clean-up during process tear-down.
13948c2ecf20Sopenharmony_ci	 */
13958c2ecf20Sopenharmony_ci	if (!ret)
13968c2ecf20Sopenharmony_ci		kfd_process_device_remove_obj_handle(
13978c2ecf20Sopenharmony_ci			pdd, GET_IDR_HANDLE(args->handle));
13988c2ecf20Sopenharmony_ci
13998c2ecf20Sopenharmony_ci	WRITE_ONCE(pdd->vram_usage, pdd->vram_usage - size);
14008c2ecf20Sopenharmony_ci
14018c2ecf20Sopenharmony_cierr_unlock:
14028c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
14038c2ecf20Sopenharmony_ci	return ret;
14048c2ecf20Sopenharmony_ci}
14058c2ecf20Sopenharmony_ci
14068c2ecf20Sopenharmony_cistatic int kfd_ioctl_map_memory_to_gpu(struct file *filep,
14078c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
14088c2ecf20Sopenharmony_ci{
14098c2ecf20Sopenharmony_ci	struct kfd_ioctl_map_memory_to_gpu_args *args = data;
14108c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd, *peer_pdd;
14118c2ecf20Sopenharmony_ci	void *mem;
14128c2ecf20Sopenharmony_ci	struct kfd_dev *dev, *peer;
14138c2ecf20Sopenharmony_ci	long err = 0;
14148c2ecf20Sopenharmony_ci	int i;
14158c2ecf20Sopenharmony_ci	uint32_t *devices_arr = NULL;
14168c2ecf20Sopenharmony_ci
14178c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(GET_GPU_ID(args->handle));
14188c2ecf20Sopenharmony_ci	if (!dev)
14198c2ecf20Sopenharmony_ci		return -EINVAL;
14208c2ecf20Sopenharmony_ci
14218c2ecf20Sopenharmony_ci	if (!args->n_devices) {
14228c2ecf20Sopenharmony_ci		pr_debug("Device IDs array empty\n");
14238c2ecf20Sopenharmony_ci		return -EINVAL;
14248c2ecf20Sopenharmony_ci	}
14258c2ecf20Sopenharmony_ci	if (args->n_success > args->n_devices) {
14268c2ecf20Sopenharmony_ci		pr_debug("n_success exceeds n_devices\n");
14278c2ecf20Sopenharmony_ci		return -EINVAL;
14288c2ecf20Sopenharmony_ci	}
14298c2ecf20Sopenharmony_ci
14308c2ecf20Sopenharmony_ci	devices_arr = kmalloc_array(args->n_devices, sizeof(*devices_arr),
14318c2ecf20Sopenharmony_ci				    GFP_KERNEL);
14328c2ecf20Sopenharmony_ci	if (!devices_arr)
14338c2ecf20Sopenharmony_ci		return -ENOMEM;
14348c2ecf20Sopenharmony_ci
14358c2ecf20Sopenharmony_ci	err = copy_from_user(devices_arr,
14368c2ecf20Sopenharmony_ci			     (void __user *)args->device_ids_array_ptr,
14378c2ecf20Sopenharmony_ci			     args->n_devices * sizeof(*devices_arr));
14388c2ecf20Sopenharmony_ci	if (err != 0) {
14398c2ecf20Sopenharmony_ci		err = -EFAULT;
14408c2ecf20Sopenharmony_ci		goto copy_from_user_failed;
14418c2ecf20Sopenharmony_ci	}
14428c2ecf20Sopenharmony_ci
14438c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
14448c2ecf20Sopenharmony_ci
14458c2ecf20Sopenharmony_ci	pdd = kfd_bind_process_to_device(dev, p);
14468c2ecf20Sopenharmony_ci	if (IS_ERR(pdd)) {
14478c2ecf20Sopenharmony_ci		err = PTR_ERR(pdd);
14488c2ecf20Sopenharmony_ci		goto bind_process_to_device_failed;
14498c2ecf20Sopenharmony_ci	}
14508c2ecf20Sopenharmony_ci
14518c2ecf20Sopenharmony_ci	mem = kfd_process_device_translate_handle(pdd,
14528c2ecf20Sopenharmony_ci						GET_IDR_HANDLE(args->handle));
14538c2ecf20Sopenharmony_ci	if (!mem) {
14548c2ecf20Sopenharmony_ci		err = -ENOMEM;
14558c2ecf20Sopenharmony_ci		goto get_mem_obj_from_handle_failed;
14568c2ecf20Sopenharmony_ci	}
14578c2ecf20Sopenharmony_ci
14588c2ecf20Sopenharmony_ci	for (i = args->n_success; i < args->n_devices; i++) {
14598c2ecf20Sopenharmony_ci		peer = kfd_device_by_id(devices_arr[i]);
14608c2ecf20Sopenharmony_ci		if (!peer) {
14618c2ecf20Sopenharmony_ci			pr_debug("Getting device by id failed for 0x%x\n",
14628c2ecf20Sopenharmony_ci				 devices_arr[i]);
14638c2ecf20Sopenharmony_ci			err = -EINVAL;
14648c2ecf20Sopenharmony_ci			goto get_mem_obj_from_handle_failed;
14658c2ecf20Sopenharmony_ci		}
14668c2ecf20Sopenharmony_ci
14678c2ecf20Sopenharmony_ci		peer_pdd = kfd_bind_process_to_device(peer, p);
14688c2ecf20Sopenharmony_ci		if (IS_ERR(peer_pdd)) {
14698c2ecf20Sopenharmony_ci			err = PTR_ERR(peer_pdd);
14708c2ecf20Sopenharmony_ci			goto get_mem_obj_from_handle_failed;
14718c2ecf20Sopenharmony_ci		}
14728c2ecf20Sopenharmony_ci		err = amdgpu_amdkfd_gpuvm_map_memory_to_gpu(
14738c2ecf20Sopenharmony_ci			peer->kgd, (struct kgd_mem *)mem, peer_pdd->vm);
14748c2ecf20Sopenharmony_ci		if (err) {
14758c2ecf20Sopenharmony_ci			pr_err("Failed to map to gpu %d/%d\n",
14768c2ecf20Sopenharmony_ci			       i, args->n_devices);
14778c2ecf20Sopenharmony_ci			goto map_memory_to_gpu_failed;
14788c2ecf20Sopenharmony_ci		}
14798c2ecf20Sopenharmony_ci		args->n_success = i+1;
14808c2ecf20Sopenharmony_ci	}
14818c2ecf20Sopenharmony_ci
14828c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
14838c2ecf20Sopenharmony_ci
14848c2ecf20Sopenharmony_ci	err = amdgpu_amdkfd_gpuvm_sync_memory(dev->kgd, (struct kgd_mem *) mem, true);
14858c2ecf20Sopenharmony_ci	if (err) {
14868c2ecf20Sopenharmony_ci		pr_debug("Sync memory failed, wait interrupted by user signal\n");
14878c2ecf20Sopenharmony_ci		goto sync_memory_failed;
14888c2ecf20Sopenharmony_ci	}
14898c2ecf20Sopenharmony_ci
14908c2ecf20Sopenharmony_ci	/* Flush TLBs after waiting for the page table updates to complete */
14918c2ecf20Sopenharmony_ci	for (i = 0; i < args->n_devices; i++) {
14928c2ecf20Sopenharmony_ci		peer = kfd_device_by_id(devices_arr[i]);
14938c2ecf20Sopenharmony_ci		if (WARN_ON_ONCE(!peer))
14948c2ecf20Sopenharmony_ci			continue;
14958c2ecf20Sopenharmony_ci		peer_pdd = kfd_get_process_device_data(peer, p);
14968c2ecf20Sopenharmony_ci		if (WARN_ON_ONCE(!peer_pdd))
14978c2ecf20Sopenharmony_ci			continue;
14988c2ecf20Sopenharmony_ci		kfd_flush_tlb(peer_pdd);
14998c2ecf20Sopenharmony_ci	}
15008c2ecf20Sopenharmony_ci
15018c2ecf20Sopenharmony_ci	kfree(devices_arr);
15028c2ecf20Sopenharmony_ci
15038c2ecf20Sopenharmony_ci	return err;
15048c2ecf20Sopenharmony_ci
15058c2ecf20Sopenharmony_cibind_process_to_device_failed:
15068c2ecf20Sopenharmony_ciget_mem_obj_from_handle_failed:
15078c2ecf20Sopenharmony_cimap_memory_to_gpu_failed:
15088c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
15098c2ecf20Sopenharmony_cicopy_from_user_failed:
15108c2ecf20Sopenharmony_cisync_memory_failed:
15118c2ecf20Sopenharmony_ci	kfree(devices_arr);
15128c2ecf20Sopenharmony_ci
15138c2ecf20Sopenharmony_ci	return err;
15148c2ecf20Sopenharmony_ci}
15158c2ecf20Sopenharmony_ci
15168c2ecf20Sopenharmony_cistatic int kfd_ioctl_unmap_memory_from_gpu(struct file *filep,
15178c2ecf20Sopenharmony_ci					struct kfd_process *p, void *data)
15188c2ecf20Sopenharmony_ci{
15198c2ecf20Sopenharmony_ci	struct kfd_ioctl_unmap_memory_from_gpu_args *args = data;
15208c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd, *peer_pdd;
15218c2ecf20Sopenharmony_ci	void *mem;
15228c2ecf20Sopenharmony_ci	struct kfd_dev *dev, *peer;
15238c2ecf20Sopenharmony_ci	long err = 0;
15248c2ecf20Sopenharmony_ci	uint32_t *devices_arr = NULL, i;
15258c2ecf20Sopenharmony_ci
15268c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(GET_GPU_ID(args->handle));
15278c2ecf20Sopenharmony_ci	if (!dev)
15288c2ecf20Sopenharmony_ci		return -EINVAL;
15298c2ecf20Sopenharmony_ci
15308c2ecf20Sopenharmony_ci	if (!args->n_devices) {
15318c2ecf20Sopenharmony_ci		pr_debug("Device IDs array empty\n");
15328c2ecf20Sopenharmony_ci		return -EINVAL;
15338c2ecf20Sopenharmony_ci	}
15348c2ecf20Sopenharmony_ci	if (args->n_success > args->n_devices) {
15358c2ecf20Sopenharmony_ci		pr_debug("n_success exceeds n_devices\n");
15368c2ecf20Sopenharmony_ci		return -EINVAL;
15378c2ecf20Sopenharmony_ci	}
15388c2ecf20Sopenharmony_ci
15398c2ecf20Sopenharmony_ci	devices_arr = kmalloc_array(args->n_devices, sizeof(*devices_arr),
15408c2ecf20Sopenharmony_ci				    GFP_KERNEL);
15418c2ecf20Sopenharmony_ci	if (!devices_arr)
15428c2ecf20Sopenharmony_ci		return -ENOMEM;
15438c2ecf20Sopenharmony_ci
15448c2ecf20Sopenharmony_ci	err = copy_from_user(devices_arr,
15458c2ecf20Sopenharmony_ci			     (void __user *)args->device_ids_array_ptr,
15468c2ecf20Sopenharmony_ci			     args->n_devices * sizeof(*devices_arr));
15478c2ecf20Sopenharmony_ci	if (err != 0) {
15488c2ecf20Sopenharmony_ci		err = -EFAULT;
15498c2ecf20Sopenharmony_ci		goto copy_from_user_failed;
15508c2ecf20Sopenharmony_ci	}
15518c2ecf20Sopenharmony_ci
15528c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
15538c2ecf20Sopenharmony_ci
15548c2ecf20Sopenharmony_ci	pdd = kfd_get_process_device_data(dev, p);
15558c2ecf20Sopenharmony_ci	if (!pdd) {
15568c2ecf20Sopenharmony_ci		err = -EINVAL;
15578c2ecf20Sopenharmony_ci		goto bind_process_to_device_failed;
15588c2ecf20Sopenharmony_ci	}
15598c2ecf20Sopenharmony_ci
15608c2ecf20Sopenharmony_ci	mem = kfd_process_device_translate_handle(pdd,
15618c2ecf20Sopenharmony_ci						GET_IDR_HANDLE(args->handle));
15628c2ecf20Sopenharmony_ci	if (!mem) {
15638c2ecf20Sopenharmony_ci		err = -ENOMEM;
15648c2ecf20Sopenharmony_ci		goto get_mem_obj_from_handle_failed;
15658c2ecf20Sopenharmony_ci	}
15668c2ecf20Sopenharmony_ci
15678c2ecf20Sopenharmony_ci	for (i = args->n_success; i < args->n_devices; i++) {
15688c2ecf20Sopenharmony_ci		peer = kfd_device_by_id(devices_arr[i]);
15698c2ecf20Sopenharmony_ci		if (!peer) {
15708c2ecf20Sopenharmony_ci			err = -EINVAL;
15718c2ecf20Sopenharmony_ci			goto get_mem_obj_from_handle_failed;
15728c2ecf20Sopenharmony_ci		}
15738c2ecf20Sopenharmony_ci
15748c2ecf20Sopenharmony_ci		peer_pdd = kfd_get_process_device_data(peer, p);
15758c2ecf20Sopenharmony_ci		if (!peer_pdd) {
15768c2ecf20Sopenharmony_ci			err = -ENODEV;
15778c2ecf20Sopenharmony_ci			goto get_mem_obj_from_handle_failed;
15788c2ecf20Sopenharmony_ci		}
15798c2ecf20Sopenharmony_ci		err = amdgpu_amdkfd_gpuvm_unmap_memory_from_gpu(
15808c2ecf20Sopenharmony_ci			peer->kgd, (struct kgd_mem *)mem, peer_pdd->vm);
15818c2ecf20Sopenharmony_ci		if (err) {
15828c2ecf20Sopenharmony_ci			pr_err("Failed to unmap from gpu %d/%d\n",
15838c2ecf20Sopenharmony_ci			       i, args->n_devices);
15848c2ecf20Sopenharmony_ci			goto unmap_memory_from_gpu_failed;
15858c2ecf20Sopenharmony_ci		}
15868c2ecf20Sopenharmony_ci		args->n_success = i+1;
15878c2ecf20Sopenharmony_ci	}
15888c2ecf20Sopenharmony_ci	kfree(devices_arr);
15898c2ecf20Sopenharmony_ci
15908c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
15918c2ecf20Sopenharmony_ci
15928c2ecf20Sopenharmony_ci	return 0;
15938c2ecf20Sopenharmony_ci
15948c2ecf20Sopenharmony_cibind_process_to_device_failed:
15958c2ecf20Sopenharmony_ciget_mem_obj_from_handle_failed:
15968c2ecf20Sopenharmony_ciunmap_memory_from_gpu_failed:
15978c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
15988c2ecf20Sopenharmony_cicopy_from_user_failed:
15998c2ecf20Sopenharmony_ci	kfree(devices_arr);
16008c2ecf20Sopenharmony_ci	return err;
16018c2ecf20Sopenharmony_ci}
16028c2ecf20Sopenharmony_ci
16038c2ecf20Sopenharmony_cistatic int kfd_ioctl_alloc_queue_gws(struct file *filep,
16048c2ecf20Sopenharmony_ci		struct kfd_process *p, void *data)
16058c2ecf20Sopenharmony_ci{
16068c2ecf20Sopenharmony_ci	int retval;
16078c2ecf20Sopenharmony_ci	struct kfd_ioctl_alloc_queue_gws_args *args = data;
16088c2ecf20Sopenharmony_ci	struct queue *q;
16098c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
16108c2ecf20Sopenharmony_ci
16118c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
16128c2ecf20Sopenharmony_ci	q = pqm_get_user_queue(&p->pqm, args->queue_id);
16138c2ecf20Sopenharmony_ci
16148c2ecf20Sopenharmony_ci	if (q) {
16158c2ecf20Sopenharmony_ci		dev = q->device;
16168c2ecf20Sopenharmony_ci	} else {
16178c2ecf20Sopenharmony_ci		retval = -EINVAL;
16188c2ecf20Sopenharmony_ci		goto out_unlock;
16198c2ecf20Sopenharmony_ci	}
16208c2ecf20Sopenharmony_ci
16218c2ecf20Sopenharmony_ci	if (!dev->gws) {
16228c2ecf20Sopenharmony_ci		retval = -ENODEV;
16238c2ecf20Sopenharmony_ci		goto out_unlock;
16248c2ecf20Sopenharmony_ci	}
16258c2ecf20Sopenharmony_ci
16268c2ecf20Sopenharmony_ci	if (dev->dqm->sched_policy == KFD_SCHED_POLICY_NO_HWS) {
16278c2ecf20Sopenharmony_ci		retval = -ENODEV;
16288c2ecf20Sopenharmony_ci		goto out_unlock;
16298c2ecf20Sopenharmony_ci	}
16308c2ecf20Sopenharmony_ci
16318c2ecf20Sopenharmony_ci	retval = pqm_set_gws(&p->pqm, args->queue_id, args->num_gws ? dev->gws : NULL);
16328c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
16338c2ecf20Sopenharmony_ci
16348c2ecf20Sopenharmony_ci	args->first_gws = 0;
16358c2ecf20Sopenharmony_ci	return retval;
16368c2ecf20Sopenharmony_ci
16378c2ecf20Sopenharmony_ciout_unlock:
16388c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
16398c2ecf20Sopenharmony_ci	return retval;
16408c2ecf20Sopenharmony_ci}
16418c2ecf20Sopenharmony_ci
16428c2ecf20Sopenharmony_cistatic int kfd_ioctl_get_dmabuf_info(struct file *filep,
16438c2ecf20Sopenharmony_ci		struct kfd_process *p, void *data)
16448c2ecf20Sopenharmony_ci{
16458c2ecf20Sopenharmony_ci	struct kfd_ioctl_get_dmabuf_info_args *args = data;
16468c2ecf20Sopenharmony_ci	struct kfd_dev *dev = NULL;
16478c2ecf20Sopenharmony_ci	struct kgd_dev *dma_buf_kgd;
16488c2ecf20Sopenharmony_ci	void *metadata_buffer = NULL;
16498c2ecf20Sopenharmony_ci	uint32_t flags;
16508c2ecf20Sopenharmony_ci	unsigned int i;
16518c2ecf20Sopenharmony_ci	int r;
16528c2ecf20Sopenharmony_ci
16538c2ecf20Sopenharmony_ci	/* Find a KFD GPU device that supports the get_dmabuf_info query */
16548c2ecf20Sopenharmony_ci	for (i = 0; kfd_topology_enum_kfd_devices(i, &dev) == 0; i++)
16558c2ecf20Sopenharmony_ci		if (dev)
16568c2ecf20Sopenharmony_ci			break;
16578c2ecf20Sopenharmony_ci	if (!dev)
16588c2ecf20Sopenharmony_ci		return -EINVAL;
16598c2ecf20Sopenharmony_ci
16608c2ecf20Sopenharmony_ci	if (args->metadata_ptr) {
16618c2ecf20Sopenharmony_ci		metadata_buffer = kzalloc(args->metadata_size, GFP_KERNEL);
16628c2ecf20Sopenharmony_ci		if (!metadata_buffer)
16638c2ecf20Sopenharmony_ci			return -ENOMEM;
16648c2ecf20Sopenharmony_ci	}
16658c2ecf20Sopenharmony_ci
16668c2ecf20Sopenharmony_ci	/* Get dmabuf info from KGD */
16678c2ecf20Sopenharmony_ci	r = amdgpu_amdkfd_get_dmabuf_info(dev->kgd, args->dmabuf_fd,
16688c2ecf20Sopenharmony_ci					  &dma_buf_kgd, &args->size,
16698c2ecf20Sopenharmony_ci					  metadata_buffer, args->metadata_size,
16708c2ecf20Sopenharmony_ci					  &args->metadata_size, &flags);
16718c2ecf20Sopenharmony_ci	if (r)
16728c2ecf20Sopenharmony_ci		goto exit;
16738c2ecf20Sopenharmony_ci
16748c2ecf20Sopenharmony_ci	/* Reverse-lookup gpu_id from kgd pointer */
16758c2ecf20Sopenharmony_ci	dev = kfd_device_by_kgd(dma_buf_kgd);
16768c2ecf20Sopenharmony_ci	if (!dev) {
16778c2ecf20Sopenharmony_ci		r = -EINVAL;
16788c2ecf20Sopenharmony_ci		goto exit;
16798c2ecf20Sopenharmony_ci	}
16808c2ecf20Sopenharmony_ci	args->gpu_id = dev->id;
16818c2ecf20Sopenharmony_ci	args->flags = flags;
16828c2ecf20Sopenharmony_ci
16838c2ecf20Sopenharmony_ci	/* Copy metadata buffer to user mode */
16848c2ecf20Sopenharmony_ci	if (metadata_buffer) {
16858c2ecf20Sopenharmony_ci		r = copy_to_user((void __user *)args->metadata_ptr,
16868c2ecf20Sopenharmony_ci				 metadata_buffer, args->metadata_size);
16878c2ecf20Sopenharmony_ci		if (r != 0)
16888c2ecf20Sopenharmony_ci			r = -EFAULT;
16898c2ecf20Sopenharmony_ci	}
16908c2ecf20Sopenharmony_ci
16918c2ecf20Sopenharmony_ciexit:
16928c2ecf20Sopenharmony_ci	kfree(metadata_buffer);
16938c2ecf20Sopenharmony_ci
16948c2ecf20Sopenharmony_ci	return r;
16958c2ecf20Sopenharmony_ci}
16968c2ecf20Sopenharmony_ci
16978c2ecf20Sopenharmony_cistatic int kfd_ioctl_import_dmabuf(struct file *filep,
16988c2ecf20Sopenharmony_ci				   struct kfd_process *p, void *data)
16998c2ecf20Sopenharmony_ci{
17008c2ecf20Sopenharmony_ci	struct kfd_ioctl_import_dmabuf_args *args = data;
17018c2ecf20Sopenharmony_ci	struct kfd_process_device *pdd;
17028c2ecf20Sopenharmony_ci	struct dma_buf *dmabuf;
17038c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
17048c2ecf20Sopenharmony_ci	int idr_handle;
17058c2ecf20Sopenharmony_ci	uint64_t size;
17068c2ecf20Sopenharmony_ci	void *mem;
17078c2ecf20Sopenharmony_ci	int r;
17088c2ecf20Sopenharmony_ci
17098c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpu_id);
17108c2ecf20Sopenharmony_ci	if (!dev)
17118c2ecf20Sopenharmony_ci		return -EINVAL;
17128c2ecf20Sopenharmony_ci
17138c2ecf20Sopenharmony_ci	dmabuf = dma_buf_get(args->dmabuf_fd);
17148c2ecf20Sopenharmony_ci	if (IS_ERR(dmabuf))
17158c2ecf20Sopenharmony_ci		return PTR_ERR(dmabuf);
17168c2ecf20Sopenharmony_ci
17178c2ecf20Sopenharmony_ci	mutex_lock(&p->mutex);
17188c2ecf20Sopenharmony_ci
17198c2ecf20Sopenharmony_ci	pdd = kfd_bind_process_to_device(dev, p);
17208c2ecf20Sopenharmony_ci	if (IS_ERR(pdd)) {
17218c2ecf20Sopenharmony_ci		r = PTR_ERR(pdd);
17228c2ecf20Sopenharmony_ci		goto err_unlock;
17238c2ecf20Sopenharmony_ci	}
17248c2ecf20Sopenharmony_ci
17258c2ecf20Sopenharmony_ci	r = amdgpu_amdkfd_gpuvm_import_dmabuf(dev->kgd, dmabuf,
17268c2ecf20Sopenharmony_ci					      args->va_addr, pdd->vm,
17278c2ecf20Sopenharmony_ci					      (struct kgd_mem **)&mem, &size,
17288c2ecf20Sopenharmony_ci					      NULL);
17298c2ecf20Sopenharmony_ci	if (r)
17308c2ecf20Sopenharmony_ci		goto err_unlock;
17318c2ecf20Sopenharmony_ci
17328c2ecf20Sopenharmony_ci	idr_handle = kfd_process_device_create_obj_handle(pdd, mem);
17338c2ecf20Sopenharmony_ci	if (idr_handle < 0) {
17348c2ecf20Sopenharmony_ci		r = -EFAULT;
17358c2ecf20Sopenharmony_ci		goto err_free;
17368c2ecf20Sopenharmony_ci	}
17378c2ecf20Sopenharmony_ci
17388c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
17398c2ecf20Sopenharmony_ci	dma_buf_put(dmabuf);
17408c2ecf20Sopenharmony_ci
17418c2ecf20Sopenharmony_ci	args->handle = MAKE_HANDLE(args->gpu_id, idr_handle);
17428c2ecf20Sopenharmony_ci
17438c2ecf20Sopenharmony_ci	return 0;
17448c2ecf20Sopenharmony_ci
17458c2ecf20Sopenharmony_cierr_free:
17468c2ecf20Sopenharmony_ci	amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd, (struct kgd_mem *)mem, NULL);
17478c2ecf20Sopenharmony_cierr_unlock:
17488c2ecf20Sopenharmony_ci	mutex_unlock(&p->mutex);
17498c2ecf20Sopenharmony_ci	dma_buf_put(dmabuf);
17508c2ecf20Sopenharmony_ci	return r;
17518c2ecf20Sopenharmony_ci}
17528c2ecf20Sopenharmony_ci
17538c2ecf20Sopenharmony_ci/* Handle requests for watching SMI events */
17548c2ecf20Sopenharmony_cistatic int kfd_ioctl_smi_events(struct file *filep,
17558c2ecf20Sopenharmony_ci				struct kfd_process *p, void *data)
17568c2ecf20Sopenharmony_ci{
17578c2ecf20Sopenharmony_ci	struct kfd_ioctl_smi_events_args *args = data;
17588c2ecf20Sopenharmony_ci	struct kfd_dev *dev;
17598c2ecf20Sopenharmony_ci
17608c2ecf20Sopenharmony_ci	dev = kfd_device_by_id(args->gpuid);
17618c2ecf20Sopenharmony_ci	if (!dev)
17628c2ecf20Sopenharmony_ci		return -EINVAL;
17638c2ecf20Sopenharmony_ci
17648c2ecf20Sopenharmony_ci	return kfd_smi_event_open(dev, &args->anon_fd);
17658c2ecf20Sopenharmony_ci}
17668c2ecf20Sopenharmony_ci
/*
 * Build one designated-initializer entry of an ioctl descriptor array.
 * The entry lands at index _IOC_NR(ioctl); .name is the stringified
 * command macro and .cmd_drv is always 0.
 */
#define AMDKFD_IOCTL_DEF(ioctl, _func, _flags)				\
	[_IOC_NR(ioctl)] = {						\
		.cmd = ioctl,						\
		.cmd_drv = 0,						\
		.func = _func,						\
		.flags = _flags,					\
		.name = #ioctl,						\
	}
17708c2ecf20Sopenharmony_ci
17718c2ecf20Sopenharmony_ci/** Ioctl table */
17728c2ecf20Sopenharmony_cistatic const struct amdkfd_ioctl_desc amdkfd_ioctls[] = {
17738c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_VERSION,
17748c2ecf20Sopenharmony_ci			kfd_ioctl_get_version, 0),
17758c2ecf20Sopenharmony_ci
17768c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_CREATE_QUEUE,
17778c2ecf20Sopenharmony_ci			kfd_ioctl_create_queue, 0),
17788c2ecf20Sopenharmony_ci
17798c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_DESTROY_QUEUE,
17808c2ecf20Sopenharmony_ci			kfd_ioctl_destroy_queue, 0),
17818c2ecf20Sopenharmony_ci
17828c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_MEMORY_POLICY,
17838c2ecf20Sopenharmony_ci			kfd_ioctl_set_memory_policy, 0),
17848c2ecf20Sopenharmony_ci
17858c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_CLOCK_COUNTERS,
17868c2ecf20Sopenharmony_ci			kfd_ioctl_get_clock_counters, 0),
17878c2ecf20Sopenharmony_ci
17888c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_PROCESS_APERTURES,
17898c2ecf20Sopenharmony_ci			kfd_ioctl_get_process_apertures, 0),
17908c2ecf20Sopenharmony_ci
17918c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_UPDATE_QUEUE,
17928c2ecf20Sopenharmony_ci			kfd_ioctl_update_queue, 0),
17938c2ecf20Sopenharmony_ci
17948c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_CREATE_EVENT,
17958c2ecf20Sopenharmony_ci			kfd_ioctl_create_event, 0),
17968c2ecf20Sopenharmony_ci
17978c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_DESTROY_EVENT,
17988c2ecf20Sopenharmony_ci			kfd_ioctl_destroy_event, 0),
17998c2ecf20Sopenharmony_ci
18008c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_EVENT,
18018c2ecf20Sopenharmony_ci			kfd_ioctl_set_event, 0),
18028c2ecf20Sopenharmony_ci
18038c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_RESET_EVENT,
18048c2ecf20Sopenharmony_ci			kfd_ioctl_reset_event, 0),
18058c2ecf20Sopenharmony_ci
18068c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_WAIT_EVENTS,
18078c2ecf20Sopenharmony_ci			kfd_ioctl_wait_events, 0),
18088c2ecf20Sopenharmony_ci
18098c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_DBG_REGISTER,
18108c2ecf20Sopenharmony_ci			kfd_ioctl_dbg_register, 0),
18118c2ecf20Sopenharmony_ci
18128c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_DBG_UNREGISTER,
18138c2ecf20Sopenharmony_ci			kfd_ioctl_dbg_unregister, 0),
18148c2ecf20Sopenharmony_ci
18158c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_DBG_ADDRESS_WATCH,
18168c2ecf20Sopenharmony_ci			kfd_ioctl_dbg_address_watch, 0),
18178c2ecf20Sopenharmony_ci
18188c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_DBG_WAVE_CONTROL,
18198c2ecf20Sopenharmony_ci			kfd_ioctl_dbg_wave_control, 0),
18208c2ecf20Sopenharmony_ci
18218c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_SCRATCH_BACKING_VA,
18228c2ecf20Sopenharmony_ci			kfd_ioctl_set_scratch_backing_va, 0),
18238c2ecf20Sopenharmony_ci
18248c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_TILE_CONFIG,
18258c2ecf20Sopenharmony_ci			kfd_ioctl_get_tile_config, 0),
18268c2ecf20Sopenharmony_ci
18278c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_TRAP_HANDLER,
18288c2ecf20Sopenharmony_ci			kfd_ioctl_set_trap_handler, 0),
18298c2ecf20Sopenharmony_ci
18308c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_PROCESS_APERTURES_NEW,
18318c2ecf20Sopenharmony_ci			kfd_ioctl_get_process_apertures_new, 0),
18328c2ecf20Sopenharmony_ci
18338c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_ACQUIRE_VM,
18348c2ecf20Sopenharmony_ci			kfd_ioctl_acquire_vm, 0),
18358c2ecf20Sopenharmony_ci
18368c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_ALLOC_MEMORY_OF_GPU,
18378c2ecf20Sopenharmony_ci			kfd_ioctl_alloc_memory_of_gpu, 0),
18388c2ecf20Sopenharmony_ci
18398c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_FREE_MEMORY_OF_GPU,
18408c2ecf20Sopenharmony_ci			kfd_ioctl_free_memory_of_gpu, 0),
18418c2ecf20Sopenharmony_ci
18428c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_MAP_MEMORY_TO_GPU,
18438c2ecf20Sopenharmony_ci			kfd_ioctl_map_memory_to_gpu, 0),
18448c2ecf20Sopenharmony_ci
18458c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_UNMAP_MEMORY_FROM_GPU,
18468c2ecf20Sopenharmony_ci			kfd_ioctl_unmap_memory_from_gpu, 0),
18478c2ecf20Sopenharmony_ci
18488c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_CU_MASK,
18498c2ecf20Sopenharmony_ci			kfd_ioctl_set_cu_mask, 0),
18508c2ecf20Sopenharmony_ci
18518c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_QUEUE_WAVE_STATE,
18528c2ecf20Sopenharmony_ci			kfd_ioctl_get_queue_wave_state, 0),
18538c2ecf20Sopenharmony_ci
18548c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_DMABUF_INFO,
18558c2ecf20Sopenharmony_ci				kfd_ioctl_get_dmabuf_info, 0),
18568c2ecf20Sopenharmony_ci
18578c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_IMPORT_DMABUF,
18588c2ecf20Sopenharmony_ci				kfd_ioctl_import_dmabuf, 0),
18598c2ecf20Sopenharmony_ci
18608c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_ALLOC_QUEUE_GWS,
18618c2ecf20Sopenharmony_ci			kfd_ioctl_alloc_queue_gws, 0),
18628c2ecf20Sopenharmony_ci
18638c2ecf20Sopenharmony_ci	AMDKFD_IOCTL_DEF(AMDKFD_IOC_SMI_EVENTS,
18648c2ecf20Sopenharmony_ci			kfd_ioctl_smi_events, 0),
18658c2ecf20Sopenharmony_ci};
18668c2ecf20Sopenharmony_ci
18678c2ecf20Sopenharmony_ci#define AMDKFD_CORE_IOCTL_COUNT	ARRAY_SIZE(amdkfd_ioctls)
18688c2ecf20Sopenharmony_ci
18698c2ecf20Sopenharmony_cistatic long kfd_ioctl(struct file *filep, unsigned int cmd, unsigned long arg)
18708c2ecf20Sopenharmony_ci{
18718c2ecf20Sopenharmony_ci	struct kfd_process *process;
18728c2ecf20Sopenharmony_ci	amdkfd_ioctl_t *func;
18738c2ecf20Sopenharmony_ci	const struct amdkfd_ioctl_desc *ioctl = NULL;
18748c2ecf20Sopenharmony_ci	unsigned int nr = _IOC_NR(cmd);
18758c2ecf20Sopenharmony_ci	char stack_kdata[128];
18768c2ecf20Sopenharmony_ci	char *kdata = NULL;
18778c2ecf20Sopenharmony_ci	unsigned int usize, asize;
18788c2ecf20Sopenharmony_ci	int retcode = -EINVAL;
18798c2ecf20Sopenharmony_ci
18808c2ecf20Sopenharmony_ci	if (nr >= AMDKFD_CORE_IOCTL_COUNT)
18818c2ecf20Sopenharmony_ci		goto err_i1;
18828c2ecf20Sopenharmony_ci
18838c2ecf20Sopenharmony_ci	if ((nr >= AMDKFD_COMMAND_START) && (nr < AMDKFD_COMMAND_END)) {
18848c2ecf20Sopenharmony_ci		u32 amdkfd_size;
18858c2ecf20Sopenharmony_ci
18868c2ecf20Sopenharmony_ci		ioctl = &amdkfd_ioctls[nr];
18878c2ecf20Sopenharmony_ci
18888c2ecf20Sopenharmony_ci		amdkfd_size = _IOC_SIZE(ioctl->cmd);
18898c2ecf20Sopenharmony_ci		usize = asize = _IOC_SIZE(cmd);
18908c2ecf20Sopenharmony_ci		if (amdkfd_size > asize)
18918c2ecf20Sopenharmony_ci			asize = amdkfd_size;
18928c2ecf20Sopenharmony_ci
18938c2ecf20Sopenharmony_ci		cmd = ioctl->cmd;
18948c2ecf20Sopenharmony_ci	} else
18958c2ecf20Sopenharmony_ci		goto err_i1;
18968c2ecf20Sopenharmony_ci
18978c2ecf20Sopenharmony_ci	dev_dbg(kfd_device, "ioctl cmd 0x%x (#0x%x), arg 0x%lx\n", cmd, nr, arg);
18988c2ecf20Sopenharmony_ci
18998c2ecf20Sopenharmony_ci	/* Get the process struct from the filep. Only the process
19008c2ecf20Sopenharmony_ci	 * that opened /dev/kfd can use the file descriptor. Child
19018c2ecf20Sopenharmony_ci	 * processes need to create their own KFD device context.
19028c2ecf20Sopenharmony_ci	 */
19038c2ecf20Sopenharmony_ci	process = filep->private_data;
19048c2ecf20Sopenharmony_ci	if (process->lead_thread != current->group_leader) {
19058c2ecf20Sopenharmony_ci		dev_dbg(kfd_device, "Using KFD FD in wrong process\n");
19068c2ecf20Sopenharmony_ci		retcode = -EBADF;
19078c2ecf20Sopenharmony_ci		goto err_i1;
19088c2ecf20Sopenharmony_ci	}
19098c2ecf20Sopenharmony_ci
19108c2ecf20Sopenharmony_ci	/* Do not trust userspace, use our own definition */
19118c2ecf20Sopenharmony_ci	func = ioctl->func;
19128c2ecf20Sopenharmony_ci
19138c2ecf20Sopenharmony_ci	if (unlikely(!func)) {
19148c2ecf20Sopenharmony_ci		dev_dbg(kfd_device, "no function\n");
19158c2ecf20Sopenharmony_ci		retcode = -EINVAL;
19168c2ecf20Sopenharmony_ci		goto err_i1;
19178c2ecf20Sopenharmony_ci	}
19188c2ecf20Sopenharmony_ci
19198c2ecf20Sopenharmony_ci	if (cmd & (IOC_IN | IOC_OUT)) {
19208c2ecf20Sopenharmony_ci		if (asize <= sizeof(stack_kdata)) {
19218c2ecf20Sopenharmony_ci			kdata = stack_kdata;
19228c2ecf20Sopenharmony_ci		} else {
19238c2ecf20Sopenharmony_ci			kdata = kmalloc(asize, GFP_KERNEL);
19248c2ecf20Sopenharmony_ci			if (!kdata) {
19258c2ecf20Sopenharmony_ci				retcode = -ENOMEM;
19268c2ecf20Sopenharmony_ci				goto err_i1;
19278c2ecf20Sopenharmony_ci			}
19288c2ecf20Sopenharmony_ci		}
19298c2ecf20Sopenharmony_ci		if (asize > usize)
19308c2ecf20Sopenharmony_ci			memset(kdata + usize, 0, asize - usize);
19318c2ecf20Sopenharmony_ci	}
19328c2ecf20Sopenharmony_ci
19338c2ecf20Sopenharmony_ci	if (cmd & IOC_IN) {
19348c2ecf20Sopenharmony_ci		if (copy_from_user(kdata, (void __user *)arg, usize) != 0) {
19358c2ecf20Sopenharmony_ci			retcode = -EFAULT;
19368c2ecf20Sopenharmony_ci			goto err_i1;
19378c2ecf20Sopenharmony_ci		}
19388c2ecf20Sopenharmony_ci	} else if (cmd & IOC_OUT) {
19398c2ecf20Sopenharmony_ci		memset(kdata, 0, usize);
19408c2ecf20Sopenharmony_ci	}
19418c2ecf20Sopenharmony_ci
19428c2ecf20Sopenharmony_ci	retcode = func(filep, process, kdata);
19438c2ecf20Sopenharmony_ci
19448c2ecf20Sopenharmony_ci	if (cmd & IOC_OUT)
19458c2ecf20Sopenharmony_ci		if (copy_to_user((void __user *)arg, kdata, usize) != 0)
19468c2ecf20Sopenharmony_ci			retcode = -EFAULT;
19478c2ecf20Sopenharmony_ci
19488c2ecf20Sopenharmony_cierr_i1:
19498c2ecf20Sopenharmony_ci	if (!ioctl)
19508c2ecf20Sopenharmony_ci		dev_dbg(kfd_device, "invalid ioctl: pid=%d, cmd=0x%02x, nr=0x%02x\n",
19518c2ecf20Sopenharmony_ci			  task_pid_nr(current), cmd, nr);
19528c2ecf20Sopenharmony_ci
19538c2ecf20Sopenharmony_ci	if (kdata != stack_kdata)
19548c2ecf20Sopenharmony_ci		kfree(kdata);
19558c2ecf20Sopenharmony_ci
19568c2ecf20Sopenharmony_ci	if (retcode)
19578c2ecf20Sopenharmony_ci		dev_dbg(kfd_device, "ioctl cmd (#0x%x), arg 0x%lx, ret = %d\n",
19588c2ecf20Sopenharmony_ci				nr, arg, retcode);
19598c2ecf20Sopenharmony_ci
19608c2ecf20Sopenharmony_ci	return retcode;
19618c2ecf20Sopenharmony_ci}
19628c2ecf20Sopenharmony_ci
19638c2ecf20Sopenharmony_cistatic int kfd_mmio_mmap(struct kfd_dev *dev, struct kfd_process *process,
19648c2ecf20Sopenharmony_ci		      struct vm_area_struct *vma)
19658c2ecf20Sopenharmony_ci{
19668c2ecf20Sopenharmony_ci	phys_addr_t address;
19678c2ecf20Sopenharmony_ci	int ret;
19688c2ecf20Sopenharmony_ci
19698c2ecf20Sopenharmony_ci	if (vma->vm_end - vma->vm_start != PAGE_SIZE)
19708c2ecf20Sopenharmony_ci		return -EINVAL;
19718c2ecf20Sopenharmony_ci
19728c2ecf20Sopenharmony_ci	address = amdgpu_amdkfd_get_mmio_remap_phys_addr(dev->kgd);
19738c2ecf20Sopenharmony_ci
19748c2ecf20Sopenharmony_ci	vma->vm_flags |= VM_IO | VM_DONTCOPY | VM_DONTEXPAND | VM_NORESERVE |
19758c2ecf20Sopenharmony_ci				VM_DONTDUMP | VM_PFNMAP;
19768c2ecf20Sopenharmony_ci
19778c2ecf20Sopenharmony_ci	vma->vm_page_prot = pgprot_noncached(vma->vm_page_prot);
19788c2ecf20Sopenharmony_ci
19798c2ecf20Sopenharmony_ci	pr_debug("pasid 0x%x mapping mmio page\n"
19808c2ecf20Sopenharmony_ci		 "     target user address == 0x%08llX\n"
19818c2ecf20Sopenharmony_ci		 "     physical address    == 0x%08llX\n"
19828c2ecf20Sopenharmony_ci		 "     vm_flags            == 0x%04lX\n"
19838c2ecf20Sopenharmony_ci		 "     size                == 0x%04lX\n",
19848c2ecf20Sopenharmony_ci		 process->pasid, (unsigned long long) vma->vm_start,
19858c2ecf20Sopenharmony_ci		 address, vma->vm_flags, PAGE_SIZE);
19868c2ecf20Sopenharmony_ci
19878c2ecf20Sopenharmony_ci	ret = io_remap_pfn_range(vma,
19888c2ecf20Sopenharmony_ci				vma->vm_start,
19898c2ecf20Sopenharmony_ci				address >> PAGE_SHIFT,
19908c2ecf20Sopenharmony_ci				PAGE_SIZE,
19918c2ecf20Sopenharmony_ci				vma->vm_page_prot);
19928c2ecf20Sopenharmony_ci	return ret;
19938c2ecf20Sopenharmony_ci}
19948c2ecf20Sopenharmony_ci
19958c2ecf20Sopenharmony_ci
19968c2ecf20Sopenharmony_cistatic int kfd_mmap(struct file *filp, struct vm_area_struct *vma)
19978c2ecf20Sopenharmony_ci{
19988c2ecf20Sopenharmony_ci	struct kfd_process *process;
19998c2ecf20Sopenharmony_ci	struct kfd_dev *dev = NULL;
20008c2ecf20Sopenharmony_ci	unsigned long mmap_offset;
20018c2ecf20Sopenharmony_ci	unsigned int gpu_id;
20028c2ecf20Sopenharmony_ci
20038c2ecf20Sopenharmony_ci	process = kfd_get_process(current);
20048c2ecf20Sopenharmony_ci	if (IS_ERR(process))
20058c2ecf20Sopenharmony_ci		return PTR_ERR(process);
20068c2ecf20Sopenharmony_ci
20078c2ecf20Sopenharmony_ci	mmap_offset = vma->vm_pgoff << PAGE_SHIFT;
20088c2ecf20Sopenharmony_ci	gpu_id = KFD_MMAP_GET_GPU_ID(mmap_offset);
20098c2ecf20Sopenharmony_ci	if (gpu_id)
20108c2ecf20Sopenharmony_ci		dev = kfd_device_by_id(gpu_id);
20118c2ecf20Sopenharmony_ci
20128c2ecf20Sopenharmony_ci	switch (mmap_offset & KFD_MMAP_TYPE_MASK) {
20138c2ecf20Sopenharmony_ci	case KFD_MMAP_TYPE_DOORBELL:
20148c2ecf20Sopenharmony_ci		if (!dev)
20158c2ecf20Sopenharmony_ci			return -ENODEV;
20168c2ecf20Sopenharmony_ci		return kfd_doorbell_mmap(dev, process, vma);
20178c2ecf20Sopenharmony_ci
20188c2ecf20Sopenharmony_ci	case KFD_MMAP_TYPE_EVENTS:
20198c2ecf20Sopenharmony_ci		return kfd_event_mmap(process, vma);
20208c2ecf20Sopenharmony_ci
20218c2ecf20Sopenharmony_ci	case KFD_MMAP_TYPE_RESERVED_MEM:
20228c2ecf20Sopenharmony_ci		if (!dev)
20238c2ecf20Sopenharmony_ci			return -ENODEV;
20248c2ecf20Sopenharmony_ci		return kfd_reserved_mem_mmap(dev, process, vma);
20258c2ecf20Sopenharmony_ci	case KFD_MMAP_TYPE_MMIO:
20268c2ecf20Sopenharmony_ci		if (!dev)
20278c2ecf20Sopenharmony_ci			return -ENODEV;
20288c2ecf20Sopenharmony_ci		return kfd_mmio_mmap(dev, process, vma);
20298c2ecf20Sopenharmony_ci	}
20308c2ecf20Sopenharmony_ci
20318c2ecf20Sopenharmony_ci	return -EFAULT;
20328c2ecf20Sopenharmony_ci}
2033