18c2ecf20Sopenharmony_ci/*
28c2ecf20Sopenharmony_ci * Copyright 2014 Advanced Micro Devices, Inc.
38c2ecf20Sopenharmony_ci * All Rights Reserved.
48c2ecf20Sopenharmony_ci *
58c2ecf20Sopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a
68c2ecf20Sopenharmony_ci * copy of this software and associated documentation files (the
78c2ecf20Sopenharmony_ci * "Software"), to deal in the Software without restriction, including
88c2ecf20Sopenharmony_ci * without limitation the rights to use, copy, modify, merge, publish,
98c2ecf20Sopenharmony_ci * distribute, sub license, and/or sell copies of the Software, and to
108c2ecf20Sopenharmony_ci * permit persons to whom the Software is furnished to do so, subject to
118c2ecf20Sopenharmony_ci * the following conditions:
128c2ecf20Sopenharmony_ci *
138c2ecf20Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
148c2ecf20Sopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
158c2ecf20Sopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
168c2ecf20Sopenharmony_ci * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
178c2ecf20Sopenharmony_ci * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
188c2ecf20Sopenharmony_ci * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
198c2ecf20Sopenharmony_ci * USE OR OTHER DEALINGS IN THE SOFTWARE.
208c2ecf20Sopenharmony_ci *
218c2ecf20Sopenharmony_ci * The above copyright notice and this permission notice (including the
228c2ecf20Sopenharmony_ci * next paragraph) shall be included in all copies or substantial portions
238c2ecf20Sopenharmony_ci * of the Software.
248c2ecf20Sopenharmony_ci *
258c2ecf20Sopenharmony_ci */
268c2ecf20Sopenharmony_ci/*
278c2ecf20Sopenharmony_ci * Authors:
288c2ecf20Sopenharmony_ci *    Christian König <christian.koenig@amd.com>
298c2ecf20Sopenharmony_ci */
308c2ecf20Sopenharmony_ci
318c2ecf20Sopenharmony_ci/**
328c2ecf20Sopenharmony_ci * DOC: MMU Notifier
338c2ecf20Sopenharmony_ci *
348c2ecf20Sopenharmony_ci * For coherent userptr handling registers an MMU notifier to inform the driver
358c2ecf20Sopenharmony_ci * about updates on the page tables of a process.
368c2ecf20Sopenharmony_ci *
378c2ecf20Sopenharmony_ci * When somebody tries to invalidate the page tables we block the update until
388c2ecf20Sopenharmony_ci * all operations on the pages in question are completed, then those pages are
398c2ecf20Sopenharmony_ci * marked as accessed and also dirty if it wasn't a read only access.
408c2ecf20Sopenharmony_ci *
418c2ecf20Sopenharmony_ci * New command submissions using the userptrs in question are delayed until all
428c2ecf20Sopenharmony_ci * page table invalidation are completed and we once more see a coherent process
438c2ecf20Sopenharmony_ci * address space.
448c2ecf20Sopenharmony_ci */
458c2ecf20Sopenharmony_ci
468c2ecf20Sopenharmony_ci#include <linux/firmware.h>
478c2ecf20Sopenharmony_ci#include <linux/module.h>
488c2ecf20Sopenharmony_ci#include <drm/drm.h>
498c2ecf20Sopenharmony_ci
508c2ecf20Sopenharmony_ci#include "amdgpu.h"
518c2ecf20Sopenharmony_ci#include "amdgpu_amdkfd.h"
528c2ecf20Sopenharmony_ci
538c2ecf20Sopenharmony_ci/**
548c2ecf20Sopenharmony_ci * amdgpu_mn_invalidate_gfx - callback to notify about mm change
558c2ecf20Sopenharmony_ci *
568c2ecf20Sopenharmony_ci * @mni: the range (mm) is about to update
578c2ecf20Sopenharmony_ci * @range: details on the invalidation
588c2ecf20Sopenharmony_ci * @cur_seq: Value to pass to mmu_interval_set_seq()
598c2ecf20Sopenharmony_ci *
608c2ecf20Sopenharmony_ci * Block for operations on BOs to finish and mark pages as accessed and
618c2ecf20Sopenharmony_ci * potentially dirty.
628c2ecf20Sopenharmony_ci */
638c2ecf20Sopenharmony_cistatic bool amdgpu_mn_invalidate_gfx(struct mmu_interval_notifier *mni,
648c2ecf20Sopenharmony_ci				     const struct mmu_notifier_range *range,
658c2ecf20Sopenharmony_ci				     unsigned long cur_seq)
668c2ecf20Sopenharmony_ci{
678c2ecf20Sopenharmony_ci	struct amdgpu_bo *bo = container_of(mni, struct amdgpu_bo, notifier);
688c2ecf20Sopenharmony_ci	struct amdgpu_device *adev = amdgpu_ttm_adev(bo->tbo.bdev);
698c2ecf20Sopenharmony_ci	long r;
708c2ecf20Sopenharmony_ci
718c2ecf20Sopenharmony_ci	if (!mmu_notifier_range_blockable(range))
728c2ecf20Sopenharmony_ci		return false;
738c2ecf20Sopenharmony_ci
748c2ecf20Sopenharmony_ci	mutex_lock(&adev->notifier_lock);
758c2ecf20Sopenharmony_ci
768c2ecf20Sopenharmony_ci	mmu_interval_set_seq(mni, cur_seq);
778c2ecf20Sopenharmony_ci
788c2ecf20Sopenharmony_ci	r = dma_resv_wait_timeout_rcu(bo->tbo.base.resv, true, false,
798c2ecf20Sopenharmony_ci				      MAX_SCHEDULE_TIMEOUT);
808c2ecf20Sopenharmony_ci	mutex_unlock(&adev->notifier_lock);
818c2ecf20Sopenharmony_ci	if (r <= 0)
828c2ecf20Sopenharmony_ci		DRM_ERROR("(%ld) failed to wait for user bo\n", r);
838c2ecf20Sopenharmony_ci	return true;
848c2ecf20Sopenharmony_ci}
858c2ecf20Sopenharmony_ci
868c2ecf20Sopenharmony_cistatic const struct mmu_interval_notifier_ops amdgpu_mn_gfx_ops = {
878c2ecf20Sopenharmony_ci	.invalidate = amdgpu_mn_invalidate_gfx,
888c2ecf20Sopenharmony_ci};
898c2ecf20Sopenharmony_ci
908c2ecf20Sopenharmony_ci/**
918c2ecf20Sopenharmony_ci * amdgpu_mn_invalidate_hsa - callback to notify about mm change
928c2ecf20Sopenharmony_ci *
938c2ecf20Sopenharmony_ci * @mni: the range (mm) is about to update
948c2ecf20Sopenharmony_ci * @range: details on the invalidation
958c2ecf20Sopenharmony_ci * @cur_seq: Value to pass to mmu_interval_set_seq()
968c2ecf20Sopenharmony_ci *
978c2ecf20Sopenharmony_ci * We temporarily evict the BO attached to this range. This necessitates
988c2ecf20Sopenharmony_ci * evicting all user-mode queues of the process.
998c2ecf20Sopenharmony_ci */
1008c2ecf20Sopenharmony_cistatic bool amdgpu_mn_invalidate_hsa(struct mmu_interval_notifier *mni,
1018c2ecf20Sopenharmony_ci				     const struct mmu_notifier_range *range,
1028c2ecf20Sopenharmony_ci				     unsigned long cur_seq)
1038c2ecf20Sopenharmony_ci{
1048c2ecf20Sopenharmony_ci	struct amdgpu_bo *bo = container_of(mni, struct amdgpu_bo, notifier);
1058c2ecf20Sopenharmony_ci	struct amdgpu_device *adev = amdgpu_ttm_adev(bo->tbo.bdev);
1068c2ecf20Sopenharmony_ci
1078c2ecf20Sopenharmony_ci	if (!mmu_notifier_range_blockable(range))
1088c2ecf20Sopenharmony_ci		return false;
1098c2ecf20Sopenharmony_ci
1108c2ecf20Sopenharmony_ci	mutex_lock(&adev->notifier_lock);
1118c2ecf20Sopenharmony_ci
1128c2ecf20Sopenharmony_ci	mmu_interval_set_seq(mni, cur_seq);
1138c2ecf20Sopenharmony_ci
1148c2ecf20Sopenharmony_ci	amdgpu_amdkfd_evict_userptr(bo->kfd_bo, bo->notifier.mm);
1158c2ecf20Sopenharmony_ci	mutex_unlock(&adev->notifier_lock);
1168c2ecf20Sopenharmony_ci
1178c2ecf20Sopenharmony_ci	return true;
1188c2ecf20Sopenharmony_ci}
1198c2ecf20Sopenharmony_ci
1208c2ecf20Sopenharmony_cistatic const struct mmu_interval_notifier_ops amdgpu_mn_hsa_ops = {
1218c2ecf20Sopenharmony_ci	.invalidate = amdgpu_mn_invalidate_hsa,
1228c2ecf20Sopenharmony_ci};
1238c2ecf20Sopenharmony_ci
1248c2ecf20Sopenharmony_ci/**
1258c2ecf20Sopenharmony_ci * amdgpu_mn_register - register a BO for notifier updates
1268c2ecf20Sopenharmony_ci *
1278c2ecf20Sopenharmony_ci * @bo: amdgpu buffer object
1288c2ecf20Sopenharmony_ci * @addr: userptr addr we should monitor
1298c2ecf20Sopenharmony_ci *
1308c2ecf20Sopenharmony_ci * Registers a mmu_notifier for the given BO at the specified address.
1318c2ecf20Sopenharmony_ci * Returns 0 on success, -ERRNO if anything goes wrong.
1328c2ecf20Sopenharmony_ci */
1338c2ecf20Sopenharmony_ciint amdgpu_mn_register(struct amdgpu_bo *bo, unsigned long addr)
1348c2ecf20Sopenharmony_ci{
1358c2ecf20Sopenharmony_ci	if (bo->kfd_bo)
1368c2ecf20Sopenharmony_ci		return mmu_interval_notifier_insert(&bo->notifier, current->mm,
1378c2ecf20Sopenharmony_ci						    addr, amdgpu_bo_size(bo),
1388c2ecf20Sopenharmony_ci						    &amdgpu_mn_hsa_ops);
1398c2ecf20Sopenharmony_ci	return mmu_interval_notifier_insert(&bo->notifier, current->mm, addr,
1408c2ecf20Sopenharmony_ci					    amdgpu_bo_size(bo),
1418c2ecf20Sopenharmony_ci					    &amdgpu_mn_gfx_ops);
1428c2ecf20Sopenharmony_ci}
1438c2ecf20Sopenharmony_ci
1448c2ecf20Sopenharmony_ci/**
1458c2ecf20Sopenharmony_ci * amdgpu_mn_unregister - unregister a BO for notifier updates
1468c2ecf20Sopenharmony_ci *
1478c2ecf20Sopenharmony_ci * @bo: amdgpu buffer object
1488c2ecf20Sopenharmony_ci *
1498c2ecf20Sopenharmony_ci * Remove any registration of mmu notifier updates from the buffer object.
1508c2ecf20Sopenharmony_ci */
1518c2ecf20Sopenharmony_civoid amdgpu_mn_unregister(struct amdgpu_bo *bo)
1528c2ecf20Sopenharmony_ci{
1538c2ecf20Sopenharmony_ci	if (!bo->notifier.mm)
1548c2ecf20Sopenharmony_ci		return;
1558c2ecf20Sopenharmony_ci	mmu_interval_notifier_remove(&bo->notifier);
1568c2ecf20Sopenharmony_ci	bo->notifier.mm = NULL;
1578c2ecf20Sopenharmony_ci}
158