162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 OR MIT
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Copyright 2020-2021 Advanced Micro Devices, Inc.
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a
662306a36Sopenharmony_ci * copy of this software and associated documentation files (the "Software"),
762306a36Sopenharmony_ci * to deal in the Software without restriction, including without limitation
862306a36Sopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sublicense,
962306a36Sopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the
1062306a36Sopenharmony_ci * Software is furnished to do so, subject to the following conditions:
1162306a36Sopenharmony_ci *
1262306a36Sopenharmony_ci * The above copyright notice and this permission notice shall be included in
1362306a36Sopenharmony_ci * all copies or substantial portions of the Software.
1462306a36Sopenharmony_ci *
1562306a36Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
1662306a36Sopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
1762306a36Sopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
1862306a36Sopenharmony_ci * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
1962306a36Sopenharmony_ci * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
2062306a36Sopenharmony_ci * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
2162306a36Sopenharmony_ci * OTHER DEALINGS IN THE SOFTWARE.
2262306a36Sopenharmony_ci */
2362306a36Sopenharmony_ci#include <linux/types.h>
2462306a36Sopenharmony_ci#include <linux/hmm.h>
2562306a36Sopenharmony_ci#include <linux/dma-direction.h>
2662306a36Sopenharmony_ci#include <linux/dma-mapping.h>
2762306a36Sopenharmony_ci#include <linux/migrate.h>
2862306a36Sopenharmony_ci#include "amdgpu_sync.h"
2962306a36Sopenharmony_ci#include "amdgpu_object.h"
3062306a36Sopenharmony_ci#include "amdgpu_vm.h"
3162306a36Sopenharmony_ci#include "amdgpu_res_cursor.h"
3262306a36Sopenharmony_ci#include "kfd_priv.h"
3362306a36Sopenharmony_ci#include "kfd_svm.h"
3462306a36Sopenharmony_ci#include "kfd_migrate.h"
3562306a36Sopenharmony_ci#include "kfd_smi_events.h"
3662306a36Sopenharmony_ci
3762306a36Sopenharmony_ci#ifdef dev_fmt
3862306a36Sopenharmony_ci#undef dev_fmt
3962306a36Sopenharmony_ci#endif
4062306a36Sopenharmony_ci#define dev_fmt(fmt) "kfd_migrate: " fmt
4162306a36Sopenharmony_ci
4262306a36Sopenharmony_cistatic uint64_t
4362306a36Sopenharmony_cisvm_migrate_direct_mapping_addr(struct amdgpu_device *adev, uint64_t addr)
4462306a36Sopenharmony_ci{
4562306a36Sopenharmony_ci	return addr + amdgpu_ttm_domain_start(adev, TTM_PL_VRAM);
4662306a36Sopenharmony_ci}
4762306a36Sopenharmony_ci
4862306a36Sopenharmony_cistatic int
4962306a36Sopenharmony_cisvm_migrate_gart_map(struct amdgpu_ring *ring, uint64_t npages,
5062306a36Sopenharmony_ci		     dma_addr_t *addr, uint64_t *gart_addr, uint64_t flags)
5162306a36Sopenharmony_ci{
5262306a36Sopenharmony_ci	struct amdgpu_device *adev = ring->adev;
5362306a36Sopenharmony_ci	struct amdgpu_job *job;
5462306a36Sopenharmony_ci	unsigned int num_dw, num_bytes;
5562306a36Sopenharmony_ci	struct dma_fence *fence;
5662306a36Sopenharmony_ci	uint64_t src_addr, dst_addr;
5762306a36Sopenharmony_ci	uint64_t pte_flags;
5862306a36Sopenharmony_ci	void *cpu_addr;
5962306a36Sopenharmony_ci	int r;
6062306a36Sopenharmony_ci
6162306a36Sopenharmony_ci	/* use gart window 0 */
6262306a36Sopenharmony_ci	*gart_addr = adev->gmc.gart_start;
6362306a36Sopenharmony_ci
6462306a36Sopenharmony_ci	num_dw = ALIGN(adev->mman.buffer_funcs->copy_num_dw, 8);
6562306a36Sopenharmony_ci	num_bytes = npages * 8;
6662306a36Sopenharmony_ci
6762306a36Sopenharmony_ci	r = amdgpu_job_alloc_with_ib(adev, &adev->mman.high_pr,
6862306a36Sopenharmony_ci				     AMDGPU_FENCE_OWNER_UNDEFINED,
6962306a36Sopenharmony_ci				     num_dw * 4 + num_bytes,
7062306a36Sopenharmony_ci				     AMDGPU_IB_POOL_DELAYED,
7162306a36Sopenharmony_ci				     &job);
7262306a36Sopenharmony_ci	if (r)
7362306a36Sopenharmony_ci		return r;
7462306a36Sopenharmony_ci
7562306a36Sopenharmony_ci	src_addr = num_dw * 4;
7662306a36Sopenharmony_ci	src_addr += job->ibs[0].gpu_addr;
7762306a36Sopenharmony_ci
7862306a36Sopenharmony_ci	dst_addr = amdgpu_bo_gpu_offset(adev->gart.bo);
7962306a36Sopenharmony_ci	amdgpu_emit_copy_buffer(adev, &job->ibs[0], src_addr,
8062306a36Sopenharmony_ci				dst_addr, num_bytes, false);
8162306a36Sopenharmony_ci
8262306a36Sopenharmony_ci	amdgpu_ring_pad_ib(ring, &job->ibs[0]);
8362306a36Sopenharmony_ci	WARN_ON(job->ibs[0].length_dw > num_dw);
8462306a36Sopenharmony_ci
8562306a36Sopenharmony_ci	pte_flags = AMDGPU_PTE_VALID | AMDGPU_PTE_READABLE;
8662306a36Sopenharmony_ci	pte_flags |= AMDGPU_PTE_SYSTEM | AMDGPU_PTE_SNOOPED;
8762306a36Sopenharmony_ci	if (!(flags & KFD_IOCTL_SVM_FLAG_GPU_RO))
8862306a36Sopenharmony_ci		pte_flags |= AMDGPU_PTE_WRITEABLE;
8962306a36Sopenharmony_ci	pte_flags |= adev->gart.gart_pte_flags;
9062306a36Sopenharmony_ci
9162306a36Sopenharmony_ci	cpu_addr = &job->ibs[0].ptr[num_dw];
9262306a36Sopenharmony_ci
9362306a36Sopenharmony_ci	amdgpu_gart_map(adev, 0, npages, addr, pte_flags, cpu_addr);
9462306a36Sopenharmony_ci	fence = amdgpu_job_submit(job);
9562306a36Sopenharmony_ci	dma_fence_put(fence);
9662306a36Sopenharmony_ci
9762306a36Sopenharmony_ci	return r;
9862306a36Sopenharmony_ci}
9962306a36Sopenharmony_ci
10062306a36Sopenharmony_ci/**
10162306a36Sopenharmony_ci * svm_migrate_copy_memory_gart - sdma copy data between ram and vram
10262306a36Sopenharmony_ci *
10362306a36Sopenharmony_ci * @adev: amdgpu device the sdma ring running
10462306a36Sopenharmony_ci * @sys: system DMA pointer to be copied
10562306a36Sopenharmony_ci * @vram: vram destination DMA pointer
10662306a36Sopenharmony_ci * @npages: number of pages to copy
10762306a36Sopenharmony_ci * @direction: enum MIGRATION_COPY_DIR
10862306a36Sopenharmony_ci * @mfence: output, sdma fence to signal after sdma is done
10962306a36Sopenharmony_ci *
11062306a36Sopenharmony_ci * ram address uses GART table continuous entries mapping to ram pages,
11162306a36Sopenharmony_ci * vram address uses direct mapping of vram pages, which must have npages
11262306a36Sopenharmony_ci * number of continuous pages.
11362306a36Sopenharmony_ci * GART update and sdma uses same buf copy function ring, sdma is splited to
11462306a36Sopenharmony_ci * multiple GTT_MAX_PAGES transfer, all sdma operations are serialized, wait for
11562306a36Sopenharmony_ci * the last sdma finish fence which is returned to check copy memory is done.
11662306a36Sopenharmony_ci *
11762306a36Sopenharmony_ci * Context: Process context, takes and releases gtt_window_lock
11862306a36Sopenharmony_ci *
11962306a36Sopenharmony_ci * Return:
12062306a36Sopenharmony_ci * 0 - OK, otherwise error code
12162306a36Sopenharmony_ci */
12262306a36Sopenharmony_ci
12362306a36Sopenharmony_cistatic int
12462306a36Sopenharmony_cisvm_migrate_copy_memory_gart(struct amdgpu_device *adev, dma_addr_t *sys,
12562306a36Sopenharmony_ci			     uint64_t *vram, uint64_t npages,
12662306a36Sopenharmony_ci			     enum MIGRATION_COPY_DIR direction,
12762306a36Sopenharmony_ci			     struct dma_fence **mfence)
12862306a36Sopenharmony_ci{
12962306a36Sopenharmony_ci	const uint64_t GTT_MAX_PAGES = AMDGPU_GTT_MAX_TRANSFER_SIZE;
13062306a36Sopenharmony_ci	struct amdgpu_ring *ring = adev->mman.buffer_funcs_ring;
13162306a36Sopenharmony_ci	uint64_t gart_s, gart_d;
13262306a36Sopenharmony_ci	struct dma_fence *next;
13362306a36Sopenharmony_ci	uint64_t size;
13462306a36Sopenharmony_ci	int r;
13562306a36Sopenharmony_ci
13662306a36Sopenharmony_ci	mutex_lock(&adev->mman.gtt_window_lock);
13762306a36Sopenharmony_ci
13862306a36Sopenharmony_ci	while (npages) {
13962306a36Sopenharmony_ci		size = min(GTT_MAX_PAGES, npages);
14062306a36Sopenharmony_ci
14162306a36Sopenharmony_ci		if (direction == FROM_VRAM_TO_RAM) {
14262306a36Sopenharmony_ci			gart_s = svm_migrate_direct_mapping_addr(adev, *vram);
14362306a36Sopenharmony_ci			r = svm_migrate_gart_map(ring, size, sys, &gart_d, 0);
14462306a36Sopenharmony_ci
14562306a36Sopenharmony_ci		} else if (direction == FROM_RAM_TO_VRAM) {
14662306a36Sopenharmony_ci			r = svm_migrate_gart_map(ring, size, sys, &gart_s,
14762306a36Sopenharmony_ci						 KFD_IOCTL_SVM_FLAG_GPU_RO);
14862306a36Sopenharmony_ci			gart_d = svm_migrate_direct_mapping_addr(adev, *vram);
14962306a36Sopenharmony_ci		}
15062306a36Sopenharmony_ci		if (r) {
15162306a36Sopenharmony_ci			dev_err(adev->dev, "fail %d create gart mapping\n", r);
15262306a36Sopenharmony_ci			goto out_unlock;
15362306a36Sopenharmony_ci		}
15462306a36Sopenharmony_ci
15562306a36Sopenharmony_ci		r = amdgpu_copy_buffer(ring, gart_s, gart_d, size * PAGE_SIZE,
15662306a36Sopenharmony_ci				       NULL, &next, false, true, false);
15762306a36Sopenharmony_ci		if (r) {
15862306a36Sopenharmony_ci			dev_err(adev->dev, "fail %d to copy memory\n", r);
15962306a36Sopenharmony_ci			goto out_unlock;
16062306a36Sopenharmony_ci		}
16162306a36Sopenharmony_ci
16262306a36Sopenharmony_ci		dma_fence_put(*mfence);
16362306a36Sopenharmony_ci		*mfence = next;
16462306a36Sopenharmony_ci		npages -= size;
16562306a36Sopenharmony_ci		if (npages) {
16662306a36Sopenharmony_ci			sys += size;
16762306a36Sopenharmony_ci			vram += size;
16862306a36Sopenharmony_ci		}
16962306a36Sopenharmony_ci	}
17062306a36Sopenharmony_ci
17162306a36Sopenharmony_ciout_unlock:
17262306a36Sopenharmony_ci	mutex_unlock(&adev->mman.gtt_window_lock);
17362306a36Sopenharmony_ci
17462306a36Sopenharmony_ci	return r;
17562306a36Sopenharmony_ci}
17662306a36Sopenharmony_ci
17762306a36Sopenharmony_ci/**
17862306a36Sopenharmony_ci * svm_migrate_copy_done - wait for memory copy sdma is done
17962306a36Sopenharmony_ci *
18062306a36Sopenharmony_ci * @adev: amdgpu device the sdma memory copy is executing on
18162306a36Sopenharmony_ci * @mfence: migrate fence
18262306a36Sopenharmony_ci *
18362306a36Sopenharmony_ci * Wait for dma fence is signaled, if the copy ssplit into multiple sdma
18462306a36Sopenharmony_ci * operations, this is the last sdma operation fence.
18562306a36Sopenharmony_ci *
18662306a36Sopenharmony_ci * Context: called after svm_migrate_copy_memory
18762306a36Sopenharmony_ci *
18862306a36Sopenharmony_ci * Return:
18962306a36Sopenharmony_ci * 0		- success
19062306a36Sopenharmony_ci * otherwise	- error code from dma fence signal
19162306a36Sopenharmony_ci */
19262306a36Sopenharmony_cistatic int
19362306a36Sopenharmony_cisvm_migrate_copy_done(struct amdgpu_device *adev, struct dma_fence *mfence)
19462306a36Sopenharmony_ci{
19562306a36Sopenharmony_ci	int r = 0;
19662306a36Sopenharmony_ci
19762306a36Sopenharmony_ci	if (mfence) {
19862306a36Sopenharmony_ci		r = dma_fence_wait(mfence, false);
19962306a36Sopenharmony_ci		dma_fence_put(mfence);
20062306a36Sopenharmony_ci		pr_debug("sdma copy memory fence done\n");
20162306a36Sopenharmony_ci	}
20262306a36Sopenharmony_ci
20362306a36Sopenharmony_ci	return r;
20462306a36Sopenharmony_ci}
20562306a36Sopenharmony_ci
20662306a36Sopenharmony_ciunsigned long
20762306a36Sopenharmony_cisvm_migrate_addr_to_pfn(struct amdgpu_device *adev, unsigned long addr)
20862306a36Sopenharmony_ci{
20962306a36Sopenharmony_ci	return (addr + adev->kfd.pgmap.range.start) >> PAGE_SHIFT;
21062306a36Sopenharmony_ci}
21162306a36Sopenharmony_ci
21262306a36Sopenharmony_cistatic void
21362306a36Sopenharmony_cisvm_migrate_get_vram_page(struct svm_range *prange, unsigned long pfn)
21462306a36Sopenharmony_ci{
21562306a36Sopenharmony_ci	struct page *page;
21662306a36Sopenharmony_ci
21762306a36Sopenharmony_ci	page = pfn_to_page(pfn);
21862306a36Sopenharmony_ci	svm_range_bo_ref(prange->svm_bo);
21962306a36Sopenharmony_ci	page->zone_device_data = prange->svm_bo;
22062306a36Sopenharmony_ci	zone_device_page_init(page);
22162306a36Sopenharmony_ci}
22262306a36Sopenharmony_ci
/*
 * Release the device page that backs VRAM offset @addr: unlock it and drop
 * one page reference.
 */
static void
svm_migrate_put_vram_page(struct amdgpu_device *adev, unsigned long addr)
{
	unsigned long pfn = svm_migrate_addr_to_pfn(adev, addr);
	struct page *vram_page = pfn_to_page(pfn);

	unlock_page(vram_page);
	put_page(vram_page);
}
23262306a36Sopenharmony_ci
23362306a36Sopenharmony_cistatic unsigned long
23462306a36Sopenharmony_cisvm_migrate_addr(struct amdgpu_device *adev, struct page *page)
23562306a36Sopenharmony_ci{
23662306a36Sopenharmony_ci	unsigned long addr;
23762306a36Sopenharmony_ci
23862306a36Sopenharmony_ci	addr = page_to_pfn(page) << PAGE_SHIFT;
23962306a36Sopenharmony_ci	return (addr - adev->kfd.pgmap.range.start);
24062306a36Sopenharmony_ci}
24162306a36Sopenharmony_ci
24262306a36Sopenharmony_cistatic struct page *
24362306a36Sopenharmony_cisvm_migrate_get_sys_page(struct vm_area_struct *vma, unsigned long addr)
24462306a36Sopenharmony_ci{
24562306a36Sopenharmony_ci	struct page *page;
24662306a36Sopenharmony_ci
24762306a36Sopenharmony_ci	page = alloc_page_vma(GFP_HIGHUSER, vma, addr);
24862306a36Sopenharmony_ci	if (page)
24962306a36Sopenharmony_ci		lock_page(page);
25062306a36Sopenharmony_ci
25162306a36Sopenharmony_ci	return page;
25262306a36Sopenharmony_ci}
25362306a36Sopenharmony_ci
25462306a36Sopenharmony_cistatic void svm_migrate_put_sys_page(unsigned long addr)
25562306a36Sopenharmony_ci{
25662306a36Sopenharmony_ci	struct page *page;
25762306a36Sopenharmony_ci
25862306a36Sopenharmony_ci	page = pfn_to_page(addr >> PAGE_SHIFT);
25962306a36Sopenharmony_ci	unlock_page(page);
26062306a36Sopenharmony_ci	put_page(page);
26162306a36Sopenharmony_ci}
26262306a36Sopenharmony_ci
26362306a36Sopenharmony_cistatic unsigned long svm_migrate_successful_pages(struct migrate_vma *migrate)
26462306a36Sopenharmony_ci{
26562306a36Sopenharmony_ci	unsigned long cpages = 0;
26662306a36Sopenharmony_ci	unsigned long i;
26762306a36Sopenharmony_ci
26862306a36Sopenharmony_ci	for (i = 0; i < migrate->npages; i++) {
26962306a36Sopenharmony_ci		if (migrate->src[i] & MIGRATE_PFN_VALID &&
27062306a36Sopenharmony_ci		    migrate->src[i] & MIGRATE_PFN_MIGRATE)
27162306a36Sopenharmony_ci			cpages++;
27262306a36Sopenharmony_ci	}
27362306a36Sopenharmony_ci	return cpages;
27462306a36Sopenharmony_ci}
27562306a36Sopenharmony_ci
27662306a36Sopenharmony_cistatic unsigned long svm_migrate_unsuccessful_pages(struct migrate_vma *migrate)
27762306a36Sopenharmony_ci{
27862306a36Sopenharmony_ci	unsigned long upages = 0;
27962306a36Sopenharmony_ci	unsigned long i;
28062306a36Sopenharmony_ci
28162306a36Sopenharmony_ci	for (i = 0; i < migrate->npages; i++) {
28262306a36Sopenharmony_ci		if (migrate->src[i] & MIGRATE_PFN_VALID &&
28362306a36Sopenharmony_ci		    !(migrate->src[i] & MIGRATE_PFN_MIGRATE))
28462306a36Sopenharmony_ci			upages++;
28562306a36Sopenharmony_ci	}
28662306a36Sopenharmony_ci	return upages;
28762306a36Sopenharmony_ci}
28862306a36Sopenharmony_ci
28962306a36Sopenharmony_cistatic int
29062306a36Sopenharmony_cisvm_migrate_copy_to_vram(struct kfd_node *node, struct svm_range *prange,
29162306a36Sopenharmony_ci			 struct migrate_vma *migrate, struct dma_fence **mfence,
29262306a36Sopenharmony_ci			 dma_addr_t *scratch, uint64_t ttm_res_offset)
29362306a36Sopenharmony_ci{
29462306a36Sopenharmony_ci	uint64_t npages = migrate->cpages;
29562306a36Sopenharmony_ci	struct amdgpu_device *adev = node->adev;
29662306a36Sopenharmony_ci	struct device *dev = adev->dev;
29762306a36Sopenharmony_ci	struct amdgpu_res_cursor cursor;
29862306a36Sopenharmony_ci	dma_addr_t *src;
29962306a36Sopenharmony_ci	uint64_t *dst;
30062306a36Sopenharmony_ci	uint64_t i, j;
30162306a36Sopenharmony_ci	int r;
30262306a36Sopenharmony_ci
30362306a36Sopenharmony_ci	pr_debug("svms 0x%p [0x%lx 0x%lx 0x%llx]\n", prange->svms, prange->start,
30462306a36Sopenharmony_ci		 prange->last, ttm_res_offset);
30562306a36Sopenharmony_ci
30662306a36Sopenharmony_ci	src = scratch;
30762306a36Sopenharmony_ci	dst = (uint64_t *)(scratch + npages);
30862306a36Sopenharmony_ci
30962306a36Sopenharmony_ci	amdgpu_res_first(prange->ttm_res, ttm_res_offset,
31062306a36Sopenharmony_ci			 npages << PAGE_SHIFT, &cursor);
31162306a36Sopenharmony_ci	for (i = j = 0; i < npages; i++) {
31262306a36Sopenharmony_ci		struct page *spage;
31362306a36Sopenharmony_ci
31462306a36Sopenharmony_ci		dst[i] = cursor.start + (j << PAGE_SHIFT);
31562306a36Sopenharmony_ci		migrate->dst[i] = svm_migrate_addr_to_pfn(adev, dst[i]);
31662306a36Sopenharmony_ci		svm_migrate_get_vram_page(prange, migrate->dst[i]);
31762306a36Sopenharmony_ci		migrate->dst[i] = migrate_pfn(migrate->dst[i]);
31862306a36Sopenharmony_ci
31962306a36Sopenharmony_ci		spage = migrate_pfn_to_page(migrate->src[i]);
32062306a36Sopenharmony_ci		if (spage && !is_zone_device_page(spage)) {
32162306a36Sopenharmony_ci			src[i] = dma_map_page(dev, spage, 0, PAGE_SIZE,
32262306a36Sopenharmony_ci					      DMA_TO_DEVICE);
32362306a36Sopenharmony_ci			r = dma_mapping_error(dev, src[i]);
32462306a36Sopenharmony_ci			if (r) {
32562306a36Sopenharmony_ci				dev_err(dev, "%s: fail %d dma_map_page\n",
32662306a36Sopenharmony_ci					__func__, r);
32762306a36Sopenharmony_ci				goto out_free_vram_pages;
32862306a36Sopenharmony_ci			}
32962306a36Sopenharmony_ci		} else {
33062306a36Sopenharmony_ci			if (j) {
33162306a36Sopenharmony_ci				r = svm_migrate_copy_memory_gart(
33262306a36Sopenharmony_ci						adev, src + i - j,
33362306a36Sopenharmony_ci						dst + i - j, j,
33462306a36Sopenharmony_ci						FROM_RAM_TO_VRAM,
33562306a36Sopenharmony_ci						mfence);
33662306a36Sopenharmony_ci				if (r)
33762306a36Sopenharmony_ci					goto out_free_vram_pages;
33862306a36Sopenharmony_ci				amdgpu_res_next(&cursor, (j + 1) << PAGE_SHIFT);
33962306a36Sopenharmony_ci				j = 0;
34062306a36Sopenharmony_ci			} else {
34162306a36Sopenharmony_ci				amdgpu_res_next(&cursor, PAGE_SIZE);
34262306a36Sopenharmony_ci			}
34362306a36Sopenharmony_ci			continue;
34462306a36Sopenharmony_ci		}
34562306a36Sopenharmony_ci
34662306a36Sopenharmony_ci		pr_debug_ratelimited("dma mapping src to 0x%llx, pfn 0x%lx\n",
34762306a36Sopenharmony_ci				     src[i] >> PAGE_SHIFT, page_to_pfn(spage));
34862306a36Sopenharmony_ci
34962306a36Sopenharmony_ci		if (j >= (cursor.size >> PAGE_SHIFT) - 1 && i < npages - 1) {
35062306a36Sopenharmony_ci			r = svm_migrate_copy_memory_gart(adev, src + i - j,
35162306a36Sopenharmony_ci							 dst + i - j, j + 1,
35262306a36Sopenharmony_ci							 FROM_RAM_TO_VRAM,
35362306a36Sopenharmony_ci							 mfence);
35462306a36Sopenharmony_ci			if (r)
35562306a36Sopenharmony_ci				goto out_free_vram_pages;
35662306a36Sopenharmony_ci			amdgpu_res_next(&cursor, (j + 1) * PAGE_SIZE);
35762306a36Sopenharmony_ci			j = 0;
35862306a36Sopenharmony_ci		} else {
35962306a36Sopenharmony_ci			j++;
36062306a36Sopenharmony_ci		}
36162306a36Sopenharmony_ci	}
36262306a36Sopenharmony_ci
36362306a36Sopenharmony_ci	r = svm_migrate_copy_memory_gart(adev, src + i - j, dst + i - j, j,
36462306a36Sopenharmony_ci					 FROM_RAM_TO_VRAM, mfence);
36562306a36Sopenharmony_ci
36662306a36Sopenharmony_ciout_free_vram_pages:
36762306a36Sopenharmony_ci	if (r) {
36862306a36Sopenharmony_ci		pr_debug("failed %d to copy memory to vram\n", r);
36962306a36Sopenharmony_ci		while (i--) {
37062306a36Sopenharmony_ci			svm_migrate_put_vram_page(adev, dst[i]);
37162306a36Sopenharmony_ci			migrate->dst[i] = 0;
37262306a36Sopenharmony_ci		}
37362306a36Sopenharmony_ci	}
37462306a36Sopenharmony_ci
37562306a36Sopenharmony_ci#ifdef DEBUG_FORCE_MIXED_DOMAINS
37662306a36Sopenharmony_ci	for (i = 0, j = 0; i < npages; i += 4, j++) {
37762306a36Sopenharmony_ci		if (j & 1)
37862306a36Sopenharmony_ci			continue;
37962306a36Sopenharmony_ci		svm_migrate_put_vram_page(adev, dst[i]);
38062306a36Sopenharmony_ci		migrate->dst[i] = 0;
38162306a36Sopenharmony_ci		svm_migrate_put_vram_page(adev, dst[i + 1]);
38262306a36Sopenharmony_ci		migrate->dst[i + 1] = 0;
38362306a36Sopenharmony_ci		svm_migrate_put_vram_page(adev, dst[i + 2]);
38462306a36Sopenharmony_ci		migrate->dst[i + 2] = 0;
38562306a36Sopenharmony_ci		svm_migrate_put_vram_page(adev, dst[i + 3]);
38662306a36Sopenharmony_ci		migrate->dst[i + 3] = 0;
38762306a36Sopenharmony_ci	}
38862306a36Sopenharmony_ci#endif
38962306a36Sopenharmony_ci
39062306a36Sopenharmony_ci	return r;
39162306a36Sopenharmony_ci}
39262306a36Sopenharmony_ci
39362306a36Sopenharmony_cistatic long
39462306a36Sopenharmony_cisvm_migrate_vma_to_vram(struct kfd_node *node, struct svm_range *prange,
39562306a36Sopenharmony_ci			struct vm_area_struct *vma, uint64_t start,
39662306a36Sopenharmony_ci			uint64_t end, uint32_t trigger, uint64_t ttm_res_offset)
39762306a36Sopenharmony_ci{
39862306a36Sopenharmony_ci	struct kfd_process *p = container_of(prange->svms, struct kfd_process, svms);
39962306a36Sopenharmony_ci	uint64_t npages = (end - start) >> PAGE_SHIFT;
40062306a36Sopenharmony_ci	struct amdgpu_device *adev = node->adev;
40162306a36Sopenharmony_ci	struct kfd_process_device *pdd;
40262306a36Sopenharmony_ci	struct dma_fence *mfence = NULL;
40362306a36Sopenharmony_ci	struct migrate_vma migrate = { 0 };
40462306a36Sopenharmony_ci	unsigned long cpages = 0;
40562306a36Sopenharmony_ci	dma_addr_t *scratch;
40662306a36Sopenharmony_ci	void *buf;
40762306a36Sopenharmony_ci	int r = -ENOMEM;
40862306a36Sopenharmony_ci
40962306a36Sopenharmony_ci	memset(&migrate, 0, sizeof(migrate));
41062306a36Sopenharmony_ci	migrate.vma = vma;
41162306a36Sopenharmony_ci	migrate.start = start;
41262306a36Sopenharmony_ci	migrate.end = end;
41362306a36Sopenharmony_ci	migrate.flags = MIGRATE_VMA_SELECT_SYSTEM;
41462306a36Sopenharmony_ci	migrate.pgmap_owner = SVM_ADEV_PGMAP_OWNER(adev);
41562306a36Sopenharmony_ci
41662306a36Sopenharmony_ci	buf = kvcalloc(npages,
41762306a36Sopenharmony_ci		       2 * sizeof(*migrate.src) + sizeof(uint64_t) + sizeof(dma_addr_t),
41862306a36Sopenharmony_ci		       GFP_KERNEL);
41962306a36Sopenharmony_ci	if (!buf)
42062306a36Sopenharmony_ci		goto out;
42162306a36Sopenharmony_ci
42262306a36Sopenharmony_ci	migrate.src = buf;
42362306a36Sopenharmony_ci	migrate.dst = migrate.src + npages;
42462306a36Sopenharmony_ci	scratch = (dma_addr_t *)(migrate.dst + npages);
42562306a36Sopenharmony_ci
42662306a36Sopenharmony_ci	kfd_smi_event_migration_start(node, p->lead_thread->pid,
42762306a36Sopenharmony_ci				      start >> PAGE_SHIFT, end >> PAGE_SHIFT,
42862306a36Sopenharmony_ci				      0, node->id, prange->prefetch_loc,
42962306a36Sopenharmony_ci				      prange->preferred_loc, trigger);
43062306a36Sopenharmony_ci
43162306a36Sopenharmony_ci	r = migrate_vma_setup(&migrate);
43262306a36Sopenharmony_ci	if (r) {
43362306a36Sopenharmony_ci		dev_err(adev->dev, "%s: vma setup fail %d range [0x%lx 0x%lx]\n",
43462306a36Sopenharmony_ci			__func__, r, prange->start, prange->last);
43562306a36Sopenharmony_ci		goto out_free;
43662306a36Sopenharmony_ci	}
43762306a36Sopenharmony_ci
43862306a36Sopenharmony_ci	cpages = migrate.cpages;
43962306a36Sopenharmony_ci	if (!cpages) {
44062306a36Sopenharmony_ci		pr_debug("failed collect migrate sys pages [0x%lx 0x%lx]\n",
44162306a36Sopenharmony_ci			 prange->start, prange->last);
44262306a36Sopenharmony_ci		goto out_free;
44362306a36Sopenharmony_ci	}
44462306a36Sopenharmony_ci	if (cpages != npages)
44562306a36Sopenharmony_ci		pr_debug("partial migration, 0x%lx/0x%llx pages migrated\n",
44662306a36Sopenharmony_ci			 cpages, npages);
44762306a36Sopenharmony_ci	else
44862306a36Sopenharmony_ci		pr_debug("0x%lx pages migrated\n", cpages);
44962306a36Sopenharmony_ci
45062306a36Sopenharmony_ci	r = svm_migrate_copy_to_vram(node, prange, &migrate, &mfence, scratch, ttm_res_offset);
45162306a36Sopenharmony_ci	migrate_vma_pages(&migrate);
45262306a36Sopenharmony_ci
45362306a36Sopenharmony_ci	pr_debug("successful/cpages/npages 0x%lx/0x%lx/0x%lx\n",
45462306a36Sopenharmony_ci		svm_migrate_successful_pages(&migrate), cpages, migrate.npages);
45562306a36Sopenharmony_ci
45662306a36Sopenharmony_ci	svm_migrate_copy_done(adev, mfence);
45762306a36Sopenharmony_ci	migrate_vma_finalize(&migrate);
45862306a36Sopenharmony_ci
45962306a36Sopenharmony_ci	kfd_smi_event_migration_end(node, p->lead_thread->pid,
46062306a36Sopenharmony_ci				    start >> PAGE_SHIFT, end >> PAGE_SHIFT,
46162306a36Sopenharmony_ci				    0, node->id, trigger);
46262306a36Sopenharmony_ci
46362306a36Sopenharmony_ci	svm_range_dma_unmap(adev->dev, scratch, 0, npages);
46462306a36Sopenharmony_ci
46562306a36Sopenharmony_ciout_free:
46662306a36Sopenharmony_ci	kvfree(buf);
46762306a36Sopenharmony_ciout:
46862306a36Sopenharmony_ci	if (!r && cpages) {
46962306a36Sopenharmony_ci		pdd = svm_range_get_pdd_by_node(prange, node);
47062306a36Sopenharmony_ci		if (pdd)
47162306a36Sopenharmony_ci			WRITE_ONCE(pdd->page_in, pdd->page_in + cpages);
47262306a36Sopenharmony_ci
47362306a36Sopenharmony_ci		return cpages;
47462306a36Sopenharmony_ci	}
47562306a36Sopenharmony_ci	return r;
47662306a36Sopenharmony_ci}
47762306a36Sopenharmony_ci
47862306a36Sopenharmony_ci/**
47962306a36Sopenharmony_ci * svm_migrate_ram_to_vram - migrate svm range from system to device
48062306a36Sopenharmony_ci * @prange: range structure
48162306a36Sopenharmony_ci * @best_loc: the device to migrate to
48262306a36Sopenharmony_ci * @mm: the process mm structure
48362306a36Sopenharmony_ci * @trigger: reason of migration
48462306a36Sopenharmony_ci *
48562306a36Sopenharmony_ci * Context: Process context, caller hold mmap read lock, svms lock, prange lock
48662306a36Sopenharmony_ci *
48762306a36Sopenharmony_ci * Return:
48862306a36Sopenharmony_ci * 0 - OK, otherwise error code
48962306a36Sopenharmony_ci */
49062306a36Sopenharmony_cistatic int
49162306a36Sopenharmony_cisvm_migrate_ram_to_vram(struct svm_range *prange, uint32_t best_loc,
49262306a36Sopenharmony_ci			struct mm_struct *mm, uint32_t trigger)
49362306a36Sopenharmony_ci{
49462306a36Sopenharmony_ci	unsigned long addr, start, end;
49562306a36Sopenharmony_ci	struct vm_area_struct *vma;
49662306a36Sopenharmony_ci	uint64_t ttm_res_offset;
49762306a36Sopenharmony_ci	struct kfd_node *node;
49862306a36Sopenharmony_ci	unsigned long cpages = 0;
49962306a36Sopenharmony_ci	long r = 0;
50062306a36Sopenharmony_ci
50162306a36Sopenharmony_ci	if (prange->actual_loc == best_loc) {
50262306a36Sopenharmony_ci		pr_debug("svms 0x%p [0x%lx 0x%lx] already on best_loc 0x%x\n",
50362306a36Sopenharmony_ci			 prange->svms, prange->start, prange->last, best_loc);
50462306a36Sopenharmony_ci		return 0;
50562306a36Sopenharmony_ci	}
50662306a36Sopenharmony_ci
50762306a36Sopenharmony_ci	node = svm_range_get_node_by_id(prange, best_loc);
50862306a36Sopenharmony_ci	if (!node) {
50962306a36Sopenharmony_ci		pr_debug("failed to get kfd node by id 0x%x\n", best_loc);
51062306a36Sopenharmony_ci		return -ENODEV;
51162306a36Sopenharmony_ci	}
51262306a36Sopenharmony_ci
51362306a36Sopenharmony_ci	pr_debug("svms 0x%p [0x%lx 0x%lx] to gpu 0x%x\n", prange->svms,
51462306a36Sopenharmony_ci		 prange->start, prange->last, best_loc);
51562306a36Sopenharmony_ci
51662306a36Sopenharmony_ci	start = prange->start << PAGE_SHIFT;
51762306a36Sopenharmony_ci	end = (prange->last + 1) << PAGE_SHIFT;
51862306a36Sopenharmony_ci
51962306a36Sopenharmony_ci	r = svm_range_vram_node_new(node, prange, true);
52062306a36Sopenharmony_ci	if (r) {
52162306a36Sopenharmony_ci		dev_dbg(node->adev->dev, "fail %ld to alloc vram\n", r);
52262306a36Sopenharmony_ci		return r;
52362306a36Sopenharmony_ci	}
52462306a36Sopenharmony_ci	ttm_res_offset = prange->offset << PAGE_SHIFT;
52562306a36Sopenharmony_ci
52662306a36Sopenharmony_ci	for (addr = start; addr < end;) {
52762306a36Sopenharmony_ci		unsigned long next;
52862306a36Sopenharmony_ci
52962306a36Sopenharmony_ci		vma = vma_lookup(mm, addr);
53062306a36Sopenharmony_ci		if (!vma)
53162306a36Sopenharmony_ci			break;
53262306a36Sopenharmony_ci
53362306a36Sopenharmony_ci		next = min(vma->vm_end, end);
53462306a36Sopenharmony_ci		r = svm_migrate_vma_to_vram(node, prange, vma, addr, next, trigger, ttm_res_offset);
53562306a36Sopenharmony_ci		if (r < 0) {
53662306a36Sopenharmony_ci			pr_debug("failed %ld to migrate\n", r);
53762306a36Sopenharmony_ci			break;
53862306a36Sopenharmony_ci		} else {
53962306a36Sopenharmony_ci			cpages += r;
54062306a36Sopenharmony_ci		}
54162306a36Sopenharmony_ci		ttm_res_offset += next - addr;
54262306a36Sopenharmony_ci		addr = next;
54362306a36Sopenharmony_ci	}
54462306a36Sopenharmony_ci
54562306a36Sopenharmony_ci	if (cpages) {
54662306a36Sopenharmony_ci		prange->actual_loc = best_loc;
54762306a36Sopenharmony_ci		svm_range_free_dma_mappings(prange, true);
54862306a36Sopenharmony_ci	} else {
54962306a36Sopenharmony_ci		svm_range_vram_node_free(prange);
55062306a36Sopenharmony_ci	}
55162306a36Sopenharmony_ci
55262306a36Sopenharmony_ci	return r < 0 ? r : 0;
55362306a36Sopenharmony_ci}
55462306a36Sopenharmony_ci
55562306a36Sopenharmony_cistatic void svm_migrate_page_free(struct page *page)
55662306a36Sopenharmony_ci{
55762306a36Sopenharmony_ci	struct svm_range_bo *svm_bo = page->zone_device_data;
55862306a36Sopenharmony_ci
55962306a36Sopenharmony_ci	if (svm_bo) {
56062306a36Sopenharmony_ci		pr_debug_ratelimited("ref: %d\n", kref_read(&svm_bo->kref));
56162306a36Sopenharmony_ci		svm_range_bo_unref_async(svm_bo);
56262306a36Sopenharmony_ci	}
56362306a36Sopenharmony_ci}
56462306a36Sopenharmony_ci
56562306a36Sopenharmony_cistatic int
56662306a36Sopenharmony_cisvm_migrate_copy_to_ram(struct amdgpu_device *adev, struct svm_range *prange,
56762306a36Sopenharmony_ci			struct migrate_vma *migrate, struct dma_fence **mfence,
56862306a36Sopenharmony_ci			dma_addr_t *scratch, uint64_t npages)
56962306a36Sopenharmony_ci{
57062306a36Sopenharmony_ci	struct device *dev = adev->dev;
57162306a36Sopenharmony_ci	uint64_t *src;
57262306a36Sopenharmony_ci	dma_addr_t *dst;
57362306a36Sopenharmony_ci	struct page *dpage;
57462306a36Sopenharmony_ci	uint64_t i = 0, j;
57562306a36Sopenharmony_ci	uint64_t addr;
57662306a36Sopenharmony_ci	int r = 0;
57762306a36Sopenharmony_ci
57862306a36Sopenharmony_ci	pr_debug("svms 0x%p [0x%lx 0x%lx]\n", prange->svms, prange->start,
57962306a36Sopenharmony_ci		 prange->last);
58062306a36Sopenharmony_ci
58162306a36Sopenharmony_ci	addr = prange->start << PAGE_SHIFT;
58262306a36Sopenharmony_ci
58362306a36Sopenharmony_ci	src = (uint64_t *)(scratch + npages);
58462306a36Sopenharmony_ci	dst = scratch;
58562306a36Sopenharmony_ci
58662306a36Sopenharmony_ci	for (i = 0, j = 0; i < npages; i++, addr += PAGE_SIZE) {
58762306a36Sopenharmony_ci		struct page *spage;
58862306a36Sopenharmony_ci
58962306a36Sopenharmony_ci		spage = migrate_pfn_to_page(migrate->src[i]);
59062306a36Sopenharmony_ci		if (!spage || !is_zone_device_page(spage)) {
59162306a36Sopenharmony_ci			pr_debug("invalid page. Could be in CPU already svms 0x%p [0x%lx 0x%lx]\n",
59262306a36Sopenharmony_ci				 prange->svms, prange->start, prange->last);
59362306a36Sopenharmony_ci			if (j) {
59462306a36Sopenharmony_ci				r = svm_migrate_copy_memory_gart(adev, dst + i - j,
59562306a36Sopenharmony_ci								 src + i - j, j,
59662306a36Sopenharmony_ci								 FROM_VRAM_TO_RAM,
59762306a36Sopenharmony_ci								 mfence);
59862306a36Sopenharmony_ci				if (r)
59962306a36Sopenharmony_ci					goto out_oom;
60062306a36Sopenharmony_ci				j = 0;
60162306a36Sopenharmony_ci			}
60262306a36Sopenharmony_ci			continue;
60362306a36Sopenharmony_ci		}
60462306a36Sopenharmony_ci		src[i] = svm_migrate_addr(adev, spage);
60562306a36Sopenharmony_ci		if (j > 0 && src[i] != src[i - 1] + PAGE_SIZE) {
60662306a36Sopenharmony_ci			r = svm_migrate_copy_memory_gart(adev, dst + i - j,
60762306a36Sopenharmony_ci							 src + i - j, j,
60862306a36Sopenharmony_ci							 FROM_VRAM_TO_RAM,
60962306a36Sopenharmony_ci							 mfence);
61062306a36Sopenharmony_ci			if (r)
61162306a36Sopenharmony_ci				goto out_oom;
61262306a36Sopenharmony_ci			j = 0;
61362306a36Sopenharmony_ci		}
61462306a36Sopenharmony_ci
61562306a36Sopenharmony_ci		dpage = svm_migrate_get_sys_page(migrate->vma, addr);
61662306a36Sopenharmony_ci		if (!dpage) {
61762306a36Sopenharmony_ci			pr_debug("failed get page svms 0x%p [0x%lx 0x%lx]\n",
61862306a36Sopenharmony_ci				 prange->svms, prange->start, prange->last);
61962306a36Sopenharmony_ci			r = -ENOMEM;
62062306a36Sopenharmony_ci			goto out_oom;
62162306a36Sopenharmony_ci		}
62262306a36Sopenharmony_ci
62362306a36Sopenharmony_ci		dst[i] = dma_map_page(dev, dpage, 0, PAGE_SIZE, DMA_FROM_DEVICE);
62462306a36Sopenharmony_ci		r = dma_mapping_error(dev, dst[i]);
62562306a36Sopenharmony_ci		if (r) {
62662306a36Sopenharmony_ci			dev_err(adev->dev, "%s: fail %d dma_map_page\n", __func__, r);
62762306a36Sopenharmony_ci			goto out_oom;
62862306a36Sopenharmony_ci		}
62962306a36Sopenharmony_ci
63062306a36Sopenharmony_ci		pr_debug_ratelimited("dma mapping dst to 0x%llx, pfn 0x%lx\n",
63162306a36Sopenharmony_ci				     dst[i] >> PAGE_SHIFT, page_to_pfn(dpage));
63262306a36Sopenharmony_ci
63362306a36Sopenharmony_ci		migrate->dst[i] = migrate_pfn(page_to_pfn(dpage));
63462306a36Sopenharmony_ci		j++;
63562306a36Sopenharmony_ci	}
63662306a36Sopenharmony_ci
63762306a36Sopenharmony_ci	r = svm_migrate_copy_memory_gart(adev, dst + i - j, src + i - j, j,
63862306a36Sopenharmony_ci					 FROM_VRAM_TO_RAM, mfence);
63962306a36Sopenharmony_ci
64062306a36Sopenharmony_ciout_oom:
64162306a36Sopenharmony_ci	if (r) {
64262306a36Sopenharmony_ci		pr_debug("failed %d copy to ram\n", r);
64362306a36Sopenharmony_ci		while (i--) {
64462306a36Sopenharmony_ci			svm_migrate_put_sys_page(dst[i]);
64562306a36Sopenharmony_ci			migrate->dst[i] = 0;
64662306a36Sopenharmony_ci		}
64762306a36Sopenharmony_ci	}
64862306a36Sopenharmony_ci
64962306a36Sopenharmony_ci	return r;
65062306a36Sopenharmony_ci}
65162306a36Sopenharmony_ci
65262306a36Sopenharmony_ci/**
65362306a36Sopenharmony_ci * svm_migrate_vma_to_ram - migrate range inside one vma from device to system
65462306a36Sopenharmony_ci *
65562306a36Sopenharmony_ci * @prange: svm range structure
65662306a36Sopenharmony_ci * @vma: vm_area_struct that range [start, end] belongs to
65762306a36Sopenharmony_ci * @start: range start virtual address in pages
65862306a36Sopenharmony_ci * @end: range end virtual address in pages
65962306a36Sopenharmony_ci * @node: kfd node device to migrate from
66062306a36Sopenharmony_ci * @trigger: reason of migration
66162306a36Sopenharmony_ci * @fault_page: is from vmf->page, svm_migrate_to_ram(), this is CPU page fault callback
66262306a36Sopenharmony_ci *
66362306a36Sopenharmony_ci * Context: Process context, caller hold mmap read lock, prange->migrate_mutex
66462306a36Sopenharmony_ci *
66562306a36Sopenharmony_ci * Return:
66662306a36Sopenharmony_ci *   0 - success with all pages migrated
66762306a36Sopenharmony_ci *   negative values - indicate error
66862306a36Sopenharmony_ci *   positive values - partial migration, number of pages not migrated
66962306a36Sopenharmony_ci */
67062306a36Sopenharmony_cistatic long
67162306a36Sopenharmony_cisvm_migrate_vma_to_ram(struct kfd_node *node, struct svm_range *prange,
67262306a36Sopenharmony_ci		       struct vm_area_struct *vma, uint64_t start, uint64_t end,
67362306a36Sopenharmony_ci		       uint32_t trigger, struct page *fault_page)
67462306a36Sopenharmony_ci{
67562306a36Sopenharmony_ci	struct kfd_process *p = container_of(prange->svms, struct kfd_process, svms);
67662306a36Sopenharmony_ci	uint64_t npages = (end - start) >> PAGE_SHIFT;
67762306a36Sopenharmony_ci	unsigned long upages = npages;
67862306a36Sopenharmony_ci	unsigned long cpages = 0;
67962306a36Sopenharmony_ci	struct amdgpu_device *adev = node->adev;
68062306a36Sopenharmony_ci	struct kfd_process_device *pdd;
68162306a36Sopenharmony_ci	struct dma_fence *mfence = NULL;
68262306a36Sopenharmony_ci	struct migrate_vma migrate = { 0 };
68362306a36Sopenharmony_ci	dma_addr_t *scratch;
68462306a36Sopenharmony_ci	void *buf;
68562306a36Sopenharmony_ci	int r = -ENOMEM;
68662306a36Sopenharmony_ci
68762306a36Sopenharmony_ci	memset(&migrate, 0, sizeof(migrate));
68862306a36Sopenharmony_ci	migrate.vma = vma;
68962306a36Sopenharmony_ci	migrate.start = start;
69062306a36Sopenharmony_ci	migrate.end = end;
69162306a36Sopenharmony_ci	migrate.pgmap_owner = SVM_ADEV_PGMAP_OWNER(adev);
69262306a36Sopenharmony_ci	if (adev->gmc.xgmi.connected_to_cpu)
69362306a36Sopenharmony_ci		migrate.flags = MIGRATE_VMA_SELECT_DEVICE_COHERENT;
69462306a36Sopenharmony_ci	else
69562306a36Sopenharmony_ci		migrate.flags = MIGRATE_VMA_SELECT_DEVICE_PRIVATE;
69662306a36Sopenharmony_ci
69762306a36Sopenharmony_ci	buf = kvcalloc(npages,
69862306a36Sopenharmony_ci		       2 * sizeof(*migrate.src) + sizeof(uint64_t) + sizeof(dma_addr_t),
69962306a36Sopenharmony_ci		       GFP_KERNEL);
70062306a36Sopenharmony_ci	if (!buf)
70162306a36Sopenharmony_ci		goto out;
70262306a36Sopenharmony_ci
70362306a36Sopenharmony_ci	migrate.src = buf;
70462306a36Sopenharmony_ci	migrate.dst = migrate.src + npages;
70562306a36Sopenharmony_ci	migrate.fault_page = fault_page;
70662306a36Sopenharmony_ci	scratch = (dma_addr_t *)(migrate.dst + npages);
70762306a36Sopenharmony_ci
70862306a36Sopenharmony_ci	kfd_smi_event_migration_start(node, p->lead_thread->pid,
70962306a36Sopenharmony_ci				      start >> PAGE_SHIFT, end >> PAGE_SHIFT,
71062306a36Sopenharmony_ci				      node->id, 0, prange->prefetch_loc,
71162306a36Sopenharmony_ci				      prange->preferred_loc, trigger);
71262306a36Sopenharmony_ci
71362306a36Sopenharmony_ci	r = migrate_vma_setup(&migrate);
71462306a36Sopenharmony_ci	if (r) {
71562306a36Sopenharmony_ci		dev_err(adev->dev, "%s: vma setup fail %d range [0x%lx 0x%lx]\n",
71662306a36Sopenharmony_ci			__func__, r, prange->start, prange->last);
71762306a36Sopenharmony_ci		goto out_free;
71862306a36Sopenharmony_ci	}
71962306a36Sopenharmony_ci
72062306a36Sopenharmony_ci	cpages = migrate.cpages;
72162306a36Sopenharmony_ci	if (!cpages) {
72262306a36Sopenharmony_ci		pr_debug("failed collect migrate device pages [0x%lx 0x%lx]\n",
72362306a36Sopenharmony_ci			 prange->start, prange->last);
72462306a36Sopenharmony_ci		upages = svm_migrate_unsuccessful_pages(&migrate);
72562306a36Sopenharmony_ci		goto out_free;
72662306a36Sopenharmony_ci	}
72762306a36Sopenharmony_ci	if (cpages != npages)
72862306a36Sopenharmony_ci		pr_debug("partial migration, 0x%lx/0x%llx pages migrated\n",
72962306a36Sopenharmony_ci			 cpages, npages);
73062306a36Sopenharmony_ci	else
73162306a36Sopenharmony_ci		pr_debug("0x%lx pages migrated\n", cpages);
73262306a36Sopenharmony_ci
73362306a36Sopenharmony_ci	r = svm_migrate_copy_to_ram(adev, prange, &migrate, &mfence,
73462306a36Sopenharmony_ci				    scratch, npages);
73562306a36Sopenharmony_ci	migrate_vma_pages(&migrate);
73662306a36Sopenharmony_ci
73762306a36Sopenharmony_ci	upages = svm_migrate_unsuccessful_pages(&migrate);
73862306a36Sopenharmony_ci	pr_debug("unsuccessful/cpages/npages 0x%lx/0x%lx/0x%lx\n",
73962306a36Sopenharmony_ci		 upages, cpages, migrate.npages);
74062306a36Sopenharmony_ci
74162306a36Sopenharmony_ci	svm_migrate_copy_done(adev, mfence);
74262306a36Sopenharmony_ci	migrate_vma_finalize(&migrate);
74362306a36Sopenharmony_ci
74462306a36Sopenharmony_ci	kfd_smi_event_migration_end(node, p->lead_thread->pid,
74562306a36Sopenharmony_ci				    start >> PAGE_SHIFT, end >> PAGE_SHIFT,
74662306a36Sopenharmony_ci				    node->id, 0, trigger);
74762306a36Sopenharmony_ci
74862306a36Sopenharmony_ci	svm_range_dma_unmap(adev->dev, scratch, 0, npages);
74962306a36Sopenharmony_ci
75062306a36Sopenharmony_ciout_free:
75162306a36Sopenharmony_ci	kvfree(buf);
75262306a36Sopenharmony_ciout:
75362306a36Sopenharmony_ci	if (!r && cpages) {
75462306a36Sopenharmony_ci		pdd = svm_range_get_pdd_by_node(prange, node);
75562306a36Sopenharmony_ci		if (pdd)
75662306a36Sopenharmony_ci			WRITE_ONCE(pdd->page_out, pdd->page_out + cpages);
75762306a36Sopenharmony_ci	}
75862306a36Sopenharmony_ci	return r ? r : upages;
75962306a36Sopenharmony_ci}
76062306a36Sopenharmony_ci
76162306a36Sopenharmony_ci/**
76262306a36Sopenharmony_ci * svm_migrate_vram_to_ram - migrate svm range from device to system
76362306a36Sopenharmony_ci * @prange: range structure
76462306a36Sopenharmony_ci * @mm: process mm, use current->mm if NULL
76562306a36Sopenharmony_ci * @trigger: reason of migration
76662306a36Sopenharmony_ci * @fault_page: is from vmf->page, svm_migrate_to_ram(), this is CPU page fault callback
76762306a36Sopenharmony_ci *
76862306a36Sopenharmony_ci * Context: Process context, caller hold mmap read lock, prange->migrate_mutex
76962306a36Sopenharmony_ci *
77062306a36Sopenharmony_ci * Return:
77162306a36Sopenharmony_ci * 0 - OK, otherwise error code
77262306a36Sopenharmony_ci */
77362306a36Sopenharmony_ciint svm_migrate_vram_to_ram(struct svm_range *prange, struct mm_struct *mm,
77462306a36Sopenharmony_ci			    uint32_t trigger, struct page *fault_page)
77562306a36Sopenharmony_ci{
77662306a36Sopenharmony_ci	struct kfd_node *node;
77762306a36Sopenharmony_ci	struct vm_area_struct *vma;
77862306a36Sopenharmony_ci	unsigned long addr;
77962306a36Sopenharmony_ci	unsigned long start;
78062306a36Sopenharmony_ci	unsigned long end;
78162306a36Sopenharmony_ci	unsigned long upages = 0;
78262306a36Sopenharmony_ci	long r = 0;
78362306a36Sopenharmony_ci
78462306a36Sopenharmony_ci	if (!prange->actual_loc) {
78562306a36Sopenharmony_ci		pr_debug("[0x%lx 0x%lx] already migrated to ram\n",
78662306a36Sopenharmony_ci			 prange->start, prange->last);
78762306a36Sopenharmony_ci		return 0;
78862306a36Sopenharmony_ci	}
78962306a36Sopenharmony_ci
79062306a36Sopenharmony_ci	node = svm_range_get_node_by_id(prange, prange->actual_loc);
79162306a36Sopenharmony_ci	if (!node) {
79262306a36Sopenharmony_ci		pr_debug("failed to get kfd node by id 0x%x\n", prange->actual_loc);
79362306a36Sopenharmony_ci		return -ENODEV;
79462306a36Sopenharmony_ci	}
79562306a36Sopenharmony_ci	pr_debug("svms 0x%p prange 0x%p [0x%lx 0x%lx] from gpu 0x%x to ram\n",
79662306a36Sopenharmony_ci		 prange->svms, prange, prange->start, prange->last,
79762306a36Sopenharmony_ci		 prange->actual_loc);
79862306a36Sopenharmony_ci
79962306a36Sopenharmony_ci	start = prange->start << PAGE_SHIFT;
80062306a36Sopenharmony_ci	end = (prange->last + 1) << PAGE_SHIFT;
80162306a36Sopenharmony_ci
80262306a36Sopenharmony_ci	for (addr = start; addr < end;) {
80362306a36Sopenharmony_ci		unsigned long next;
80462306a36Sopenharmony_ci
80562306a36Sopenharmony_ci		vma = vma_lookup(mm, addr);
80662306a36Sopenharmony_ci		if (!vma) {
80762306a36Sopenharmony_ci			pr_debug("failed to find vma for prange %p\n", prange);
80862306a36Sopenharmony_ci			r = -EFAULT;
80962306a36Sopenharmony_ci			break;
81062306a36Sopenharmony_ci		}
81162306a36Sopenharmony_ci
81262306a36Sopenharmony_ci		next = min(vma->vm_end, end);
81362306a36Sopenharmony_ci		r = svm_migrate_vma_to_ram(node, prange, vma, addr, next, trigger,
81462306a36Sopenharmony_ci			fault_page);
81562306a36Sopenharmony_ci		if (r < 0) {
81662306a36Sopenharmony_ci			pr_debug("failed %ld to migrate prange %p\n", r, prange);
81762306a36Sopenharmony_ci			break;
81862306a36Sopenharmony_ci		} else {
81962306a36Sopenharmony_ci			upages += r;
82062306a36Sopenharmony_ci		}
82162306a36Sopenharmony_ci		addr = next;
82262306a36Sopenharmony_ci	}
82362306a36Sopenharmony_ci
82462306a36Sopenharmony_ci	if (r >= 0 && !upages) {
82562306a36Sopenharmony_ci		svm_range_vram_node_free(prange);
82662306a36Sopenharmony_ci		prange->actual_loc = 0;
82762306a36Sopenharmony_ci	}
82862306a36Sopenharmony_ci
82962306a36Sopenharmony_ci	return r < 0 ? r : 0;
83062306a36Sopenharmony_ci}
83162306a36Sopenharmony_ci
83262306a36Sopenharmony_ci/**
83362306a36Sopenharmony_ci * svm_migrate_vram_to_vram - migrate svm range from device to device
83462306a36Sopenharmony_ci * @prange: range structure
83562306a36Sopenharmony_ci * @best_loc: the device to migrate to
83662306a36Sopenharmony_ci * @mm: process mm, use current->mm if NULL
83762306a36Sopenharmony_ci * @trigger: reason of migration
83862306a36Sopenharmony_ci *
83962306a36Sopenharmony_ci * Context: Process context, caller hold mmap read lock, svms lock, prange lock
84062306a36Sopenharmony_ci *
84162306a36Sopenharmony_ci * Return:
84262306a36Sopenharmony_ci * 0 - OK, otherwise error code
84362306a36Sopenharmony_ci */
84462306a36Sopenharmony_cistatic int
84562306a36Sopenharmony_cisvm_migrate_vram_to_vram(struct svm_range *prange, uint32_t best_loc,
84662306a36Sopenharmony_ci			 struct mm_struct *mm, uint32_t trigger)
84762306a36Sopenharmony_ci{
84862306a36Sopenharmony_ci	int r, retries = 3;
84962306a36Sopenharmony_ci
85062306a36Sopenharmony_ci	/*
85162306a36Sopenharmony_ci	 * TODO: for both devices with PCIe large bar or on same xgmi hive, skip
85262306a36Sopenharmony_ci	 * system memory as migration bridge
85362306a36Sopenharmony_ci	 */
85462306a36Sopenharmony_ci
85562306a36Sopenharmony_ci	pr_debug("from gpu 0x%x to gpu 0x%x\n", prange->actual_loc, best_loc);
85662306a36Sopenharmony_ci
85762306a36Sopenharmony_ci	do {
85862306a36Sopenharmony_ci		r = svm_migrate_vram_to_ram(prange, mm, trigger, NULL);
85962306a36Sopenharmony_ci		if (r)
86062306a36Sopenharmony_ci			return r;
86162306a36Sopenharmony_ci	} while (prange->actual_loc && --retries);
86262306a36Sopenharmony_ci
86362306a36Sopenharmony_ci	if (prange->actual_loc)
86462306a36Sopenharmony_ci		return -EDEADLK;
86562306a36Sopenharmony_ci
86662306a36Sopenharmony_ci	return svm_migrate_ram_to_vram(prange, best_loc, mm, trigger);
86762306a36Sopenharmony_ci}
86862306a36Sopenharmony_ci
86962306a36Sopenharmony_ciint
87062306a36Sopenharmony_cisvm_migrate_to_vram(struct svm_range *prange, uint32_t best_loc,
87162306a36Sopenharmony_ci		    struct mm_struct *mm, uint32_t trigger)
87262306a36Sopenharmony_ci{
87362306a36Sopenharmony_ci	if  (!prange->actual_loc)
87462306a36Sopenharmony_ci		return svm_migrate_ram_to_vram(prange, best_loc, mm, trigger);
87562306a36Sopenharmony_ci	else
87662306a36Sopenharmony_ci		return svm_migrate_vram_to_vram(prange, best_loc, mm, trigger);
87762306a36Sopenharmony_ci
87862306a36Sopenharmony_ci}
87962306a36Sopenharmony_ci
88062306a36Sopenharmony_ci/**
88162306a36Sopenharmony_ci * svm_migrate_to_ram - CPU page fault handler
88262306a36Sopenharmony_ci * @vmf: CPU vm fault vma, address
88362306a36Sopenharmony_ci *
88462306a36Sopenharmony_ci * Context: vm fault handler, caller holds the mmap read lock
88562306a36Sopenharmony_ci *
88662306a36Sopenharmony_ci * Return:
88762306a36Sopenharmony_ci * 0 - OK
88862306a36Sopenharmony_ci * VM_FAULT_SIGBUS - notice application to have SIGBUS page fault
88962306a36Sopenharmony_ci */
89062306a36Sopenharmony_cistatic vm_fault_t svm_migrate_to_ram(struct vm_fault *vmf)
89162306a36Sopenharmony_ci{
89262306a36Sopenharmony_ci	unsigned long addr = vmf->address;
89362306a36Sopenharmony_ci	struct svm_range_bo *svm_bo;
89462306a36Sopenharmony_ci	enum svm_work_list_ops op;
89562306a36Sopenharmony_ci	struct svm_range *parent;
89662306a36Sopenharmony_ci	struct svm_range *prange;
89762306a36Sopenharmony_ci	struct kfd_process *p;
89862306a36Sopenharmony_ci	struct mm_struct *mm;
89962306a36Sopenharmony_ci	int r = 0;
90062306a36Sopenharmony_ci
90162306a36Sopenharmony_ci	svm_bo = vmf->page->zone_device_data;
90262306a36Sopenharmony_ci	if (!svm_bo) {
90362306a36Sopenharmony_ci		pr_debug("failed get device page at addr 0x%lx\n", addr);
90462306a36Sopenharmony_ci		return VM_FAULT_SIGBUS;
90562306a36Sopenharmony_ci	}
90662306a36Sopenharmony_ci	if (!mmget_not_zero(svm_bo->eviction_fence->mm)) {
90762306a36Sopenharmony_ci		pr_debug("addr 0x%lx of process mm is destroyed\n", addr);
90862306a36Sopenharmony_ci		return VM_FAULT_SIGBUS;
90962306a36Sopenharmony_ci	}
91062306a36Sopenharmony_ci
91162306a36Sopenharmony_ci	mm = svm_bo->eviction_fence->mm;
91262306a36Sopenharmony_ci	if (mm != vmf->vma->vm_mm)
91362306a36Sopenharmony_ci		pr_debug("addr 0x%lx is COW mapping in child process\n", addr);
91462306a36Sopenharmony_ci
91562306a36Sopenharmony_ci	p = kfd_lookup_process_by_mm(mm);
91662306a36Sopenharmony_ci	if (!p) {
91762306a36Sopenharmony_ci		pr_debug("failed find process at fault address 0x%lx\n", addr);
91862306a36Sopenharmony_ci		r = VM_FAULT_SIGBUS;
91962306a36Sopenharmony_ci		goto out_mmput;
92062306a36Sopenharmony_ci	}
92162306a36Sopenharmony_ci	if (READ_ONCE(p->svms.faulting_task) == current) {
92262306a36Sopenharmony_ci		pr_debug("skipping ram migration\n");
92362306a36Sopenharmony_ci		r = 0;
92462306a36Sopenharmony_ci		goto out_unref_process;
92562306a36Sopenharmony_ci	}
92662306a36Sopenharmony_ci
92762306a36Sopenharmony_ci	pr_debug("CPU page fault svms 0x%p address 0x%lx\n", &p->svms, addr);
92862306a36Sopenharmony_ci	addr >>= PAGE_SHIFT;
92962306a36Sopenharmony_ci
93062306a36Sopenharmony_ci	mutex_lock(&p->svms.lock);
93162306a36Sopenharmony_ci
93262306a36Sopenharmony_ci	prange = svm_range_from_addr(&p->svms, addr, &parent);
93362306a36Sopenharmony_ci	if (!prange) {
93462306a36Sopenharmony_ci		pr_debug("failed get range svms 0x%p addr 0x%lx\n", &p->svms, addr);
93562306a36Sopenharmony_ci		r = -EFAULT;
93662306a36Sopenharmony_ci		goto out_unlock_svms;
93762306a36Sopenharmony_ci	}
93862306a36Sopenharmony_ci
93962306a36Sopenharmony_ci	mutex_lock(&parent->migrate_mutex);
94062306a36Sopenharmony_ci	if (prange != parent)
94162306a36Sopenharmony_ci		mutex_lock_nested(&prange->migrate_mutex, 1);
94262306a36Sopenharmony_ci
94362306a36Sopenharmony_ci	if (!prange->actual_loc)
94462306a36Sopenharmony_ci		goto out_unlock_prange;
94562306a36Sopenharmony_ci
94662306a36Sopenharmony_ci	svm_range_lock(parent);
94762306a36Sopenharmony_ci	if (prange != parent)
94862306a36Sopenharmony_ci		mutex_lock_nested(&prange->lock, 1);
94962306a36Sopenharmony_ci	r = svm_range_split_by_granularity(p, mm, addr, parent, prange);
95062306a36Sopenharmony_ci	if (prange != parent)
95162306a36Sopenharmony_ci		mutex_unlock(&prange->lock);
95262306a36Sopenharmony_ci	svm_range_unlock(parent);
95362306a36Sopenharmony_ci	if (r) {
95462306a36Sopenharmony_ci		pr_debug("failed %d to split range by granularity\n", r);
95562306a36Sopenharmony_ci		goto out_unlock_prange;
95662306a36Sopenharmony_ci	}
95762306a36Sopenharmony_ci
95862306a36Sopenharmony_ci	r = svm_migrate_vram_to_ram(prange, vmf->vma->vm_mm,
95962306a36Sopenharmony_ci				    KFD_MIGRATE_TRIGGER_PAGEFAULT_CPU,
96062306a36Sopenharmony_ci				    vmf->page);
96162306a36Sopenharmony_ci	if (r)
96262306a36Sopenharmony_ci		pr_debug("failed %d migrate svms 0x%p range 0x%p [0x%lx 0x%lx]\n",
96362306a36Sopenharmony_ci			 r, prange->svms, prange, prange->start, prange->last);
96462306a36Sopenharmony_ci
96562306a36Sopenharmony_ci	/* xnack on, update mapping on GPUs with ACCESS_IN_PLACE */
96662306a36Sopenharmony_ci	if (p->xnack_enabled && parent == prange)
96762306a36Sopenharmony_ci		op = SVM_OP_UPDATE_RANGE_NOTIFIER_AND_MAP;
96862306a36Sopenharmony_ci	else
96962306a36Sopenharmony_ci		op = SVM_OP_UPDATE_RANGE_NOTIFIER;
97062306a36Sopenharmony_ci	svm_range_add_list_work(&p->svms, parent, mm, op);
97162306a36Sopenharmony_ci	schedule_deferred_list_work(&p->svms);
97262306a36Sopenharmony_ci
97362306a36Sopenharmony_ciout_unlock_prange:
97462306a36Sopenharmony_ci	if (prange != parent)
97562306a36Sopenharmony_ci		mutex_unlock(&prange->migrate_mutex);
97662306a36Sopenharmony_ci	mutex_unlock(&parent->migrate_mutex);
97762306a36Sopenharmony_ciout_unlock_svms:
97862306a36Sopenharmony_ci	mutex_unlock(&p->svms.lock);
97962306a36Sopenharmony_ciout_unref_process:
98062306a36Sopenharmony_ci	pr_debug("CPU fault svms 0x%p address 0x%lx done\n", &p->svms, addr);
98162306a36Sopenharmony_ci	kfd_unref_process(p);
98262306a36Sopenharmony_ciout_mmput:
98362306a36Sopenharmony_ci	mmput(mm);
98462306a36Sopenharmony_ci	return r ? VM_FAULT_SIGBUS : 0;
98562306a36Sopenharmony_ci}
98662306a36Sopenharmony_ci
98762306a36Sopenharmony_cistatic const struct dev_pagemap_ops svm_migrate_pgmap_ops = {
98862306a36Sopenharmony_ci	.page_free		= svm_migrate_page_free,
98962306a36Sopenharmony_ci	.migrate_to_ram		= svm_migrate_to_ram,
99062306a36Sopenharmony_ci};
99162306a36Sopenharmony_ci
/*
 * System memory consumed by the struct page entries that describe @size
 * bytes of VRAM: one struct page per whole PAGE_SIZE of VRAM.
 */
#define SVM_HMM_PAGE_STRUCT_SIZE(size) \
	(((size) / PAGE_SIZE) * sizeof(struct page))
99462306a36Sopenharmony_ci
99562306a36Sopenharmony_ciint kgd2kfd_init_zone_device(struct amdgpu_device *adev)
99662306a36Sopenharmony_ci{
99762306a36Sopenharmony_ci	struct amdgpu_kfd_dev *kfddev = &adev->kfd;
99862306a36Sopenharmony_ci	struct dev_pagemap *pgmap;
99962306a36Sopenharmony_ci	struct resource *res = NULL;
100062306a36Sopenharmony_ci	unsigned long size;
100162306a36Sopenharmony_ci	void *r;
100262306a36Sopenharmony_ci
100362306a36Sopenharmony_ci	/* Page migration works on gfx9 or newer */
100462306a36Sopenharmony_ci	if (adev->ip_versions[GC_HWIP][0] < IP_VERSION(9, 0, 1))
100562306a36Sopenharmony_ci		return -EINVAL;
100662306a36Sopenharmony_ci
100762306a36Sopenharmony_ci	if (adev->gmc.is_app_apu)
100862306a36Sopenharmony_ci		return 0;
100962306a36Sopenharmony_ci
101062306a36Sopenharmony_ci	pgmap = &kfddev->pgmap;
101162306a36Sopenharmony_ci	memset(pgmap, 0, sizeof(*pgmap));
101262306a36Sopenharmony_ci
101362306a36Sopenharmony_ci	/* TODO: register all vram to HMM for now.
101462306a36Sopenharmony_ci	 * should remove reserved size
101562306a36Sopenharmony_ci	 */
101662306a36Sopenharmony_ci	size = ALIGN(adev->gmc.real_vram_size, 2ULL << 20);
101762306a36Sopenharmony_ci	if (adev->gmc.xgmi.connected_to_cpu) {
101862306a36Sopenharmony_ci		pgmap->range.start = adev->gmc.aper_base;
101962306a36Sopenharmony_ci		pgmap->range.end = adev->gmc.aper_base + adev->gmc.aper_size - 1;
102062306a36Sopenharmony_ci		pgmap->type = MEMORY_DEVICE_COHERENT;
102162306a36Sopenharmony_ci	} else {
102262306a36Sopenharmony_ci		res = devm_request_free_mem_region(adev->dev, &iomem_resource, size);
102362306a36Sopenharmony_ci		if (IS_ERR(res))
102462306a36Sopenharmony_ci			return PTR_ERR(res);
102562306a36Sopenharmony_ci		pgmap->range.start = res->start;
102662306a36Sopenharmony_ci		pgmap->range.end = res->end;
102762306a36Sopenharmony_ci		pgmap->type = MEMORY_DEVICE_PRIVATE;
102862306a36Sopenharmony_ci	}
102962306a36Sopenharmony_ci
103062306a36Sopenharmony_ci	pgmap->nr_range = 1;
103162306a36Sopenharmony_ci	pgmap->ops = &svm_migrate_pgmap_ops;
103262306a36Sopenharmony_ci	pgmap->owner = SVM_ADEV_PGMAP_OWNER(adev);
103362306a36Sopenharmony_ci	pgmap->flags = 0;
103462306a36Sopenharmony_ci	/* Device manager releases device-specific resources, memory region and
103562306a36Sopenharmony_ci	 * pgmap when driver disconnects from device.
103662306a36Sopenharmony_ci	 */
103762306a36Sopenharmony_ci	r = devm_memremap_pages(adev->dev, pgmap);
103862306a36Sopenharmony_ci	if (IS_ERR(r)) {
103962306a36Sopenharmony_ci		pr_err("failed to register HMM device memory\n");
104062306a36Sopenharmony_ci		if (pgmap->type == MEMORY_DEVICE_PRIVATE)
104162306a36Sopenharmony_ci			devm_release_mem_region(adev->dev, res->start, resource_size(res));
104262306a36Sopenharmony_ci		/* Disable SVM support capability */
104362306a36Sopenharmony_ci		pgmap->type = 0;
104462306a36Sopenharmony_ci		return PTR_ERR(r);
104562306a36Sopenharmony_ci	}
104662306a36Sopenharmony_ci
104762306a36Sopenharmony_ci	pr_debug("reserve %ldMB system memory for VRAM pages struct\n",
104862306a36Sopenharmony_ci		 SVM_HMM_PAGE_STRUCT_SIZE(size) >> 20);
104962306a36Sopenharmony_ci
105062306a36Sopenharmony_ci	amdgpu_amdkfd_reserve_system_mem(SVM_HMM_PAGE_STRUCT_SIZE(size));
105162306a36Sopenharmony_ci
105262306a36Sopenharmony_ci	pr_info("HMM registered %ldMB device memory\n", size >> 20);
105362306a36Sopenharmony_ci
105462306a36Sopenharmony_ci	return 0;
105562306a36Sopenharmony_ci}
1056