162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * DAMON Primitives for The Physical Address Space 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Author: SeongJae Park <sj@kernel.org> 662306a36Sopenharmony_ci */ 762306a36Sopenharmony_ci 862306a36Sopenharmony_ci#define pr_fmt(fmt) "damon-pa: " fmt 962306a36Sopenharmony_ci 1062306a36Sopenharmony_ci#include <linux/mmu_notifier.h> 1162306a36Sopenharmony_ci#include <linux/page_idle.h> 1262306a36Sopenharmony_ci#include <linux/pagemap.h> 1362306a36Sopenharmony_ci#include <linux/rmap.h> 1462306a36Sopenharmony_ci#include <linux/swap.h> 1562306a36Sopenharmony_ci 1662306a36Sopenharmony_ci#include "../internal.h" 1762306a36Sopenharmony_ci#include "ops-common.h" 1862306a36Sopenharmony_ci 1962306a36Sopenharmony_cistatic bool __damon_pa_mkold(struct folio *folio, struct vm_area_struct *vma, 2062306a36Sopenharmony_ci unsigned long addr, void *arg) 2162306a36Sopenharmony_ci{ 2262306a36Sopenharmony_ci DEFINE_FOLIO_VMA_WALK(pvmw, folio, vma, addr, 0); 2362306a36Sopenharmony_ci 2462306a36Sopenharmony_ci while (page_vma_mapped_walk(&pvmw)) { 2562306a36Sopenharmony_ci addr = pvmw.address; 2662306a36Sopenharmony_ci if (pvmw.pte) 2762306a36Sopenharmony_ci damon_ptep_mkold(pvmw.pte, vma, addr); 2862306a36Sopenharmony_ci else 2962306a36Sopenharmony_ci damon_pmdp_mkold(pvmw.pmd, vma, addr); 3062306a36Sopenharmony_ci } 3162306a36Sopenharmony_ci return true; 3262306a36Sopenharmony_ci} 3362306a36Sopenharmony_ci 3462306a36Sopenharmony_cistatic void damon_pa_mkold(unsigned long paddr) 3562306a36Sopenharmony_ci{ 3662306a36Sopenharmony_ci struct folio *folio = damon_get_folio(PHYS_PFN(paddr)); 3762306a36Sopenharmony_ci struct rmap_walk_control rwc = { 3862306a36Sopenharmony_ci .rmap_one = __damon_pa_mkold, 3962306a36Sopenharmony_ci .anon_lock = folio_lock_anon_vma_read, 4062306a36Sopenharmony_ci }; 4162306a36Sopenharmony_ci bool need_lock; 4262306a36Sopenharmony_ci 4362306a36Sopenharmony_ci if (!folio) 4462306a36Sopenharmony_ci return; 4562306a36Sopenharmony_ci 4662306a36Sopenharmony_ci if (!folio_mapped(folio) || !folio_raw_mapping(folio)) { 4762306a36Sopenharmony_ci folio_set_idle(folio); 4862306a36Sopenharmony_ci goto out; 4962306a36Sopenharmony_ci } 5062306a36Sopenharmony_ci 5162306a36Sopenharmony_ci need_lock = !folio_test_anon(folio) || folio_test_ksm(folio); 5262306a36Sopenharmony_ci if (need_lock && !folio_trylock(folio)) 5362306a36Sopenharmony_ci goto out; 5462306a36Sopenharmony_ci 5562306a36Sopenharmony_ci rmap_walk(folio, &rwc); 5662306a36Sopenharmony_ci 5762306a36Sopenharmony_ci if (need_lock) 5862306a36Sopenharmony_ci folio_unlock(folio); 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_ciout: 6162306a36Sopenharmony_ci folio_put(folio); 6262306a36Sopenharmony_ci} 6362306a36Sopenharmony_ci 6462306a36Sopenharmony_cistatic void __damon_pa_prepare_access_check(struct damon_region *r) 6562306a36Sopenharmony_ci{ 6662306a36Sopenharmony_ci r->sampling_addr = damon_rand(r->ar.start, r->ar.end); 6762306a36Sopenharmony_ci 6862306a36Sopenharmony_ci damon_pa_mkold(r->sampling_addr); 6962306a36Sopenharmony_ci} 7062306a36Sopenharmony_ci 7162306a36Sopenharmony_cistatic void damon_pa_prepare_access_checks(struct damon_ctx *ctx) 7262306a36Sopenharmony_ci{ 7362306a36Sopenharmony_ci struct damon_target *t; 7462306a36Sopenharmony_ci struct damon_region *r; 7562306a36Sopenharmony_ci 7662306a36Sopenharmony_ci damon_for_each_target(t, ctx) { 7762306a36Sopenharmony_ci damon_for_each_region(r, t) 7862306a36Sopenharmony_ci __damon_pa_prepare_access_check(r); 7962306a36Sopenharmony_ci } 8062306a36Sopenharmony_ci} 8162306a36Sopenharmony_ci 8262306a36Sopenharmony_cistatic bool __damon_pa_young(struct folio *folio, struct vm_area_struct *vma, 8362306a36Sopenharmony_ci unsigned long addr, void *arg) 8462306a36Sopenharmony_ci{ 8562306a36Sopenharmony_ci bool *accessed = arg; 8662306a36Sopenharmony_ci DEFINE_FOLIO_VMA_WALK(pvmw, folio, vma, addr, 0); 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_ci *accessed = false; 8962306a36Sopenharmony_ci while (page_vma_mapped_walk(&pvmw)) { 9062306a36Sopenharmony_ci addr = pvmw.address; 9162306a36Sopenharmony_ci if (pvmw.pte) { 9262306a36Sopenharmony_ci *accessed = pte_young(ptep_get(pvmw.pte)) || 9362306a36Sopenharmony_ci !folio_test_idle(folio) || 9462306a36Sopenharmony_ci mmu_notifier_test_young(vma->vm_mm, addr); 9562306a36Sopenharmony_ci } else { 9662306a36Sopenharmony_ci#ifdef CONFIG_TRANSPARENT_HUGEPAGE 9762306a36Sopenharmony_ci *accessed = pmd_young(pmdp_get(pvmw.pmd)) || 9862306a36Sopenharmony_ci !folio_test_idle(folio) || 9962306a36Sopenharmony_ci mmu_notifier_test_young(vma->vm_mm, addr); 10062306a36Sopenharmony_ci#else 10162306a36Sopenharmony_ci WARN_ON_ONCE(1); 10262306a36Sopenharmony_ci#endif /* CONFIG_TRANSPARENT_HUGEPAGE */ 10362306a36Sopenharmony_ci } 10462306a36Sopenharmony_ci if (*accessed) { 10562306a36Sopenharmony_ci page_vma_mapped_walk_done(&pvmw); 10662306a36Sopenharmony_ci break; 10762306a36Sopenharmony_ci } 10862306a36Sopenharmony_ci } 10962306a36Sopenharmony_ci 11062306a36Sopenharmony_ci /* If accessed, stop walking */ 11162306a36Sopenharmony_ci return *accessed == false; 11262306a36Sopenharmony_ci} 11362306a36Sopenharmony_ci 11462306a36Sopenharmony_cistatic bool damon_pa_young(unsigned long paddr, unsigned long *folio_sz) 11562306a36Sopenharmony_ci{ 11662306a36Sopenharmony_ci struct folio *folio = damon_get_folio(PHYS_PFN(paddr)); 11762306a36Sopenharmony_ci bool accessed = false; 11862306a36Sopenharmony_ci struct rmap_walk_control rwc = { 11962306a36Sopenharmony_ci .arg = &accessed, 12062306a36Sopenharmony_ci .rmap_one = __damon_pa_young, 12162306a36Sopenharmony_ci .anon_lock = folio_lock_anon_vma_read, 12262306a36Sopenharmony_ci }; 12362306a36Sopenharmony_ci bool need_lock; 12462306a36Sopenharmony_ci 12562306a36Sopenharmony_ci if (!folio) 12662306a36Sopenharmony_ci return false; 12762306a36Sopenharmony_ci 12862306a36Sopenharmony_ci if (!folio_mapped(folio) || !folio_raw_mapping(folio)) { 12962306a36Sopenharmony_ci if (folio_test_idle(folio)) 13062306a36Sopenharmony_ci accessed = false; 13162306a36Sopenharmony_ci else 13262306a36Sopenharmony_ci accessed = true; 13362306a36Sopenharmony_ci goto out; 13462306a36Sopenharmony_ci } 13562306a36Sopenharmony_ci 13662306a36Sopenharmony_ci need_lock = !folio_test_anon(folio) || folio_test_ksm(folio); 13762306a36Sopenharmony_ci if (need_lock && !folio_trylock(folio)) 13862306a36Sopenharmony_ci goto out; 13962306a36Sopenharmony_ci 14062306a36Sopenharmony_ci rmap_walk(folio, &rwc); 14162306a36Sopenharmony_ci 14262306a36Sopenharmony_ci if (need_lock) 14362306a36Sopenharmony_ci folio_unlock(folio); 14462306a36Sopenharmony_ci 14562306a36Sopenharmony_ciout: 14662306a36Sopenharmony_ci *folio_sz = folio_size(folio); 14762306a36Sopenharmony_ci folio_put(folio); 14862306a36Sopenharmony_ci return accessed; 14962306a36Sopenharmony_ci} 15062306a36Sopenharmony_ci 15162306a36Sopenharmony_cistatic void __damon_pa_check_access(struct damon_region *r) 15262306a36Sopenharmony_ci{ 15362306a36Sopenharmony_ci static unsigned long last_addr; 15462306a36Sopenharmony_ci static unsigned long last_folio_sz = PAGE_SIZE; 15562306a36Sopenharmony_ci static bool last_accessed; 15662306a36Sopenharmony_ci 15762306a36Sopenharmony_ci /* If the region is in the last checked page, reuse the result */ 15862306a36Sopenharmony_ci if (ALIGN_DOWN(last_addr, last_folio_sz) == 15962306a36Sopenharmony_ci ALIGN_DOWN(r->sampling_addr, last_folio_sz)) { 16062306a36Sopenharmony_ci if (last_accessed) 16162306a36Sopenharmony_ci r->nr_accesses++; 16262306a36Sopenharmony_ci return; 16362306a36Sopenharmony_ci } 16462306a36Sopenharmony_ci 16562306a36Sopenharmony_ci last_accessed = damon_pa_young(r->sampling_addr, &last_folio_sz); 16662306a36Sopenharmony_ci if (last_accessed) 16762306a36Sopenharmony_ci r->nr_accesses++; 16862306a36Sopenharmony_ci 16962306a36Sopenharmony_ci last_addr = r->sampling_addr; 17062306a36Sopenharmony_ci} 17162306a36Sopenharmony_ci 17262306a36Sopenharmony_cistatic unsigned int damon_pa_check_accesses(struct damon_ctx *ctx) 17362306a36Sopenharmony_ci{ 17462306a36Sopenharmony_ci struct damon_target *t; 17562306a36Sopenharmony_ci struct damon_region *r; 17662306a36Sopenharmony_ci unsigned int max_nr_accesses = 0; 17762306a36Sopenharmony_ci 17862306a36Sopenharmony_ci damon_for_each_target(t, ctx) { 17962306a36Sopenharmony_ci damon_for_each_region(r, t) { 18062306a36Sopenharmony_ci __damon_pa_check_access(r); 18162306a36Sopenharmony_ci max_nr_accesses = max(r->nr_accesses, max_nr_accesses); 18262306a36Sopenharmony_ci } 18362306a36Sopenharmony_ci } 18462306a36Sopenharmony_ci 18562306a36Sopenharmony_ci return max_nr_accesses; 18662306a36Sopenharmony_ci} 18762306a36Sopenharmony_ci 18862306a36Sopenharmony_cistatic bool __damos_pa_filter_out(struct damos_filter *filter, 18962306a36Sopenharmony_ci struct folio *folio) 19062306a36Sopenharmony_ci{ 19162306a36Sopenharmony_ci bool matched = false; 19262306a36Sopenharmony_ci struct mem_cgroup *memcg; 19362306a36Sopenharmony_ci 19462306a36Sopenharmony_ci switch (filter->type) { 19562306a36Sopenharmony_ci case DAMOS_FILTER_TYPE_ANON: 19662306a36Sopenharmony_ci matched = folio_test_anon(folio); 19762306a36Sopenharmony_ci break; 19862306a36Sopenharmony_ci case DAMOS_FILTER_TYPE_MEMCG: 19962306a36Sopenharmony_ci rcu_read_lock(); 20062306a36Sopenharmony_ci memcg = folio_memcg_check(folio); 20162306a36Sopenharmony_ci if (!memcg) 20262306a36Sopenharmony_ci matched = false; 20362306a36Sopenharmony_ci else 20462306a36Sopenharmony_ci matched = filter->memcg_id == mem_cgroup_id(memcg); 20562306a36Sopenharmony_ci rcu_read_unlock(); 20662306a36Sopenharmony_ci break; 20762306a36Sopenharmony_ci default: 20862306a36Sopenharmony_ci break; 20962306a36Sopenharmony_ci } 21062306a36Sopenharmony_ci 21162306a36Sopenharmony_ci return matched == filter->matching; 21262306a36Sopenharmony_ci} 21362306a36Sopenharmony_ci 21462306a36Sopenharmony_ci/* 21562306a36Sopenharmony_ci * damos_pa_filter_out - Return true if the page should be filtered out. 21662306a36Sopenharmony_ci */ 21762306a36Sopenharmony_cistatic bool damos_pa_filter_out(struct damos *scheme, struct folio *folio) 21862306a36Sopenharmony_ci{ 21962306a36Sopenharmony_ci struct damos_filter *filter; 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ci damos_for_each_filter(filter, scheme) { 22262306a36Sopenharmony_ci if (__damos_pa_filter_out(filter, folio)) 22362306a36Sopenharmony_ci return true; 22462306a36Sopenharmony_ci } 22562306a36Sopenharmony_ci return false; 22662306a36Sopenharmony_ci} 22762306a36Sopenharmony_ci 22862306a36Sopenharmony_cistatic unsigned long damon_pa_pageout(struct damon_region *r, struct damos *s) 22962306a36Sopenharmony_ci{ 23062306a36Sopenharmony_ci unsigned long addr, applied; 23162306a36Sopenharmony_ci LIST_HEAD(folio_list); 23262306a36Sopenharmony_ci 23362306a36Sopenharmony_ci for (addr = r->ar.start; addr < r->ar.end; addr += PAGE_SIZE) { 23462306a36Sopenharmony_ci struct folio *folio = damon_get_folio(PHYS_PFN(addr)); 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci if (!folio) 23762306a36Sopenharmony_ci continue; 23862306a36Sopenharmony_ci 23962306a36Sopenharmony_ci if (damos_pa_filter_out(s, folio)) 24062306a36Sopenharmony_ci goto put_folio; 24162306a36Sopenharmony_ci 24262306a36Sopenharmony_ci folio_clear_referenced(folio); 24362306a36Sopenharmony_ci folio_test_clear_young(folio); 24462306a36Sopenharmony_ci if (!folio_isolate_lru(folio)) 24562306a36Sopenharmony_ci goto put_folio; 24662306a36Sopenharmony_ci if (folio_test_unevictable(folio)) 24762306a36Sopenharmony_ci folio_putback_lru(folio); 24862306a36Sopenharmony_ci else 24962306a36Sopenharmony_ci list_add(&folio->lru, &folio_list); 25062306a36Sopenharmony_ciput_folio: 25162306a36Sopenharmony_ci folio_put(folio); 25262306a36Sopenharmony_ci } 25362306a36Sopenharmony_ci applied = reclaim_pages(&folio_list); 25462306a36Sopenharmony_ci cond_resched(); 25562306a36Sopenharmony_ci return applied * PAGE_SIZE; 25662306a36Sopenharmony_ci} 25762306a36Sopenharmony_ci 25862306a36Sopenharmony_cistatic inline unsigned long damon_pa_mark_accessed_or_deactivate( 25962306a36Sopenharmony_ci struct damon_region *r, struct damos *s, bool mark_accessed) 26062306a36Sopenharmony_ci{ 26162306a36Sopenharmony_ci unsigned long addr, applied = 0; 26262306a36Sopenharmony_ci 26362306a36Sopenharmony_ci for (addr = r->ar.start; addr < r->ar.end; addr += PAGE_SIZE) { 26462306a36Sopenharmony_ci struct folio *folio = damon_get_folio(PHYS_PFN(addr)); 26562306a36Sopenharmony_ci 26662306a36Sopenharmony_ci if (!folio) 26762306a36Sopenharmony_ci continue; 26862306a36Sopenharmony_ci 26962306a36Sopenharmony_ci if (damos_pa_filter_out(s, folio)) 27062306a36Sopenharmony_ci goto put_folio; 27162306a36Sopenharmony_ci 27262306a36Sopenharmony_ci if (mark_accessed) 27362306a36Sopenharmony_ci folio_mark_accessed(folio); 27462306a36Sopenharmony_ci else 27562306a36Sopenharmony_ci folio_deactivate(folio); 27662306a36Sopenharmony_ci applied += folio_nr_pages(folio); 27762306a36Sopenharmony_ciput_folio: 27862306a36Sopenharmony_ci folio_put(folio); 27962306a36Sopenharmony_ci } 28062306a36Sopenharmony_ci return applied * PAGE_SIZE; 28162306a36Sopenharmony_ci} 28262306a36Sopenharmony_ci 28362306a36Sopenharmony_cistatic unsigned long damon_pa_mark_accessed(struct damon_region *r, 28462306a36Sopenharmony_ci struct damos *s) 28562306a36Sopenharmony_ci{ 28662306a36Sopenharmony_ci return damon_pa_mark_accessed_or_deactivate(r, s, true); 28762306a36Sopenharmony_ci} 28862306a36Sopenharmony_ci 28962306a36Sopenharmony_cistatic unsigned long damon_pa_deactivate_pages(struct damon_region *r, 29062306a36Sopenharmony_ci struct damos *s) 29162306a36Sopenharmony_ci{ 29262306a36Sopenharmony_ci return damon_pa_mark_accessed_or_deactivate(r, s, false); 29362306a36Sopenharmony_ci} 29462306a36Sopenharmony_ci 29562306a36Sopenharmony_cistatic unsigned long damon_pa_apply_scheme(struct damon_ctx *ctx, 29662306a36Sopenharmony_ci struct damon_target *t, struct damon_region *r, 29762306a36Sopenharmony_ci struct damos *scheme) 29862306a36Sopenharmony_ci{ 29962306a36Sopenharmony_ci switch (scheme->action) { 30062306a36Sopenharmony_ci case DAMOS_PAGEOUT: 30162306a36Sopenharmony_ci return damon_pa_pageout(r, scheme); 30262306a36Sopenharmony_ci case DAMOS_LRU_PRIO: 30362306a36Sopenharmony_ci return damon_pa_mark_accessed(r, scheme); 30462306a36Sopenharmony_ci case DAMOS_LRU_DEPRIO: 30562306a36Sopenharmony_ci return damon_pa_deactivate_pages(r, scheme); 30662306a36Sopenharmony_ci case DAMOS_STAT: 30762306a36Sopenharmony_ci break; 30862306a36Sopenharmony_ci default: 30962306a36Sopenharmony_ci /* DAMOS actions that not yet supported by 'paddr'. */ 31062306a36Sopenharmony_ci break; 31162306a36Sopenharmony_ci } 31262306a36Sopenharmony_ci return 0; 31362306a36Sopenharmony_ci} 31462306a36Sopenharmony_ci 31562306a36Sopenharmony_cistatic int damon_pa_scheme_score(struct damon_ctx *context, 31662306a36Sopenharmony_ci struct damon_target *t, struct damon_region *r, 31762306a36Sopenharmony_ci struct damos *scheme) 31862306a36Sopenharmony_ci{ 31962306a36Sopenharmony_ci switch (scheme->action) { 32062306a36Sopenharmony_ci case DAMOS_PAGEOUT: 32162306a36Sopenharmony_ci return damon_cold_score(context, r, scheme); 32262306a36Sopenharmony_ci case DAMOS_LRU_PRIO: 32362306a36Sopenharmony_ci return damon_hot_score(context, r, scheme); 32462306a36Sopenharmony_ci case DAMOS_LRU_DEPRIO: 32562306a36Sopenharmony_ci return damon_cold_score(context, r, scheme); 32662306a36Sopenharmony_ci default: 32762306a36Sopenharmony_ci break; 32862306a36Sopenharmony_ci } 32962306a36Sopenharmony_ci 33062306a36Sopenharmony_ci return DAMOS_MAX_SCORE; 33162306a36Sopenharmony_ci} 33262306a36Sopenharmony_ci 33362306a36Sopenharmony_cistatic int __init damon_pa_initcall(void) 33462306a36Sopenharmony_ci{ 33562306a36Sopenharmony_ci struct damon_operations ops = { 33662306a36Sopenharmony_ci .id = DAMON_OPS_PADDR, 33762306a36Sopenharmony_ci .init = NULL, 33862306a36Sopenharmony_ci .update = NULL, 33962306a36Sopenharmony_ci .prepare_access_checks = damon_pa_prepare_access_checks, 34062306a36Sopenharmony_ci .check_accesses = damon_pa_check_accesses, 34162306a36Sopenharmony_ci .reset_aggregated = NULL, 34262306a36Sopenharmony_ci .target_valid = NULL, 34362306a36Sopenharmony_ci .cleanup = NULL, 34462306a36Sopenharmony_ci .apply_scheme = damon_pa_apply_scheme, 34562306a36Sopenharmony_ci .get_scheme_score = damon_pa_scheme_score, 34662306a36Sopenharmony_ci }; 34762306a36Sopenharmony_ci 34862306a36Sopenharmony_ci return damon_register_ops(&ops); 34962306a36Sopenharmony_ci}; 35062306a36Sopenharmony_ci 35162306a36Sopenharmony_cisubsys_initcall(damon_pa_initcall); 352