18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 28c2ecf20Sopenharmony_ci/* 38c2ecf20Sopenharmony_ci * mm/zswapd.c 48c2ecf20Sopenharmony_ci * 58c2ecf20Sopenharmony_ci * Copyright (c) 2020-2022 Huawei Technologies Co., Ltd. 68c2ecf20Sopenharmony_ci */ 78c2ecf20Sopenharmony_ci 88c2ecf20Sopenharmony_ci#include <linux/freezer.h> 98c2ecf20Sopenharmony_ci#include <linux/memcg_policy.h> 108c2ecf20Sopenharmony_ci#include <trace/events/vmscan.h> 118c2ecf20Sopenharmony_ci#include <uapi/linux/sched/types.h> 128c2ecf20Sopenharmony_ci#include <linux/zswapd.h> 138c2ecf20Sopenharmony_ci#ifdef CONFIG_RECLAIM_ACCT 148c2ecf20Sopenharmony_ci#include <linux/reclaim_acct.h> 158c2ecf20Sopenharmony_ci#endif 168c2ecf20Sopenharmony_ci 178c2ecf20Sopenharmony_ci#include "zswapd_internal.h" 188c2ecf20Sopenharmony_ci#include "internal.h" 198c2ecf20Sopenharmony_ci 208c2ecf20Sopenharmony_ci#define UNSET_ZRAM_WM_RATIO 0 218c2ecf20Sopenharmony_ci#define ESWAP_PERCENT_CONSTANT 100 228c2ecf20Sopenharmony_ci#define DEFAULT_ZRAM_WM_RATIO 37 238c2ecf20Sopenharmony_ci#define SWAP_MORE_ZRAM (50 * (SZ_1M)) 248c2ecf20Sopenharmony_ci 258c2ecf20Sopenharmony_cistatic wait_queue_head_t snapshotd_wait; 268c2ecf20Sopenharmony_cistatic atomic_t snapshotd_wait_flag; 278c2ecf20Sopenharmony_cistatic atomic_t snapshotd_init_flag = ATOMIC_INIT(0); 288c2ecf20Sopenharmony_cistatic struct task_struct *snapshotd_task; 298c2ecf20Sopenharmony_ci 308c2ecf20Sopenharmony_cistatic pid_t zswapd_pid = -1; 318c2ecf20Sopenharmony_cistatic unsigned long long last_anon_pagefault; 328c2ecf20Sopenharmony_cistatic unsigned long long anon_refault_ratio; 338c2ecf20Sopenharmony_cistatic unsigned long long zswapd_skip_interval; 348c2ecf20Sopenharmony_cistatic unsigned long last_zswapd_time; 358c2ecf20Sopenharmony_cistatic unsigned long last_snapshot_time; 368c2ecf20Sopenharmony_cibool last_round_is_empty; 378c2ecf20Sopenharmony_ci 388c2ecf20Sopenharmony_ci 398c2ecf20Sopenharmony_ciDECLARE_RWSEM(gs_lock); 408c2ecf20Sopenharmony_ciLIST_HEAD(gs_list); 418c2ecf20Sopenharmony_ci 428c2ecf20Sopenharmony_civoid unregister_group_swap(struct group_swap_device *gsdev) 438c2ecf20Sopenharmony_ci{ 448c2ecf20Sopenharmony_ci down_write(&gs_lock); 458c2ecf20Sopenharmony_ci list_del(&gsdev->list); 468c2ecf20Sopenharmony_ci up_write(&gs_lock); 478c2ecf20Sopenharmony_ci 488c2ecf20Sopenharmony_ci kfree(gsdev); 498c2ecf20Sopenharmony_ci} 508c2ecf20Sopenharmony_ciEXPORT_SYMBOL(unregister_group_swap); 518c2ecf20Sopenharmony_ci 528c2ecf20Sopenharmony_cistruct group_swap_device *register_group_swap(struct group_swap_ops *ops, void *priv) 538c2ecf20Sopenharmony_ci{ 548c2ecf20Sopenharmony_ci struct group_swap_device *gsdev = kzalloc(sizeof(struct group_swap_device), GFP_KERNEL); 558c2ecf20Sopenharmony_ci 568c2ecf20Sopenharmony_ci if (!gsdev) 578c2ecf20Sopenharmony_ci return NULL; 588c2ecf20Sopenharmony_ci 598c2ecf20Sopenharmony_ci gsdev->priv = priv; 608c2ecf20Sopenharmony_ci gsdev->ops = ops; 618c2ecf20Sopenharmony_ci 628c2ecf20Sopenharmony_ci down_write(&gs_lock); 638c2ecf20Sopenharmony_ci list_add(&gsdev->list, &gs_list); 648c2ecf20Sopenharmony_ci up_write(&gs_lock); 658c2ecf20Sopenharmony_ci 668c2ecf20Sopenharmony_ci return gsdev; 678c2ecf20Sopenharmony_ci} 688c2ecf20Sopenharmony_ciEXPORT_SYMBOL(register_group_swap); 698c2ecf20Sopenharmony_ci 708c2ecf20Sopenharmony_ciu64 memcg_data_size(struct mem_cgroup *memcg, int type) 718c2ecf20Sopenharmony_ci{ 728c2ecf20Sopenharmony_ci struct group_swap_device *gsdev = NULL; 738c2ecf20Sopenharmony_ci u64 size = 0; 748c2ecf20Sopenharmony_ci 758c2ecf20Sopenharmony_ci down_read(&gs_lock); 768c2ecf20Sopenharmony_ci list_for_each_entry(gsdev, &gs_list, list) 778c2ecf20Sopenharmony_ci size += gsdev->ops->group_data_size(memcg->id.id, type, gsdev->priv); 788c2ecf20Sopenharmony_ci up_read(&gs_lock); 798c2ecf20Sopenharmony_ci 808c2ecf20Sopenharmony_ci return size; 818c2ecf20Sopenharmony_ci} 828c2ecf20Sopenharmony_ci 838c2ecf20Sopenharmony_ciu64 swapin_memcg(struct mem_cgroup *memcg, u64 req_size) 848c2ecf20Sopenharmony_ci{ 858c2ecf20Sopenharmony_ci u64 swap_size = memcg_data_size(memcg, SWAP_SIZE); 868c2ecf20Sopenharmony_ci u64 read_size = 0; 878c2ecf20Sopenharmony_ci u64 ratio = atomic64_read(&memcg->memcg_reclaimed.ub_ufs2zram_ratio); 888c2ecf20Sopenharmony_ci struct group_swap_device *gsdev = NULL; 898c2ecf20Sopenharmony_ci 908c2ecf20Sopenharmony_ci if (req_size > div_u64(swap_size * ratio, ESWAP_PERCENT_CONSTANT)) 918c2ecf20Sopenharmony_ci req_size = div_u64(swap_size * ratio, ESWAP_PERCENT_CONSTANT); 928c2ecf20Sopenharmony_ci down_read(&gs_lock); 938c2ecf20Sopenharmony_ci list_for_each_entry(gsdev, &gs_list, list) { 948c2ecf20Sopenharmony_ci read_size += gsdev->ops->group_read(memcg->id.id, req_size - read_size, 958c2ecf20Sopenharmony_ci gsdev->priv); 968c2ecf20Sopenharmony_ci if (read_size >= req_size) 978c2ecf20Sopenharmony_ci break; 988c2ecf20Sopenharmony_ci } 998c2ecf20Sopenharmony_ci up_read(&gs_lock); 1008c2ecf20Sopenharmony_ci 1018c2ecf20Sopenharmony_ci return read_size; 1028c2ecf20Sopenharmony_ci} 1038c2ecf20Sopenharmony_ci 1048c2ecf20Sopenharmony_cistatic u64 swapout_memcg(struct mem_cgroup *memcg, u64 req_size) 1058c2ecf20Sopenharmony_ci{ 1068c2ecf20Sopenharmony_ci u64 cache_size = memcg_data_size(memcg, CACHE_SIZE); 1078c2ecf20Sopenharmony_ci u64 swap_size = memcg_data_size(memcg, SWAP_SIZE); 1088c2ecf20Sopenharmony_ci u64 all_size = cache_size + swap_size; 1098c2ecf20Sopenharmony_ci u64 write_size = 0; 1108c2ecf20Sopenharmony_ci u32 ratio = atomic_read(&memcg->memcg_reclaimed.ub_zram2ufs_ratio); 1118c2ecf20Sopenharmony_ci struct group_swap_device *gsdev = NULL; 1128c2ecf20Sopenharmony_ci 1138c2ecf20Sopenharmony_ci if (div_u64(all_size * ratio, ESWAP_PERCENT_CONSTANT) <= swap_size) 1148c2ecf20Sopenharmony_ci return 0; 1158c2ecf20Sopenharmony_ci if (req_size > div_u64(all_size * ratio, ESWAP_PERCENT_CONSTANT) - swap_size) 1168c2ecf20Sopenharmony_ci req_size = div_u64(all_size * ratio, ESWAP_PERCENT_CONSTANT) - swap_size; 1178c2ecf20Sopenharmony_ci down_read(&gs_lock); 1188c2ecf20Sopenharmony_ci list_for_each_entry(gsdev, &gs_list, list) { 1198c2ecf20Sopenharmony_ci write_size += gsdev->ops->group_write(memcg->id.id, req_size - write_size, 1208c2ecf20Sopenharmony_ci gsdev->priv); 1218c2ecf20Sopenharmony_ci if (write_size >= req_size) 1228c2ecf20Sopenharmony_ci break; 1238c2ecf20Sopenharmony_ci } 1248c2ecf20Sopenharmony_ci up_read(&gs_lock); 1258c2ecf20Sopenharmony_ci 1268c2ecf20Sopenharmony_ci return write_size; 1278c2ecf20Sopenharmony_ci} 1288c2ecf20Sopenharmony_ci 1298c2ecf20Sopenharmony_cistatic u64 swapout(u64 req_size) 1308c2ecf20Sopenharmony_ci{ 1318c2ecf20Sopenharmony_ci struct mem_cgroup *memcg = NULL; 1328c2ecf20Sopenharmony_ci u64 write_size = 0; 1338c2ecf20Sopenharmony_ci 1348c2ecf20Sopenharmony_ci while ((memcg = get_next_memcg(memcg)) != NULL) { 1358c2ecf20Sopenharmony_ci write_size += swapout_memcg(memcg, req_size - write_size); 1368c2ecf20Sopenharmony_ci if (write_size >= req_size) 1378c2ecf20Sopenharmony_ci break; 1388c2ecf20Sopenharmony_ci } 1398c2ecf20Sopenharmony_ci 1408c2ecf20Sopenharmony_ci return write_size; 1418c2ecf20Sopenharmony_ci} 1428c2ecf20Sopenharmony_ci 1438c2ecf20Sopenharmony_cistatic unsigned long long get_zram_used_pages(void) 1448c2ecf20Sopenharmony_ci{ 1458c2ecf20Sopenharmony_ci struct mem_cgroup *memcg = NULL; 1468c2ecf20Sopenharmony_ci unsigned long long zram_pages = 0; 1478c2ecf20Sopenharmony_ci 1488c2ecf20Sopenharmony_ci while ((memcg = get_next_memcg(memcg)) != NULL) 1498c2ecf20Sopenharmony_ci zram_pages += memcg_data_size(memcg, CACHE_PAGE); 1508c2ecf20Sopenharmony_ci 1518c2ecf20Sopenharmony_ci return zram_pages; 1528c2ecf20Sopenharmony_ci} 1538c2ecf20Sopenharmony_ci 1548c2ecf20Sopenharmony_cistatic unsigned long long get_eswap_used_pages(void) 1558c2ecf20Sopenharmony_ci{ 1568c2ecf20Sopenharmony_ci struct mem_cgroup *memcg = NULL; 1578c2ecf20Sopenharmony_ci unsigned long long eswap_pages = 0; 1588c2ecf20Sopenharmony_ci 1598c2ecf20Sopenharmony_ci while ((memcg = get_next_memcg(memcg)) != NULL) 1608c2ecf20Sopenharmony_ci eswap_pages += memcg_data_size(memcg, SWAP_PAGE); 1618c2ecf20Sopenharmony_ci 1628c2ecf20Sopenharmony_ci return eswap_pages; 1638c2ecf20Sopenharmony_ci} 1648c2ecf20Sopenharmony_ci 1658c2ecf20Sopenharmony_cistatic unsigned long long get_zram_pagefault(void) 1668c2ecf20Sopenharmony_ci{ 1678c2ecf20Sopenharmony_ci struct mem_cgroup *memcg = NULL; 1688c2ecf20Sopenharmony_ci unsigned long long cache_fault = 0; 1698c2ecf20Sopenharmony_ci 1708c2ecf20Sopenharmony_ci while ((memcg = get_next_memcg(memcg)) != NULL) 1718c2ecf20Sopenharmony_ci cache_fault += memcg_data_size(memcg, CACHE_FAULT); 1728c2ecf20Sopenharmony_ci 1738c2ecf20Sopenharmony_ci return cache_fault; 1748c2ecf20Sopenharmony_ci} 1758c2ecf20Sopenharmony_ci 1768c2ecf20Sopenharmony_cistatic unsigned int calc_sys_cur_avail_buffers(void) 1778c2ecf20Sopenharmony_ci{ 1788c2ecf20Sopenharmony_ci const unsigned int percent_constant = 100; 1798c2ecf20Sopenharmony_ci unsigned long freemem; 1808c2ecf20Sopenharmony_ci unsigned long active_file; 1818c2ecf20Sopenharmony_ci unsigned long inactive_file; 1828c2ecf20Sopenharmony_ci unsigned long buffers; 1838c2ecf20Sopenharmony_ci 1848c2ecf20Sopenharmony_ci freemem = global_zone_page_state(NR_FREE_PAGES) * PAGE_SIZE / SZ_1K; 1858c2ecf20Sopenharmony_ci active_file = global_node_page_state(NR_ACTIVE_FILE) * PAGE_SIZE / SZ_1K; 1868c2ecf20Sopenharmony_ci inactive_file = global_node_page_state(NR_INACTIVE_FILE) * PAGE_SIZE / SZ_1K; 1878c2ecf20Sopenharmony_ci 1888c2ecf20Sopenharmony_ci buffers = freemem + inactive_file * get_inactive_file_ratio() / percent_constant + 1898c2ecf20Sopenharmony_ci active_file * get_active_file_ratio() / percent_constant; 1908c2ecf20Sopenharmony_ci 1918c2ecf20Sopenharmony_ci return (buffers * SZ_1K / SZ_1M); /* kb to mb */ 1928c2ecf20Sopenharmony_ci} 1938c2ecf20Sopenharmony_ci 1948c2ecf20Sopenharmony_civoid zswapd_status_show(struct seq_file *m) 1958c2ecf20Sopenharmony_ci{ 1968c2ecf20Sopenharmony_ci unsigned int buffers = calc_sys_cur_avail_buffers(); 1978c2ecf20Sopenharmony_ci 1988c2ecf20Sopenharmony_ci seq_printf(m, "buffer_size %u\n", buffers); 1998c2ecf20Sopenharmony_ci seq_printf(m, "recent_refault %llu\n", anon_refault_ratio); 2008c2ecf20Sopenharmony_ci} 2018c2ecf20Sopenharmony_ci 2028c2ecf20Sopenharmony_cipid_t get_zswapd_pid(void) 2038c2ecf20Sopenharmony_ci{ 2048c2ecf20Sopenharmony_ci return zswapd_pid; 2058c2ecf20Sopenharmony_ci} 2068c2ecf20Sopenharmony_ci 2078c2ecf20Sopenharmony_cistatic bool min_buffer_is_suitable(void) 2088c2ecf20Sopenharmony_ci{ 2098c2ecf20Sopenharmony_ci unsigned int buffers = calc_sys_cur_avail_buffers(); 2108c2ecf20Sopenharmony_ci 2118c2ecf20Sopenharmony_ci if (buffers >= get_min_avail_buffers()) 2128c2ecf20Sopenharmony_ci return true; 2138c2ecf20Sopenharmony_ci 2148c2ecf20Sopenharmony_ci return false; 2158c2ecf20Sopenharmony_ci} 2168c2ecf20Sopenharmony_ci 2178c2ecf20Sopenharmony_cistatic bool buffer_is_suitable(void) 2188c2ecf20Sopenharmony_ci{ 2198c2ecf20Sopenharmony_ci unsigned int buffers = calc_sys_cur_avail_buffers(); 2208c2ecf20Sopenharmony_ci 2218c2ecf20Sopenharmony_ci if (buffers >= get_avail_buffers()) 2228c2ecf20Sopenharmony_ci return true; 2238c2ecf20Sopenharmony_ci 2248c2ecf20Sopenharmony_ci return false; 2258c2ecf20Sopenharmony_ci} 2268c2ecf20Sopenharmony_ci 2278c2ecf20Sopenharmony_cistatic bool high_buffer_is_suitable(void) 2288c2ecf20Sopenharmony_ci{ 2298c2ecf20Sopenharmony_ci unsigned int buffers = calc_sys_cur_avail_buffers(); 2308c2ecf20Sopenharmony_ci 2318c2ecf20Sopenharmony_ci if (buffers >= get_high_avail_buffers()) 2328c2ecf20Sopenharmony_ci return true; 2338c2ecf20Sopenharmony_ci 2348c2ecf20Sopenharmony_ci return false; 2358c2ecf20Sopenharmony_ci} 2368c2ecf20Sopenharmony_ci 2378c2ecf20Sopenharmony_cistatic void snapshot_anon_refaults(void) 2388c2ecf20Sopenharmony_ci{ 2398c2ecf20Sopenharmony_ci struct mem_cgroup *memcg = NULL; 2408c2ecf20Sopenharmony_ci 2418c2ecf20Sopenharmony_ci while ((memcg = get_next_memcg(memcg)) != NULL) 2428c2ecf20Sopenharmony_ci memcg->memcg_reclaimed.reclaimed_pagefault = memcg_data_size(memcg, CACHE_FAULT); 2438c2ecf20Sopenharmony_ci 2448c2ecf20Sopenharmony_ci last_anon_pagefault = get_zram_pagefault(); 2458c2ecf20Sopenharmony_ci last_snapshot_time = jiffies; 2468c2ecf20Sopenharmony_ci} 2478c2ecf20Sopenharmony_ci 2488c2ecf20Sopenharmony_ci/* 2498c2ecf20Sopenharmony_ci * Return true if refault changes between two read operations. 2508c2ecf20Sopenharmony_ci */ 2518c2ecf20Sopenharmony_cistatic bool get_memcg_anon_refault_status(struct mem_cgroup *memcg) 2528c2ecf20Sopenharmony_ci{ 2538c2ecf20Sopenharmony_ci const unsigned int percent_constant = 100; 2548c2ecf20Sopenharmony_ci unsigned long long anon_pagefault; 2558c2ecf20Sopenharmony_ci unsigned long long anon_total; 2568c2ecf20Sopenharmony_ci unsigned long long ratio; 2578c2ecf20Sopenharmony_ci struct mem_cgroup_per_node *mz = NULL; 2588c2ecf20Sopenharmony_ci struct lruvec *lruvec = NULL; 2598c2ecf20Sopenharmony_ci 2608c2ecf20Sopenharmony_ci if (!memcg) 2618c2ecf20Sopenharmony_ci return false; 2628c2ecf20Sopenharmony_ci 2638c2ecf20Sopenharmony_ci anon_pagefault = memcg_data_size(memcg, CACHE_FAULT); 2648c2ecf20Sopenharmony_ci if (anon_pagefault == memcg->memcg_reclaimed.reclaimed_pagefault) 2658c2ecf20Sopenharmony_ci return false; 2668c2ecf20Sopenharmony_ci 2678c2ecf20Sopenharmony_ci mz = mem_cgroup_nodeinfo(memcg, 0); 2688c2ecf20Sopenharmony_ci if (!mz) 2698c2ecf20Sopenharmony_ci return false; 2708c2ecf20Sopenharmony_ci 2718c2ecf20Sopenharmony_ci lruvec = &mz->lruvec; 2728c2ecf20Sopenharmony_ci if (!lruvec) 2738c2ecf20Sopenharmony_ci return false; 2748c2ecf20Sopenharmony_ci 2758c2ecf20Sopenharmony_ci anon_total = lruvec_lru_size(lruvec, LRU_ACTIVE_ANON, MAX_NR_ZONES) + 2768c2ecf20Sopenharmony_ci lruvec_lru_size(lruvec, LRU_INACTIVE_ANON, MAX_NR_ZONES) + 2778c2ecf20Sopenharmony_ci memcg_data_size(memcg, SWAP_PAGE) + memcg_data_size(memcg, CACHE_PAGE); 2788c2ecf20Sopenharmony_ci 2798c2ecf20Sopenharmony_ci ratio = div64_u64((anon_pagefault - memcg->memcg_reclaimed.reclaimed_pagefault) * 2808c2ecf20Sopenharmony_ci percent_constant, (anon_total + 1)); 2818c2ecf20Sopenharmony_ci if (ratio > atomic_read(&memcg->memcg_reclaimed.refault_threshold)) 2828c2ecf20Sopenharmony_ci return true; 2838c2ecf20Sopenharmony_ci 2848c2ecf20Sopenharmony_ci return false; 2858c2ecf20Sopenharmony_ci} 2868c2ecf20Sopenharmony_ci 2878c2ecf20Sopenharmony_cistatic bool get_area_anon_refault_status(void) 2888c2ecf20Sopenharmony_ci{ 2898c2ecf20Sopenharmony_ci const unsigned int percent_constant = 1000; 2908c2ecf20Sopenharmony_ci unsigned long long anon_pagefault; 2918c2ecf20Sopenharmony_ci unsigned long long ratio; 2928c2ecf20Sopenharmony_ci unsigned long long time; 2938c2ecf20Sopenharmony_ci 2948c2ecf20Sopenharmony_ci anon_pagefault = get_zram_pagefault(); 2958c2ecf20Sopenharmony_ci time = jiffies; 2968c2ecf20Sopenharmony_ci if (anon_pagefault == last_anon_pagefault || time == last_snapshot_time) 2978c2ecf20Sopenharmony_ci return false; 2988c2ecf20Sopenharmony_ci 2998c2ecf20Sopenharmony_ci ratio = div_u64((anon_pagefault - last_anon_pagefault) * percent_constant, 3008c2ecf20Sopenharmony_ci (jiffies_to_msecs(time - last_snapshot_time) + 1)); 3018c2ecf20Sopenharmony_ci anon_refault_ratio = ratio; 3028c2ecf20Sopenharmony_ci 3038c2ecf20Sopenharmony_ci if (ratio > get_area_anon_refault_threshold()) 3048c2ecf20Sopenharmony_ci return true; 3058c2ecf20Sopenharmony_ci 3068c2ecf20Sopenharmony_ci return false; 3078c2ecf20Sopenharmony_ci} 3088c2ecf20Sopenharmony_ci 3098c2ecf20Sopenharmony_civoid wakeup_snapshotd(void) 3108c2ecf20Sopenharmony_ci{ 3118c2ecf20Sopenharmony_ci unsigned long snapshot_interval; 3128c2ecf20Sopenharmony_ci 3138c2ecf20Sopenharmony_ci snapshot_interval = jiffies_to_msecs(jiffies - last_snapshot_time); 3148c2ecf20Sopenharmony_ci if (snapshot_interval >= get_anon_refault_snapshot_min_interval()) { 3158c2ecf20Sopenharmony_ci atomic_set(&snapshotd_wait_flag, 1); 3168c2ecf20Sopenharmony_ci wake_up_interruptible(&snapshotd_wait); 3178c2ecf20Sopenharmony_ci } 3188c2ecf20Sopenharmony_ci} 3198c2ecf20Sopenharmony_ci 3208c2ecf20Sopenharmony_cistatic int snapshotd(void *p) 3218c2ecf20Sopenharmony_ci{ 3228c2ecf20Sopenharmony_ci int ret; 3238c2ecf20Sopenharmony_ci 3248c2ecf20Sopenharmony_ci while (!kthread_should_stop()) { 3258c2ecf20Sopenharmony_ci ret = wait_event_interruptible(snapshotd_wait, atomic_read(&snapshotd_wait_flag)); 3268c2ecf20Sopenharmony_ci if (ret) 3278c2ecf20Sopenharmony_ci continue; 3288c2ecf20Sopenharmony_ci 3298c2ecf20Sopenharmony_ci atomic_set(&snapshotd_wait_flag, 0); 3308c2ecf20Sopenharmony_ci 3318c2ecf20Sopenharmony_ci snapshot_anon_refaults(); 3328c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_SNAPSHOT_TIMES); 3338c2ecf20Sopenharmony_ci } 3348c2ecf20Sopenharmony_ci 3358c2ecf20Sopenharmony_ci return 0; 3368c2ecf20Sopenharmony_ci} 3378c2ecf20Sopenharmony_ci 3388c2ecf20Sopenharmony_civoid set_snapshotd_init_flag(unsigned int val) 3398c2ecf20Sopenharmony_ci{ 3408c2ecf20Sopenharmony_ci atomic_set(&snapshotd_init_flag, val); 3418c2ecf20Sopenharmony_ci} 3428c2ecf20Sopenharmony_ci 3438c2ecf20Sopenharmony_ci/* 3448c2ecf20Sopenharmony_ci * This snapshotd start function will be called by init. 3458c2ecf20Sopenharmony_ci */ 3468c2ecf20Sopenharmony_ciint snapshotd_run(void) 3478c2ecf20Sopenharmony_ci{ 3488c2ecf20Sopenharmony_ci atomic_set(&snapshotd_wait_flag, 0); 3498c2ecf20Sopenharmony_ci init_waitqueue_head(&snapshotd_wait); 3508c2ecf20Sopenharmony_ci 3518c2ecf20Sopenharmony_ci snapshotd_task = kthread_run(snapshotd, NULL, "snapshotd"); 3528c2ecf20Sopenharmony_ci if (IS_ERR(snapshotd_task)) { 3538c2ecf20Sopenharmony_ci pr_err("Failed to start snapshotd\n"); 3548c2ecf20Sopenharmony_ci return PTR_ERR(snapshotd_task); 3558c2ecf20Sopenharmony_ci } 3568c2ecf20Sopenharmony_ci 3578c2ecf20Sopenharmony_ci return 0; 3588c2ecf20Sopenharmony_ci} 3598c2ecf20Sopenharmony_ci 3608c2ecf20Sopenharmony_cistatic int __init snapshotd_init(void) 3618c2ecf20Sopenharmony_ci{ 3628c2ecf20Sopenharmony_ci snapshotd_run(); 3638c2ecf20Sopenharmony_ci 3648c2ecf20Sopenharmony_ci return 0; 3658c2ecf20Sopenharmony_ci} 3668c2ecf20Sopenharmony_cimodule_init(snapshotd_init); 3678c2ecf20Sopenharmony_ci 3688c2ecf20Sopenharmony_cistatic int get_zswapd_eswap_policy(void) 3698c2ecf20Sopenharmony_ci{ 3708c2ecf20Sopenharmony_ci if (get_zram_wm_ratio() == UNSET_ZRAM_WM_RATIO) 3718c2ecf20Sopenharmony_ci return CHECK_BUFFER_ONLY; 3728c2ecf20Sopenharmony_ci else 3738c2ecf20Sopenharmony_ci return CHECK_BUFFER_ZRAMRATIO_BOTH; 3748c2ecf20Sopenharmony_ci} 3758c2ecf20Sopenharmony_ci 3768c2ecf20Sopenharmony_cistatic unsigned int get_policy_zram_wm_ratio(void) 3778c2ecf20Sopenharmony_ci{ 3788c2ecf20Sopenharmony_ci enum zswapd_eswap_policy policy = get_zswapd_eswap_policy(); 3798c2ecf20Sopenharmony_ci 3808c2ecf20Sopenharmony_ci if (policy == CHECK_BUFFER_ONLY) 3818c2ecf20Sopenharmony_ci return DEFAULT_ZRAM_WM_RATIO; 3828c2ecf20Sopenharmony_ci else 3838c2ecf20Sopenharmony_ci return get_zram_wm_ratio(); 3848c2ecf20Sopenharmony_ci} 3858c2ecf20Sopenharmony_ci 3868c2ecf20Sopenharmony_ciint get_zram_current_watermark(void) 3878c2ecf20Sopenharmony_ci{ 3888c2ecf20Sopenharmony_ci long long diff_buffers; 3898c2ecf20Sopenharmony_ci const unsigned int percent_constant = 10; 3908c2ecf20Sopenharmony_ci u64 nr_total; 3918c2ecf20Sopenharmony_ci unsigned int zram_wm_ratio = get_policy_zram_wm_ratio(); 3928c2ecf20Sopenharmony_ci 3938c2ecf20Sopenharmony_ci nr_total = totalram_pages(); 3948c2ecf20Sopenharmony_ci /* B_target - B_current */ 3958c2ecf20Sopenharmony_ci diff_buffers = get_avail_buffers() - calc_sys_cur_avail_buffers(); 3968c2ecf20Sopenharmony_ci /* MB to page */ 3978c2ecf20Sopenharmony_ci diff_buffers *= SZ_1M / PAGE_SIZE; 3988c2ecf20Sopenharmony_ci /* after_comp to before_comp */ 3998c2ecf20Sopenharmony_ci diff_buffers *= get_compress_ratio(); 4008c2ecf20Sopenharmony_ci /* page to ratio */ 4018c2ecf20Sopenharmony_ci diff_buffers = div64_s64(diff_buffers * percent_constant, nr_total); 4028c2ecf20Sopenharmony_ci 4038c2ecf20Sopenharmony_ci return min((long long)zram_wm_ratio, zram_wm_ratio - diff_buffers); 4048c2ecf20Sopenharmony_ci} 4058c2ecf20Sopenharmony_ci 4068c2ecf20Sopenharmony_cibool zram_watermark_ok(void) 4078c2ecf20Sopenharmony_ci{ 4088c2ecf20Sopenharmony_ci const unsigned int percent_constant = 100; 4098c2ecf20Sopenharmony_ci u64 nr_zram_used; 4108c2ecf20Sopenharmony_ci u64 nr_wm; 4118c2ecf20Sopenharmony_ci u64 ratio; 4128c2ecf20Sopenharmony_ci 4138c2ecf20Sopenharmony_ci ratio = get_zram_current_watermark(); 4148c2ecf20Sopenharmony_ci nr_zram_used = get_zram_used_pages(); 4158c2ecf20Sopenharmony_ci nr_wm = div_u64(totalram_pages() * ratio, percent_constant); 4168c2ecf20Sopenharmony_ci if (nr_zram_used > nr_wm) 4178c2ecf20Sopenharmony_ci return true; 4188c2ecf20Sopenharmony_ci 4198c2ecf20Sopenharmony_ci return false; 4208c2ecf20Sopenharmony_ci} 4218c2ecf20Sopenharmony_ci 4228c2ecf20Sopenharmony_cibool zram_watermark_exceed(void) 4238c2ecf20Sopenharmony_ci{ 4248c2ecf20Sopenharmony_ci u64 nr_zram_used; 4258c2ecf20Sopenharmony_ci const unsigned long long nr_wm = get_zram_critical_threshold() * (SZ_1M / PAGE_SIZE); 4268c2ecf20Sopenharmony_ci 4278c2ecf20Sopenharmony_ci if (!nr_wm) 4288c2ecf20Sopenharmony_ci return false; 4298c2ecf20Sopenharmony_ci 4308c2ecf20Sopenharmony_ci nr_zram_used = get_zram_used_pages(); 4318c2ecf20Sopenharmony_ci if (nr_zram_used > nr_wm) 4328c2ecf20Sopenharmony_ci return true; 4338c2ecf20Sopenharmony_ci return false; 4348c2ecf20Sopenharmony_ci} 4358c2ecf20Sopenharmony_ci 4368c2ecf20Sopenharmony_civoid wakeup_zswapd(pg_data_t *pgdat) 4378c2ecf20Sopenharmony_ci{ 4388c2ecf20Sopenharmony_ci unsigned long interval; 4398c2ecf20Sopenharmony_ci 4408c2ecf20Sopenharmony_ci if (IS_ERR(pgdat->zswapd)) 4418c2ecf20Sopenharmony_ci return; 4428c2ecf20Sopenharmony_ci 4438c2ecf20Sopenharmony_ci if (!wq_has_sleeper(&pgdat->zswapd_wait)) 4448c2ecf20Sopenharmony_ci return; 4458c2ecf20Sopenharmony_ci 4468c2ecf20Sopenharmony_ci /* 4478c2ecf20Sopenharmony_ci * make anon pagefault snapshots 4488c2ecf20Sopenharmony_ci * wake up snapshotd 4498c2ecf20Sopenharmony_ci */ 4508c2ecf20Sopenharmony_ci if (atomic_read(&snapshotd_init_flag) == 1) 4518c2ecf20Sopenharmony_ci wakeup_snapshotd(); 4528c2ecf20Sopenharmony_ci 4538c2ecf20Sopenharmony_ci /* wake up when the buffer is lower than min_avail_buffer */ 4548c2ecf20Sopenharmony_ci if (min_buffer_is_suitable()) 4558c2ecf20Sopenharmony_ci return; 4568c2ecf20Sopenharmony_ci 4578c2ecf20Sopenharmony_ci interval = jiffies_to_msecs(jiffies - last_zswapd_time); 4588c2ecf20Sopenharmony_ci if (interval < zswapd_skip_interval) { 4598c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_EMPTY_ROUND_SKIP_TIMES); 4608c2ecf20Sopenharmony_ci return; 4618c2ecf20Sopenharmony_ci } 4628c2ecf20Sopenharmony_ci 4638c2ecf20Sopenharmony_ci atomic_set(&pgdat->zswapd_wait_flag, 1); 4648c2ecf20Sopenharmony_ci wake_up_interruptible(&pgdat->zswapd_wait); 4658c2ecf20Sopenharmony_ci} 4668c2ecf20Sopenharmony_ci 4678c2ecf20Sopenharmony_civoid wake_all_zswapd(void) 4688c2ecf20Sopenharmony_ci{ 4698c2ecf20Sopenharmony_ci pg_data_t *pgdat = NULL; 4708c2ecf20Sopenharmony_ci int nid; 4718c2ecf20Sopenharmony_ci 4728c2ecf20Sopenharmony_ci for_each_online_node(nid) { 4738c2ecf20Sopenharmony_ci pgdat = NODE_DATA(nid); 4748c2ecf20Sopenharmony_ci wakeup_zswapd(pgdat); 4758c2ecf20Sopenharmony_ci } 4768c2ecf20Sopenharmony_ci} 4778c2ecf20Sopenharmony_ci 4788c2ecf20Sopenharmony_ci#ifdef CONFIG_HYPERHOLD_FILE_LRU 4798c2ecf20Sopenharmony_cistatic void zswapd_shrink_active_list(unsigned long nr_to_scan, 4808c2ecf20Sopenharmony_ci struct lruvec *lruvec, struct scan_control *sc, enum lru_list lru) 4818c2ecf20Sopenharmony_ci{ 4828c2ecf20Sopenharmony_ci unsigned int nr_deactivate; 4838c2ecf20Sopenharmony_ci unsigned long nr_scanned; 4848c2ecf20Sopenharmony_ci unsigned long nr_taken; 4858c2ecf20Sopenharmony_ci 4868c2ecf20Sopenharmony_ci struct page *page = NULL; 4878c2ecf20Sopenharmony_ci struct pglist_data *pgdat = lruvec_pgdat(lruvec); 4888c2ecf20Sopenharmony_ci unsigned long *node_anon_cost = &pgdat->__lruvec.anon_cost; 4898c2ecf20Sopenharmony_ci unsigned long *anon_cost = &lruvec->anon_cost; 4908c2ecf20Sopenharmony_ci LIST_HEAD(l_inactive); 4918c2ecf20Sopenharmony_ci LIST_HEAD(l_hold); 4928c2ecf20Sopenharmony_ci 4938c2ecf20Sopenharmony_ci lru_add_drain(); 4948c2ecf20Sopenharmony_ci 4958c2ecf20Sopenharmony_ci spin_lock_irq(&pgdat->lru_lock); 4968c2ecf20Sopenharmony_ci nr_taken = isolate_lru_pages(nr_to_scan, lruvec, &l_hold, &nr_scanned, sc, lru); 4978c2ecf20Sopenharmony_ci __mod_node_page_state(pgdat, NR_ISOLATED_ANON, nr_taken); 4988c2ecf20Sopenharmony_ci *anon_cost += nr_taken; 4998c2ecf20Sopenharmony_ci *node_anon_cost += nr_taken; 5008c2ecf20Sopenharmony_ci __count_vm_events(PGREFILL, nr_scanned); 5018c2ecf20Sopenharmony_ci count_memcg_events(lruvec_memcg(lruvec), PGREFILL, nr_scanned); 5028c2ecf20Sopenharmony_ci spin_unlock_irq(&pgdat->lru_lock); 5038c2ecf20Sopenharmony_ci 5048c2ecf20Sopenharmony_ci while (!list_empty(&l_hold)) { 5058c2ecf20Sopenharmony_ci cond_resched(); 5068c2ecf20Sopenharmony_ci page = lru_to_page(&l_hold); 5078c2ecf20Sopenharmony_ci list_del(&page->lru); 5088c2ecf20Sopenharmony_ci 5098c2ecf20Sopenharmony_ci if (unlikely(!page_evictable(page))) { 5108c2ecf20Sopenharmony_ci putback_lru_page(page); 5118c2ecf20Sopenharmony_ci continue; 5128c2ecf20Sopenharmony_ci } 5138c2ecf20Sopenharmony_ci 5148c2ecf20Sopenharmony_ci ClearPageActive(page); 5158c2ecf20Sopenharmony_ci SetPageWorkingset(page); 5168c2ecf20Sopenharmony_ci list_add(&page->lru, &l_inactive); 5178c2ecf20Sopenharmony_ci } 5188c2ecf20Sopenharmony_ci 5198c2ecf20Sopenharmony_ci spin_lock_irq(&pgdat->lru_lock); 5208c2ecf20Sopenharmony_ci nr_deactivate = move_pages_to_lru(lruvec, &l_inactive); 5218c2ecf20Sopenharmony_ci __mod_node_page_state(pgdat, NR_ISOLATED_ANON, -nr_taken); 5228c2ecf20Sopenharmony_ci spin_unlock_irq(&pgdat->lru_lock); 5238c2ecf20Sopenharmony_ci 5248c2ecf20Sopenharmony_ci mem_cgroup_uncharge_list(&l_inactive); 5258c2ecf20Sopenharmony_ci free_unref_page_list(&l_inactive); 5268c2ecf20Sopenharmony_ci 5278c2ecf20Sopenharmony_ci trace_mm_vmscan_lru_zswapd_shrink_active(pgdat->node_id, nr_taken, 5288c2ecf20Sopenharmony_ci nr_deactivate, sc->priority); 5298c2ecf20Sopenharmony_ci} 5308c2ecf20Sopenharmony_ci 5318c2ecf20Sopenharmony_cistatic unsigned long zswapd_shrink_list(enum lru_list lru, 5328c2ecf20Sopenharmony_ci unsigned long nr_to_scan, struct lruvec *lruvec, 5338c2ecf20Sopenharmony_ci struct scan_control *sc) 5348c2ecf20Sopenharmony_ci{ 5358c2ecf20Sopenharmony_ci#ifdef CONFIG_RECLAIM_ACCT 5368c2ecf20Sopenharmony_ci unsigned long nr_reclaimed; 5378c2ecf20Sopenharmony_ci 5388c2ecf20Sopenharmony_ci reclaimacct_substage_start(RA_SHRINKANON); 5398c2ecf20Sopenharmony_ci#endif 5408c2ecf20Sopenharmony_ci if (is_active_lru(lru)) { 5418c2ecf20Sopenharmony_ci if (sc->may_deactivate & (1 << is_file_lru(lru))) 5428c2ecf20Sopenharmony_ci zswapd_shrink_active_list(nr_to_scan, lruvec, sc, lru); 5438c2ecf20Sopenharmony_ci else 5448c2ecf20Sopenharmony_ci sc->skipped_deactivate = 1; 5458c2ecf20Sopenharmony_ci#ifdef CONFIG_RECLAIM_ACCT 5468c2ecf20Sopenharmony_ci reclaimacct_substage_end(RA_SHRINKANON, 0, NULL); 5478c2ecf20Sopenharmony_ci#endif 5488c2ecf20Sopenharmony_ci return 0; 5498c2ecf20Sopenharmony_ci } 5508c2ecf20Sopenharmony_ci 5518c2ecf20Sopenharmony_ci#ifdef CONFIG_RECLAIM_ACCT 5528c2ecf20Sopenharmony_ci nr_reclaimed = shrink_inactive_list(nr_to_scan, lruvec, sc, lru); 5538c2ecf20Sopenharmony_ci reclaimacct_substage_end(RA_SHRINKANON, nr_reclaimed, NULL); 5548c2ecf20Sopenharmony_ci return nr_reclaimed; 5558c2ecf20Sopenharmony_ci#else 5568c2ecf20Sopenharmony_ci return shrink_inactive_list(nr_to_scan, lruvec, sc, lru); 5578c2ecf20Sopenharmony_ci#endif 5588c2ecf20Sopenharmony_ci} 5598c2ecf20Sopenharmony_ci 5608c2ecf20Sopenharmony_cistatic void zswapd_shrink_anon_memcg(struct pglist_data *pgdat, 5618c2ecf20Sopenharmony_ci struct mem_cgroup *memcg, struct scan_control *sc, unsigned long *nr) 5628c2ecf20Sopenharmony_ci{ 5638c2ecf20Sopenharmony_ci struct lruvec *lruvec = mem_cgroup_lruvec(memcg, pgdat); 5648c2ecf20Sopenharmony_ci unsigned long nr_reclaimed = 0; 5658c2ecf20Sopenharmony_ci unsigned long nr_to_scan; 5668c2ecf20Sopenharmony_ci struct blk_plug plug; 5678c2ecf20Sopenharmony_ci enum lru_list lru; 5688c2ecf20Sopenharmony_ci 5698c2ecf20Sopenharmony_ci blk_start_plug(&plug); 5708c2ecf20Sopenharmony_ci 5718c2ecf20Sopenharmony_ci while (nr[LRU_INACTIVE_ANON] || nr[LRU_ACTIVE_ANON]) { 5728c2ecf20Sopenharmony_ci for (lru = 0; lru <= LRU_ACTIVE_ANON; lru++) { 5738c2ecf20Sopenharmony_ci if (nr[lru]) { 5748c2ecf20Sopenharmony_ci nr_to_scan = min(nr[lru], SWAP_CLUSTER_MAX); 5758c2ecf20Sopenharmony_ci nr[lru] -= nr_to_scan; 5768c2ecf20Sopenharmony_ci nr_reclaimed += zswapd_shrink_list(lru, 5778c2ecf20Sopenharmony_ci nr_to_scan, lruvec, sc); 5788c2ecf20Sopenharmony_ci } 5798c2ecf20Sopenharmony_ci } 5808c2ecf20Sopenharmony_ci } 5818c2ecf20Sopenharmony_ci 5828c2ecf20Sopenharmony_ci blk_finish_plug(&plug); 5838c2ecf20Sopenharmony_ci sc->nr_reclaimed += nr_reclaimed; 5848c2ecf20Sopenharmony_ci} 5858c2ecf20Sopenharmony_ci#endif 5868c2ecf20Sopenharmony_ci 5878c2ecf20Sopenharmony_cistatic bool zswapd_shrink_anon(pg_data_t *pgdat, struct scan_control *sc) 5888c2ecf20Sopenharmony_ci{ 5898c2ecf20Sopenharmony_ci const unsigned int percent_constant = 100; 5908c2ecf20Sopenharmony_ci struct mem_cgroup *memcg = NULL; 5918c2ecf20Sopenharmony_ci unsigned long nr[NR_LRU_LISTS]; 5928c2ecf20Sopenharmony_ci 5938c2ecf20Sopenharmony_ci while ((memcg = get_next_memcg(memcg)) != NULL) { 5948c2ecf20Sopenharmony_ci struct lruvec *lruvec = mem_cgroup_lruvec(memcg, pgdat); 5958c2ecf20Sopenharmony_ci u64 nr_active, nr_inactive, nr_zram, nr_eswap, zram_ratio; 5968c2ecf20Sopenharmony_ci 5978c2ecf20Sopenharmony_ci /* reclaim and try to meet the high buffer watermark */ 5988c2ecf20Sopenharmony_ci if (high_buffer_is_suitable()) { 5998c2ecf20Sopenharmony_ci get_next_memcg_break(memcg); 6008c2ecf20Sopenharmony_ci break; 6018c2ecf20Sopenharmony_ci } 6028c2ecf20Sopenharmony_ci 6038c2ecf20Sopenharmony_ci if (get_memcg_anon_refault_status(memcg)) { 6048c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_MEMCG_REFAULT_SKIP); 6058c2ecf20Sopenharmony_ci continue; 6068c2ecf20Sopenharmony_ci } 6078c2ecf20Sopenharmony_ci 6088c2ecf20Sopenharmony_ci nr_active = lruvec_lru_size(lruvec, LRU_ACTIVE_ANON, MAX_NR_ZONES); 6098c2ecf20Sopenharmony_ci nr_inactive = lruvec_lru_size(lruvec, LRU_INACTIVE_ANON, MAX_NR_ZONES); 6108c2ecf20Sopenharmony_ci nr_zram = memcg_data_size(memcg, CACHE_PAGE); 6118c2ecf20Sopenharmony_ci nr_eswap = memcg_data_size(memcg, SWAP_PAGE); 6128c2ecf20Sopenharmony_ci 6138c2ecf20Sopenharmony_ci zram_ratio = div64_u64((nr_zram + nr_eswap) * percent_constant, 6148c2ecf20Sopenharmony_ci (nr_inactive + nr_active + nr_zram + nr_eswap + 1)); 6158c2ecf20Sopenharmony_ci if (zram_ratio >= (u32)atomic_read(&memcg->memcg_reclaimed.ub_mem2zram_ratio)) { 6168c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_MEMCG_RATIO_SKIP); 6178c2ecf20Sopenharmony_ci continue; 6188c2ecf20Sopenharmony_ci } 6198c2ecf20Sopenharmony_ci 6208c2ecf20Sopenharmony_ci nr[LRU_ACTIVE_ANON] = nr_active >> (unsigned int)sc->priority; 6218c2ecf20Sopenharmony_ci nr[LRU_INACTIVE_ANON] = nr_inactive >> (unsigned int)sc->priority; 6228c2ecf20Sopenharmony_ci nr[LRU_ACTIVE_FILE] = 0; 6238c2ecf20Sopenharmony_ci nr[LRU_INACTIVE_FILE] = 0; 6248c2ecf20Sopenharmony_ci 6258c2ecf20Sopenharmony_ci#ifdef CONFIG_HYPERHOLD_FILE_LRU 6268c2ecf20Sopenharmony_ci zswapd_shrink_anon_memcg(pgdat, memcg, sc, nr); 6278c2ecf20Sopenharmony_ci#else 6288c2ecf20Sopenharmony_ci shrink_lruvec(lruvec, sc); 6298c2ecf20Sopenharmony_ci#endif 6308c2ecf20Sopenharmony_ci shrink_slab(sc->gfp_mask, pgdat->node_id, memcg, sc->priority); 6318c2ecf20Sopenharmony_ci 6328c2ecf20Sopenharmony_ci if (sc->nr_reclaimed >= sc->nr_to_reclaim) { 6338c2ecf20Sopenharmony_ci get_next_memcg_break(memcg); 6348c2ecf20Sopenharmony_ci break; 6358c2ecf20Sopenharmony_ci } 6368c2ecf20Sopenharmony_ci } 6378c2ecf20Sopenharmony_ci 6388c2ecf20Sopenharmony_ci return sc->nr_scanned >= sc->nr_to_reclaim; 6398c2ecf20Sopenharmony_ci} 6408c2ecf20Sopenharmony_ci 6418c2ecf20Sopenharmony_cistatic u64 __calc_nr_to_reclaim(void) 6428c2ecf20Sopenharmony_ci{ 6438c2ecf20Sopenharmony_ci unsigned int buffers; 6448c2ecf20Sopenharmony_ci unsigned int high_buffers; 6458c2ecf20Sopenharmony_ci unsigned int max_reclaim_size; 6468c2ecf20Sopenharmony_ci u64 reclaim_size = 0; 6478c2ecf20Sopenharmony_ci 6488c2ecf20Sopenharmony_ci high_buffers = get_high_avail_buffers(); 6498c2ecf20Sopenharmony_ci buffers = calc_sys_cur_avail_buffers(); 6508c2ecf20Sopenharmony_ci max_reclaim_size = get_zswapd_max_reclaim_size(); 6518c2ecf20Sopenharmony_ci if (buffers < high_buffers) 6528c2ecf20Sopenharmony_ci reclaim_size = high_buffers - buffers; 6538c2ecf20Sopenharmony_ci 6548c2ecf20Sopenharmony_ci /* once max reclaim target is max_reclaim_size */ 6558c2ecf20Sopenharmony_ci reclaim_size = min(reclaim_size, (u64)max_reclaim_size); 6568c2ecf20Sopenharmony_ci 6578c2ecf20Sopenharmony_ci /* MB to pages */ 6588c2ecf20Sopenharmony_ci return div_u64(reclaim_size * SZ_1M, PAGE_SIZE); 6598c2ecf20Sopenharmony_ci} 6608c2ecf20Sopenharmony_ci 6618c2ecf20Sopenharmony_cistatic void zswapd_shrink_node(pg_data_t *pgdat) 6628c2ecf20Sopenharmony_ci{ 6638c2ecf20Sopenharmony_ci struct scan_control sc = { 6648c2ecf20Sopenharmony_ci .gfp_mask = GFP_KERNEL, 6658c2ecf20Sopenharmony_ci .order = 0, 6668c2ecf20Sopenharmony_ci .priority = DEF_PRIORITY / 2, 6678c2ecf20Sopenharmony_ci .may_writepage = !laptop_mode, 6688c2ecf20Sopenharmony_ci .may_unmap = 1, 6698c2ecf20Sopenharmony_ci .may_swap = 1, 6708c2ecf20Sopenharmony_ci .reclaim_idx = MAX_NR_ZONES - 1, 6718c2ecf20Sopenharmony_ci }; 6728c2ecf20Sopenharmony_ci const unsigned int increase_rate = 2; 6738c2ecf20Sopenharmony_ci 6748c2ecf20Sopenharmony_ci do { 6758c2ecf20Sopenharmony_ci unsigned long nr_reclaimed = sc.nr_reclaimed; 6768c2ecf20Sopenharmony_ci bool raise_priority = true; 6778c2ecf20Sopenharmony_ci 6788c2ecf20Sopenharmony_ci /* reclaim and try to meet the high buffer watermark */ 6798c2ecf20Sopenharmony_ci if (high_buffer_is_suitable()) 6808c2ecf20Sopenharmony_ci break; 6818c2ecf20Sopenharmony_ci 6828c2ecf20Sopenharmony_ci sc.nr_scanned = 0; 6838c2ecf20Sopenharmony_ci sc.nr_to_reclaim = __calc_nr_to_reclaim(); 6848c2ecf20Sopenharmony_ci 6858c2ecf20Sopenharmony_ci if (zswapd_shrink_anon(pgdat, &sc)) 6868c2ecf20Sopenharmony_ci raise_priority = false; 6878c2ecf20Sopenharmony_ci count_vm_events(ZSWAPD_SCANNED, sc.nr_scanned); 6888c2ecf20Sopenharmony_ci count_vm_events(ZSWAPD_RECLAIMED, sc.nr_reclaimed); 6898c2ecf20Sopenharmony_ci if (try_to_freeze() || kthread_should_stop()) 6908c2ecf20Sopenharmony_ci break; 6918c2ecf20Sopenharmony_ci 6928c2ecf20Sopenharmony_ci nr_reclaimed = sc.nr_reclaimed - nr_reclaimed; 6938c2ecf20Sopenharmony_ci if (raise_priority || !nr_reclaimed) 6948c2ecf20Sopenharmony_ci sc.priority--; 6958c2ecf20Sopenharmony_ci } while (sc.priority >= 1); 6968c2ecf20Sopenharmony_ci 6978c2ecf20Sopenharmony_ci /* 6988c2ecf20Sopenharmony_ci * When meets the first empty round, set the interval to t. 6998c2ecf20Sopenharmony_ci * If the following round is still empty, set the intervall 7008c2ecf20Sopenharmony_ci * to 2t. If the round is always empty, then 4t, 8t, and so on. 7018c2ecf20Sopenharmony_ci * But make sure the interval is not more than the max_skip_interval. 7028c2ecf20Sopenharmony_ci * Once a non-empty round occurs, reset the interval to 0. 7038c2ecf20Sopenharmony_ci */ 7048c2ecf20Sopenharmony_ci if (sc.nr_reclaimed < get_empty_round_check_threshold()) { 7058c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_EMPTY_ROUND); 7068c2ecf20Sopenharmony_ci if (last_round_is_empty) 7078c2ecf20Sopenharmony_ci zswapd_skip_interval = min(zswapd_skip_interval * 7088c2ecf20Sopenharmony_ci increase_rate, get_max_skip_interval()); 7098c2ecf20Sopenharmony_ci else 7108c2ecf20Sopenharmony_ci zswapd_skip_interval = get_empty_round_skip_interval(); 7118c2ecf20Sopenharmony_ci last_round_is_empty = true; 7128c2ecf20Sopenharmony_ci } else { 7138c2ecf20Sopenharmony_ci zswapd_skip_interval = 0; 7148c2ecf20Sopenharmony_ci last_round_is_empty = false; 7158c2ecf20Sopenharmony_ci } 7168c2ecf20Sopenharmony_ci} 7178c2ecf20Sopenharmony_ci 7188c2ecf20Sopenharmony_ciu64 zram_watermark_diff(void) 7198c2ecf20Sopenharmony_ci{ 7208c2ecf20Sopenharmony_ci const unsigned int percent_constant = 100; 7218c2ecf20Sopenharmony_ci u64 nr_zram_used; 7228c2ecf20Sopenharmony_ci u64 nr_wm; 7238c2ecf20Sopenharmony_ci u64 ratio; 7248c2ecf20Sopenharmony_ci 7258c2ecf20Sopenharmony_ci ratio = get_zram_current_watermark(); 7268c2ecf20Sopenharmony_ci nr_zram_used = get_zram_used_pages(); 7278c2ecf20Sopenharmony_ci nr_wm = div_u64(totalram_pages() * ratio, percent_constant); 7288c2ecf20Sopenharmony_ci if (nr_zram_used > nr_wm) 7298c2ecf20Sopenharmony_ci return (nr_zram_used - nr_wm) * PAGE_SIZE + SWAP_MORE_ZRAM; 7308c2ecf20Sopenharmony_ci 7318c2ecf20Sopenharmony_ci return 0; 7328c2ecf20Sopenharmony_ci} 7338c2ecf20Sopenharmony_ci 7348c2ecf20Sopenharmony_ciu64 zswapd_buffer_diff(void) 7358c2ecf20Sopenharmony_ci{ 7368c2ecf20Sopenharmony_ci u64 buffers; 7378c2ecf20Sopenharmony_ci u64 avail; 7388c2ecf20Sopenharmony_ci 7398c2ecf20Sopenharmony_ci buffers = calc_sys_cur_avail_buffers(); 7408c2ecf20Sopenharmony_ci avail = get_high_avail_buffers(); 7418c2ecf20Sopenharmony_ci if (buffers < avail) 7428c2ecf20Sopenharmony_ci return (avail - buffers) * SZ_1M; 7438c2ecf20Sopenharmony_ci 7448c2ecf20Sopenharmony_ci return 0; 7458c2ecf20Sopenharmony_ci} 7468c2ecf20Sopenharmony_ci 7478c2ecf20Sopenharmony_ciu64 get_do_eswap_size(bool refault) 7488c2ecf20Sopenharmony_ci{ 7498c2ecf20Sopenharmony_ci u64 size = 0; 7508c2ecf20Sopenharmony_ci enum zswapd_eswap_policy policy = get_zswapd_eswap_policy(); 7518c2ecf20Sopenharmony_ci 7528c2ecf20Sopenharmony_ci if (policy == CHECK_BUFFER_ZRAMRATIO_BOTH) 7538c2ecf20Sopenharmony_ci size = max(zram_watermark_diff(), zswapd_buffer_diff()); 7548c2ecf20Sopenharmony_ci else if (policy == CHECK_BUFFER_ONLY && (zram_watermark_ok() || refault)) 7558c2ecf20Sopenharmony_ci size = zswapd_buffer_diff(); 7568c2ecf20Sopenharmony_ci 7578c2ecf20Sopenharmony_ci return size; 7588c2ecf20Sopenharmony_ci} 7598c2ecf20Sopenharmony_ci 7608c2ecf20Sopenharmony_cistatic int zswapd(void *p) 7618c2ecf20Sopenharmony_ci{ 7628c2ecf20Sopenharmony_ci struct task_struct *tsk = current; 7638c2ecf20Sopenharmony_ci pg_data_t *pgdat = (pg_data_t *)p; 7648c2ecf20Sopenharmony_ci const struct cpumask *cpumask = cpumask_of_node(pgdat->node_id); 7658c2ecf20Sopenharmony_ci#ifdef CONFIG_RECLAIM_ACCT 7668c2ecf20Sopenharmony_ci struct reclaim_acct ra = {0}; 7678c2ecf20Sopenharmony_ci#endif 7688c2ecf20Sopenharmony_ci 7698c2ecf20Sopenharmony_ci /* save zswapd pid for schedule strategy */ 7708c2ecf20Sopenharmony_ci zswapd_pid = tsk->pid; 7718c2ecf20Sopenharmony_ci 7728c2ecf20Sopenharmony_ci 7738c2ecf20Sopenharmony_ci if (!cpumask_empty(cpumask)) 7748c2ecf20Sopenharmony_ci set_cpus_allowed_ptr(tsk, cpumask); 7758c2ecf20Sopenharmony_ci 7768c2ecf20Sopenharmony_ci set_freezable(); 7778c2ecf20Sopenharmony_ci 7788c2ecf20Sopenharmony_ci while (!kthread_should_stop()) { 7798c2ecf20Sopenharmony_ci bool refault = false; 7808c2ecf20Sopenharmony_ci u64 size = 0; 7818c2ecf20Sopenharmony_ci 7828c2ecf20Sopenharmony_ci (void)wait_event_freezable(pgdat->zswapd_wait, 7838c2ecf20Sopenharmony_ci atomic_read(&pgdat->zswapd_wait_flag)); 7848c2ecf20Sopenharmony_ci atomic_set(&pgdat->zswapd_wait_flag, 0); 7858c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_WAKEUP); 7868c2ecf20Sopenharmony_ci zswapd_pressure_report(LEVEL_LOW); 7878c2ecf20Sopenharmony_ci 7888c2ecf20Sopenharmony_ci if (get_area_anon_refault_status()) { 7898c2ecf20Sopenharmony_ci refault = true; 7908c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_REFAULT); 7918c2ecf20Sopenharmony_ci goto do_eswap; 7928c2ecf20Sopenharmony_ci } 7938c2ecf20Sopenharmony_ci 7948c2ecf20Sopenharmony_ci#ifdef CONFIG_RECLAIM_ACCT 7958c2ecf20Sopenharmony_ci reclaimacct_start(ZSWAPD_RECLAIM, &ra); 7968c2ecf20Sopenharmony_ci#endif 7978c2ecf20Sopenharmony_ci zswapd_shrink_node(pgdat); 7988c2ecf20Sopenharmony_ci#ifdef CONFIG_RECLAIM_ACCT 7998c2ecf20Sopenharmony_ci reclaimacct_end(ZSWAPD_RECLAIM); 8008c2ecf20Sopenharmony_ci#endif 8018c2ecf20Sopenharmony_ci last_zswapd_time = jiffies; 8028c2ecf20Sopenharmony_ci 8038c2ecf20Sopenharmony_cido_eswap: 8048c2ecf20Sopenharmony_ci size = get_do_eswap_size(refault); 8058c2ecf20Sopenharmony_ci if (size >= SZ_1M) { 8068c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_SWAPOUT); 8078c2ecf20Sopenharmony_ci size = swapout(size); 8088c2ecf20Sopenharmony_ci } 8098c2ecf20Sopenharmony_ci 8108c2ecf20Sopenharmony_ci if (!buffer_is_suitable()) { 8118c2ecf20Sopenharmony_ci if (free_swap_is_low() || zram_watermark_exceed()) { 8128c2ecf20Sopenharmony_ci zswapd_pressure_report(LEVEL_CRITICAL); 8138c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_CRITICAL_PRESS); 8148c2ecf20Sopenharmony_ci pr_info("%s:zrampages:%llu, eswappages:%llu\n", __func__, 8158c2ecf20Sopenharmony_ci get_zram_used_pages(), get_eswap_used_pages()); 8168c2ecf20Sopenharmony_ci } else { 8178c2ecf20Sopenharmony_ci zswapd_pressure_report(LEVEL_MEDIUM); 8188c2ecf20Sopenharmony_ci count_vm_event(ZSWAPD_MEDIUM_PRESS); 8198c2ecf20Sopenharmony_ci } 8208c2ecf20Sopenharmony_ci } 8218c2ecf20Sopenharmony_ci } 8228c2ecf20Sopenharmony_ci 8238c2ecf20Sopenharmony_ci return 0; 8248c2ecf20Sopenharmony_ci} 8258c2ecf20Sopenharmony_ci 8268c2ecf20Sopenharmony_ci/* 8278c2ecf20Sopenharmony_ci * This zswapd start function will be called by init and node-hot-add. 8288c2ecf20Sopenharmony_ci */ 8298c2ecf20Sopenharmony_ciint zswapd_run(int nid) 8308c2ecf20Sopenharmony_ci{ 8318c2ecf20Sopenharmony_ci const unsigned int priority_less = 5; 8328c2ecf20Sopenharmony_ci struct sched_param param = { 8338c2ecf20Sopenharmony_ci .sched_priority = MAX_PRIO - priority_less, 8348c2ecf20Sopenharmony_ci }; 8358c2ecf20Sopenharmony_ci pg_data_t *pgdat = NODE_DATA(nid); 8368c2ecf20Sopenharmony_ci 8378c2ecf20Sopenharmony_ci if (pgdat->zswapd) 8388c2ecf20Sopenharmony_ci return 0; 8398c2ecf20Sopenharmony_ci 8408c2ecf20Sopenharmony_ci atomic_set(&pgdat->zswapd_wait_flag, 0); 8418c2ecf20Sopenharmony_ci pgdat->zswapd = kthread_create(zswapd, pgdat, "zswapd%d", nid); 8428c2ecf20Sopenharmony_ci if (IS_ERR(pgdat->zswapd)) { 8438c2ecf20Sopenharmony_ci pr_err("Failed to start zswapd on node %d\n", nid); 8448c2ecf20Sopenharmony_ci return PTR_ERR(pgdat->zswapd); 8458c2ecf20Sopenharmony_ci } 8468c2ecf20Sopenharmony_ci 8478c2ecf20Sopenharmony_ci sched_setscheduler_nocheck(pgdat->zswapd, SCHED_NORMAL, ¶m); 8488c2ecf20Sopenharmony_ci set_user_nice(pgdat->zswapd, PRIO_TO_NICE(param.sched_priority)); 8498c2ecf20Sopenharmony_ci wake_up_process(pgdat->zswapd); 8508c2ecf20Sopenharmony_ci 8518c2ecf20Sopenharmony_ci return 0; 8528c2ecf20Sopenharmony_ci} 8538c2ecf20Sopenharmony_ci 8548c2ecf20Sopenharmony_ci/* 8558c2ecf20Sopenharmony_ci * Called by memory hotplug when all memory in a node is offlined. Caller must 8568c2ecf20Sopenharmony_ci * hold mem_hotplug_begin/end(). 8578c2ecf20Sopenharmony_ci */ 8588c2ecf20Sopenharmony_civoid zswapd_stop(int nid) 8598c2ecf20Sopenharmony_ci{ 8608c2ecf20Sopenharmony_ci struct task_struct *zswapd = NODE_DATA(nid)->zswapd; 8618c2ecf20Sopenharmony_ci 8628c2ecf20Sopenharmony_ci if (zswapd) { 8638c2ecf20Sopenharmony_ci kthread_stop(zswapd); 8648c2ecf20Sopenharmony_ci NODE_DATA(nid)->zswapd = NULL; 8658c2ecf20Sopenharmony_ci } 8668c2ecf20Sopenharmony_ci 8678c2ecf20Sopenharmony_ci zswapd_pid = -1; 8688c2ecf20Sopenharmony_ci} 8698c2ecf20Sopenharmony_ci 8708c2ecf20Sopenharmony_ci/* 8718c2ecf20Sopenharmony_ci * It's optimal to keep kswapds on the same CPUs as their memory, but 8728c2ecf20Sopenharmony_ci * not required for correctness. So if the last cpu in a node goes away, 8738c2ecf20Sopenharmony_ci * we get changed to run anywhere: as the first one comes back, restore 8748c2ecf20Sopenharmony_ci * their cpu bindings. 8758c2ecf20Sopenharmony_ci */ 8768c2ecf20Sopenharmony_cistatic int zswapd_cpu_online(unsigned int cpu) 8778c2ecf20Sopenharmony_ci{ 8788c2ecf20Sopenharmony_ci int nid; 8798c2ecf20Sopenharmony_ci 8808c2ecf20Sopenharmony_ci for_each_node_state(nid, N_MEMORY) { 8818c2ecf20Sopenharmony_ci pg_data_t *pgdat = NODE_DATA(nid); 8828c2ecf20Sopenharmony_ci const struct cpumask *mask; 8838c2ecf20Sopenharmony_ci 8848c2ecf20Sopenharmony_ci mask = cpumask_of_node(pgdat->node_id); 8858c2ecf20Sopenharmony_ci if (cpumask_any_and(cpu_online_mask, mask) < nr_cpu_ids) 8868c2ecf20Sopenharmony_ci /* One of our CPUs online: restore mask */ 8878c2ecf20Sopenharmony_ci set_cpus_allowed_ptr(pgdat->zswapd, mask); 8888c2ecf20Sopenharmony_ci } 8898c2ecf20Sopenharmony_ci 8908c2ecf20Sopenharmony_ci return 0; 8918c2ecf20Sopenharmony_ci} 8928c2ecf20Sopenharmony_ci 8938c2ecf20Sopenharmony_cistatic int __init zswapd_init(void) 8948c2ecf20Sopenharmony_ci{ 8958c2ecf20Sopenharmony_ci int nid; 8968c2ecf20Sopenharmony_ci int ret; 8978c2ecf20Sopenharmony_ci 8988c2ecf20Sopenharmony_ci ret = cpuhp_setup_state_nocalls(CPUHP_AP_ONLINE_DYN, "mm/zswapd:online", 8998c2ecf20Sopenharmony_ci zswapd_cpu_online, NULL); 9008c2ecf20Sopenharmony_ci if (ret < 0) { 9018c2ecf20Sopenharmony_ci pr_err("zswapd: failed to register hotplug callbacks.\n"); 9028c2ecf20Sopenharmony_ci return ret; 9038c2ecf20Sopenharmony_ci } 9048c2ecf20Sopenharmony_ci 9058c2ecf20Sopenharmony_ci for_each_node_state(nid, N_MEMORY) 9068c2ecf20Sopenharmony_ci zswapd_run(nid); 9078c2ecf20Sopenharmony_ci 9088c2ecf20Sopenharmony_ci return 0; 9098c2ecf20Sopenharmony_ci} 9108c2ecf20Sopenharmony_cimodule_init(zswapd_init) 911