18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only
28c2ecf20Sopenharmony_ci/*
38c2ecf20Sopenharmony_ci * mm/balloon_compaction.c
48c2ecf20Sopenharmony_ci *
58c2ecf20Sopenharmony_ci * Common interface for making balloon pages movable by compaction.
68c2ecf20Sopenharmony_ci *
78c2ecf20Sopenharmony_ci * Copyright (C) 2012, Red Hat, Inc.  Rafael Aquini <aquini@redhat.com>
88c2ecf20Sopenharmony_ci */
98c2ecf20Sopenharmony_ci#include <linux/mm.h>
108c2ecf20Sopenharmony_ci#include <linux/slab.h>
118c2ecf20Sopenharmony_ci#include <linux/export.h>
128c2ecf20Sopenharmony_ci#include <linux/balloon_compaction.h>
138c2ecf20Sopenharmony_ci
148c2ecf20Sopenharmony_cistatic void balloon_page_enqueue_one(struct balloon_dev_info *b_dev_info,
158c2ecf20Sopenharmony_ci				     struct page *page)
168c2ecf20Sopenharmony_ci{
178c2ecf20Sopenharmony_ci	/*
188c2ecf20Sopenharmony_ci	 * Block others from accessing the 'page' when we get around to
198c2ecf20Sopenharmony_ci	 * establishing additional references. We should be the only one
208c2ecf20Sopenharmony_ci	 * holding a reference to the 'page' at this point. If we are not, then
218c2ecf20Sopenharmony_ci	 * memory corruption is possible and we should stop execution.
228c2ecf20Sopenharmony_ci	 */
238c2ecf20Sopenharmony_ci	BUG_ON(!trylock_page(page));
248c2ecf20Sopenharmony_ci	balloon_page_insert(b_dev_info, page);
258c2ecf20Sopenharmony_ci	unlock_page(page);
268c2ecf20Sopenharmony_ci	__count_vm_event(BALLOON_INFLATE);
278c2ecf20Sopenharmony_ci}
288c2ecf20Sopenharmony_ci
298c2ecf20Sopenharmony_ci/**
308c2ecf20Sopenharmony_ci * balloon_page_list_enqueue() - inserts a list of pages into the balloon page
318c2ecf20Sopenharmony_ci *				 list.
328c2ecf20Sopenharmony_ci * @b_dev_info: balloon device descriptor where we will insert a new page to
338c2ecf20Sopenharmony_ci * @pages: pages to enqueue - allocated using balloon_page_alloc.
348c2ecf20Sopenharmony_ci *
358c2ecf20Sopenharmony_ci * Driver must call this function to properly enqueue balloon pages before
368c2ecf20Sopenharmony_ci * definitively removing them from the guest system.
378c2ecf20Sopenharmony_ci *
388c2ecf20Sopenharmony_ci * Return: number of pages that were enqueued.
398c2ecf20Sopenharmony_ci */
408c2ecf20Sopenharmony_cisize_t balloon_page_list_enqueue(struct balloon_dev_info *b_dev_info,
418c2ecf20Sopenharmony_ci				 struct list_head *pages)
428c2ecf20Sopenharmony_ci{
438c2ecf20Sopenharmony_ci	struct page *page, *tmp;
448c2ecf20Sopenharmony_ci	unsigned long flags;
458c2ecf20Sopenharmony_ci	size_t n_pages = 0;
468c2ecf20Sopenharmony_ci
478c2ecf20Sopenharmony_ci	spin_lock_irqsave(&b_dev_info->pages_lock, flags);
488c2ecf20Sopenharmony_ci	list_for_each_entry_safe(page, tmp, pages, lru) {
498c2ecf20Sopenharmony_ci		list_del(&page->lru);
508c2ecf20Sopenharmony_ci		balloon_page_enqueue_one(b_dev_info, page);
518c2ecf20Sopenharmony_ci		n_pages++;
528c2ecf20Sopenharmony_ci	}
538c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&b_dev_info->pages_lock, flags);
548c2ecf20Sopenharmony_ci	return n_pages;
558c2ecf20Sopenharmony_ci}
568c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(balloon_page_list_enqueue);
578c2ecf20Sopenharmony_ci
588c2ecf20Sopenharmony_ci/**
598c2ecf20Sopenharmony_ci * balloon_page_list_dequeue() - removes pages from balloon's page list and
608c2ecf20Sopenharmony_ci *				 returns a list of the pages.
618c2ecf20Sopenharmony_ci * @b_dev_info: balloon device decriptor where we will grab a page from.
628c2ecf20Sopenharmony_ci * @pages: pointer to the list of pages that would be returned to the caller.
638c2ecf20Sopenharmony_ci * @n_req_pages: number of requested pages.
648c2ecf20Sopenharmony_ci *
658c2ecf20Sopenharmony_ci * Driver must call this function to properly de-allocate a previous enlisted
668c2ecf20Sopenharmony_ci * balloon pages before definitively releasing it back to the guest system.
678c2ecf20Sopenharmony_ci * This function tries to remove @n_req_pages from the ballooned pages and
688c2ecf20Sopenharmony_ci * return them to the caller in the @pages list.
698c2ecf20Sopenharmony_ci *
708c2ecf20Sopenharmony_ci * Note that this function may fail to dequeue some pages even if the balloon
718c2ecf20Sopenharmony_ci * isn't empty - since the page list can be temporarily empty due to compaction
728c2ecf20Sopenharmony_ci * of isolated pages.
738c2ecf20Sopenharmony_ci *
748c2ecf20Sopenharmony_ci * Return: number of pages that were added to the @pages list.
758c2ecf20Sopenharmony_ci */
768c2ecf20Sopenharmony_cisize_t balloon_page_list_dequeue(struct balloon_dev_info *b_dev_info,
778c2ecf20Sopenharmony_ci				 struct list_head *pages, size_t n_req_pages)
788c2ecf20Sopenharmony_ci{
798c2ecf20Sopenharmony_ci	struct page *page, *tmp;
808c2ecf20Sopenharmony_ci	unsigned long flags;
818c2ecf20Sopenharmony_ci	size_t n_pages = 0;
828c2ecf20Sopenharmony_ci
838c2ecf20Sopenharmony_ci	spin_lock_irqsave(&b_dev_info->pages_lock, flags);
848c2ecf20Sopenharmony_ci	list_for_each_entry_safe(page, tmp, &b_dev_info->pages, lru) {
858c2ecf20Sopenharmony_ci		if (n_pages == n_req_pages)
868c2ecf20Sopenharmony_ci			break;
878c2ecf20Sopenharmony_ci
888c2ecf20Sopenharmony_ci		/*
898c2ecf20Sopenharmony_ci		 * Block others from accessing the 'page' while we get around to
908c2ecf20Sopenharmony_ci		 * establishing additional references and preparing the 'page'
918c2ecf20Sopenharmony_ci		 * to be released by the balloon driver.
928c2ecf20Sopenharmony_ci		 */
938c2ecf20Sopenharmony_ci		if (!trylock_page(page))
948c2ecf20Sopenharmony_ci			continue;
958c2ecf20Sopenharmony_ci
968c2ecf20Sopenharmony_ci		if (IS_ENABLED(CONFIG_BALLOON_COMPACTION) &&
978c2ecf20Sopenharmony_ci		    PageIsolated(page)) {
988c2ecf20Sopenharmony_ci			/* raced with isolation */
998c2ecf20Sopenharmony_ci			unlock_page(page);
1008c2ecf20Sopenharmony_ci			continue;
1018c2ecf20Sopenharmony_ci		}
1028c2ecf20Sopenharmony_ci		balloon_page_delete(page);
1038c2ecf20Sopenharmony_ci		__count_vm_event(BALLOON_DEFLATE);
1048c2ecf20Sopenharmony_ci		list_add(&page->lru, pages);
1058c2ecf20Sopenharmony_ci		unlock_page(page);
1068c2ecf20Sopenharmony_ci		n_pages++;
1078c2ecf20Sopenharmony_ci	}
1088c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&b_dev_info->pages_lock, flags);
1098c2ecf20Sopenharmony_ci
1108c2ecf20Sopenharmony_ci	return n_pages;
1118c2ecf20Sopenharmony_ci}
1128c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(balloon_page_list_dequeue);
1138c2ecf20Sopenharmony_ci
1148c2ecf20Sopenharmony_ci/*
1158c2ecf20Sopenharmony_ci * balloon_page_alloc - allocates a new page for insertion into the balloon
1168c2ecf20Sopenharmony_ci *			page list.
1178c2ecf20Sopenharmony_ci *
1188c2ecf20Sopenharmony_ci * Driver must call this function to properly allocate a new balloon page.
1198c2ecf20Sopenharmony_ci * Driver must call balloon_page_enqueue before definitively removing the page
1208c2ecf20Sopenharmony_ci * from the guest system.
1218c2ecf20Sopenharmony_ci *
1228c2ecf20Sopenharmony_ci * Return: struct page for the allocated page or NULL on allocation failure.
1238c2ecf20Sopenharmony_ci */
1248c2ecf20Sopenharmony_cistruct page *balloon_page_alloc(void)
1258c2ecf20Sopenharmony_ci{
1268c2ecf20Sopenharmony_ci	struct page *page = alloc_page(balloon_mapping_gfp_mask() |
1278c2ecf20Sopenharmony_ci				       __GFP_NOMEMALLOC | __GFP_NORETRY |
1288c2ecf20Sopenharmony_ci				       __GFP_NOWARN);
1298c2ecf20Sopenharmony_ci	return page;
1308c2ecf20Sopenharmony_ci}
1318c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(balloon_page_alloc);
1328c2ecf20Sopenharmony_ci
1338c2ecf20Sopenharmony_ci/*
1348c2ecf20Sopenharmony_ci * balloon_page_enqueue - inserts a new page into the balloon page list.
1358c2ecf20Sopenharmony_ci *
1368c2ecf20Sopenharmony_ci * @b_dev_info: balloon device descriptor where we will insert a new page
1378c2ecf20Sopenharmony_ci * @page: new page to enqueue - allocated using balloon_page_alloc.
1388c2ecf20Sopenharmony_ci *
1398c2ecf20Sopenharmony_ci * Drivers must call this function to properly enqueue a new allocated balloon
1408c2ecf20Sopenharmony_ci * page before definitively removing the page from the guest system.
1418c2ecf20Sopenharmony_ci *
1428c2ecf20Sopenharmony_ci * Drivers must not call balloon_page_enqueue on pages that have been pushed to
1438c2ecf20Sopenharmony_ci * a list with balloon_page_push before removing them with balloon_page_pop. To
1448c2ecf20Sopenharmony_ci * enqueue a list of pages, use balloon_page_list_enqueue instead.
1458c2ecf20Sopenharmony_ci */
1468c2ecf20Sopenharmony_civoid balloon_page_enqueue(struct balloon_dev_info *b_dev_info,
1478c2ecf20Sopenharmony_ci			  struct page *page)
1488c2ecf20Sopenharmony_ci{
1498c2ecf20Sopenharmony_ci	unsigned long flags;
1508c2ecf20Sopenharmony_ci
1518c2ecf20Sopenharmony_ci	spin_lock_irqsave(&b_dev_info->pages_lock, flags);
1528c2ecf20Sopenharmony_ci	balloon_page_enqueue_one(b_dev_info, page);
1538c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&b_dev_info->pages_lock, flags);
1548c2ecf20Sopenharmony_ci}
1558c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(balloon_page_enqueue);
1568c2ecf20Sopenharmony_ci
1578c2ecf20Sopenharmony_ci/*
1588c2ecf20Sopenharmony_ci * balloon_page_dequeue - removes a page from balloon's page list and returns
1598c2ecf20Sopenharmony_ci *			  its address to allow the driver to release the page.
1608c2ecf20Sopenharmony_ci * @b_dev_info: balloon device decriptor where we will grab a page from.
1618c2ecf20Sopenharmony_ci *
1628c2ecf20Sopenharmony_ci * Driver must call this function to properly dequeue a previously enqueued page
1638c2ecf20Sopenharmony_ci * before definitively releasing it back to the guest system.
1648c2ecf20Sopenharmony_ci *
1658c2ecf20Sopenharmony_ci * Caller must perform its own accounting to ensure that this
1668c2ecf20Sopenharmony_ci * function is called only if some pages are actually enqueued.
1678c2ecf20Sopenharmony_ci *
1688c2ecf20Sopenharmony_ci * Note that this function may fail to dequeue some pages even if there are
1698c2ecf20Sopenharmony_ci * some enqueued pages - since the page list can be temporarily empty due to
1708c2ecf20Sopenharmony_ci * the compaction of isolated pages.
1718c2ecf20Sopenharmony_ci *
1728c2ecf20Sopenharmony_ci * TODO: remove the caller accounting requirements, and allow caller to wait
1738c2ecf20Sopenharmony_ci * until all pages can be dequeued.
1748c2ecf20Sopenharmony_ci *
1758c2ecf20Sopenharmony_ci * Return: struct page for the dequeued page, or NULL if no page was dequeued.
1768c2ecf20Sopenharmony_ci */
1778c2ecf20Sopenharmony_cistruct page *balloon_page_dequeue(struct balloon_dev_info *b_dev_info)
1788c2ecf20Sopenharmony_ci{
1798c2ecf20Sopenharmony_ci	unsigned long flags;
1808c2ecf20Sopenharmony_ci	LIST_HEAD(pages);
1818c2ecf20Sopenharmony_ci	int n_pages;
1828c2ecf20Sopenharmony_ci
1838c2ecf20Sopenharmony_ci	n_pages = balloon_page_list_dequeue(b_dev_info, &pages, 1);
1848c2ecf20Sopenharmony_ci
1858c2ecf20Sopenharmony_ci	if (n_pages != 1) {
1868c2ecf20Sopenharmony_ci		/*
1878c2ecf20Sopenharmony_ci		 * If we are unable to dequeue a balloon page because the page
1888c2ecf20Sopenharmony_ci		 * list is empty and there are no isolated pages, then something
1898c2ecf20Sopenharmony_ci		 * went out of track and some balloon pages are lost.
1908c2ecf20Sopenharmony_ci		 * BUG() here, otherwise the balloon driver may get stuck in
1918c2ecf20Sopenharmony_ci		 * an infinite loop while attempting to release all its pages.
1928c2ecf20Sopenharmony_ci		 */
1938c2ecf20Sopenharmony_ci		spin_lock_irqsave(&b_dev_info->pages_lock, flags);
1948c2ecf20Sopenharmony_ci		if (unlikely(list_empty(&b_dev_info->pages) &&
1958c2ecf20Sopenharmony_ci			     !b_dev_info->isolated_pages))
1968c2ecf20Sopenharmony_ci			BUG();
1978c2ecf20Sopenharmony_ci		spin_unlock_irqrestore(&b_dev_info->pages_lock, flags);
1988c2ecf20Sopenharmony_ci		return NULL;
1998c2ecf20Sopenharmony_ci	}
2008c2ecf20Sopenharmony_ci	return list_first_entry(&pages, struct page, lru);
2018c2ecf20Sopenharmony_ci}
2028c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(balloon_page_dequeue);
2038c2ecf20Sopenharmony_ci
2048c2ecf20Sopenharmony_ci#ifdef CONFIG_BALLOON_COMPACTION
2058c2ecf20Sopenharmony_ci
2068c2ecf20Sopenharmony_cibool balloon_page_isolate(struct page *page, isolate_mode_t mode)
2078c2ecf20Sopenharmony_ci
2088c2ecf20Sopenharmony_ci{
2098c2ecf20Sopenharmony_ci	struct balloon_dev_info *b_dev_info = balloon_page_device(page);
2108c2ecf20Sopenharmony_ci	unsigned long flags;
2118c2ecf20Sopenharmony_ci
2128c2ecf20Sopenharmony_ci	spin_lock_irqsave(&b_dev_info->pages_lock, flags);
2138c2ecf20Sopenharmony_ci	list_del(&page->lru);
2148c2ecf20Sopenharmony_ci	b_dev_info->isolated_pages++;
2158c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&b_dev_info->pages_lock, flags);
2168c2ecf20Sopenharmony_ci
2178c2ecf20Sopenharmony_ci	return true;
2188c2ecf20Sopenharmony_ci}
2198c2ecf20Sopenharmony_ci
2208c2ecf20Sopenharmony_civoid balloon_page_putback(struct page *page)
2218c2ecf20Sopenharmony_ci{
2228c2ecf20Sopenharmony_ci	struct balloon_dev_info *b_dev_info = balloon_page_device(page);
2238c2ecf20Sopenharmony_ci	unsigned long flags;
2248c2ecf20Sopenharmony_ci
2258c2ecf20Sopenharmony_ci	spin_lock_irqsave(&b_dev_info->pages_lock, flags);
2268c2ecf20Sopenharmony_ci	list_add(&page->lru, &b_dev_info->pages);
2278c2ecf20Sopenharmony_ci	b_dev_info->isolated_pages--;
2288c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&b_dev_info->pages_lock, flags);
2298c2ecf20Sopenharmony_ci}
2308c2ecf20Sopenharmony_ci
2318c2ecf20Sopenharmony_ci
2328c2ecf20Sopenharmony_ci/* move_to_new_page() counterpart for a ballooned page */
2338c2ecf20Sopenharmony_ciint balloon_page_migrate(struct address_space *mapping,
2348c2ecf20Sopenharmony_ci		struct page *newpage, struct page *page,
2358c2ecf20Sopenharmony_ci		enum migrate_mode mode)
2368c2ecf20Sopenharmony_ci{
2378c2ecf20Sopenharmony_ci	struct balloon_dev_info *balloon = balloon_page_device(page);
2388c2ecf20Sopenharmony_ci
2398c2ecf20Sopenharmony_ci	/*
2408c2ecf20Sopenharmony_ci	 * We can not easily support the no copy case here so ignore it as it
2418c2ecf20Sopenharmony_ci	 * is unlikely to be used with balloon pages. See include/linux/hmm.h
2428c2ecf20Sopenharmony_ci	 * for a user of the MIGRATE_SYNC_NO_COPY mode.
2438c2ecf20Sopenharmony_ci	 */
2448c2ecf20Sopenharmony_ci	if (mode == MIGRATE_SYNC_NO_COPY)
2458c2ecf20Sopenharmony_ci		return -EINVAL;
2468c2ecf20Sopenharmony_ci
2478c2ecf20Sopenharmony_ci	VM_BUG_ON_PAGE(!PageLocked(page), page);
2488c2ecf20Sopenharmony_ci	VM_BUG_ON_PAGE(!PageLocked(newpage), newpage);
2498c2ecf20Sopenharmony_ci
2508c2ecf20Sopenharmony_ci	return balloon->migratepage(balloon, newpage, page, mode);
2518c2ecf20Sopenharmony_ci}
2528c2ecf20Sopenharmony_ci
2538c2ecf20Sopenharmony_ciconst struct address_space_operations balloon_aops = {
2548c2ecf20Sopenharmony_ci	.migratepage = balloon_page_migrate,
2558c2ecf20Sopenharmony_ci	.isolate_page = balloon_page_isolate,
2568c2ecf20Sopenharmony_ci	.putback_page = balloon_page_putback,
2578c2ecf20Sopenharmony_ci};
2588c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(balloon_aops);
2598c2ecf20Sopenharmony_ci
2608c2ecf20Sopenharmony_ci#endif /* CONFIG_BALLOON_COMPACTION */
261