18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
28c2ecf20Sopenharmony_ci
38c2ecf20Sopenharmony_ci/*
48c2ecf20Sopenharmony_ci *  Handling Page Tables through page fragments
58c2ecf20Sopenharmony_ci *
68c2ecf20Sopenharmony_ci */
78c2ecf20Sopenharmony_ci
88c2ecf20Sopenharmony_ci#include <linux/kernel.h>
98c2ecf20Sopenharmony_ci#include <linux/gfp.h>
108c2ecf20Sopenharmony_ci#include <linux/mm.h>
118c2ecf20Sopenharmony_ci#include <linux/percpu.h>
128c2ecf20Sopenharmony_ci#include <linux/hardirq.h>
138c2ecf20Sopenharmony_ci#include <linux/hugetlb.h>
148c2ecf20Sopenharmony_ci#include <asm/pgalloc.h>
158c2ecf20Sopenharmony_ci#include <asm/tlbflush.h>
168c2ecf20Sopenharmony_ci#include <asm/tlb.h>
178c2ecf20Sopenharmony_ci
188c2ecf20Sopenharmony_civoid pte_frag_destroy(void *pte_frag)
198c2ecf20Sopenharmony_ci{
208c2ecf20Sopenharmony_ci	int count;
218c2ecf20Sopenharmony_ci	struct page *page;
228c2ecf20Sopenharmony_ci
238c2ecf20Sopenharmony_ci	page = virt_to_page(pte_frag);
248c2ecf20Sopenharmony_ci	/* drop all the pending references */
258c2ecf20Sopenharmony_ci	count = ((unsigned long)pte_frag & ~PAGE_MASK) >> PTE_FRAG_SIZE_SHIFT;
268c2ecf20Sopenharmony_ci	/* We allow PTE_FRAG_NR fragments from a PTE page */
278c2ecf20Sopenharmony_ci	if (atomic_sub_and_test(PTE_FRAG_NR - count, &page->pt_frag_refcount)) {
288c2ecf20Sopenharmony_ci		pgtable_pte_page_dtor(page);
298c2ecf20Sopenharmony_ci		__free_page(page);
308c2ecf20Sopenharmony_ci	}
318c2ecf20Sopenharmony_ci}
328c2ecf20Sopenharmony_ci
338c2ecf20Sopenharmony_cistatic pte_t *get_pte_from_cache(struct mm_struct *mm)
348c2ecf20Sopenharmony_ci{
358c2ecf20Sopenharmony_ci	void *pte_frag, *ret;
368c2ecf20Sopenharmony_ci
378c2ecf20Sopenharmony_ci	if (PTE_FRAG_NR == 1)
388c2ecf20Sopenharmony_ci		return NULL;
398c2ecf20Sopenharmony_ci
408c2ecf20Sopenharmony_ci	spin_lock(&mm->page_table_lock);
418c2ecf20Sopenharmony_ci	ret = pte_frag_get(&mm->context);
428c2ecf20Sopenharmony_ci	if (ret) {
438c2ecf20Sopenharmony_ci		pte_frag = ret + PTE_FRAG_SIZE;
448c2ecf20Sopenharmony_ci		/*
458c2ecf20Sopenharmony_ci		 * If we have taken up all the fragments mark PTE page NULL
468c2ecf20Sopenharmony_ci		 */
478c2ecf20Sopenharmony_ci		if (((unsigned long)pte_frag & ~PAGE_MASK) == 0)
488c2ecf20Sopenharmony_ci			pte_frag = NULL;
498c2ecf20Sopenharmony_ci		pte_frag_set(&mm->context, pte_frag);
508c2ecf20Sopenharmony_ci	}
518c2ecf20Sopenharmony_ci	spin_unlock(&mm->page_table_lock);
528c2ecf20Sopenharmony_ci	return (pte_t *)ret;
538c2ecf20Sopenharmony_ci}
548c2ecf20Sopenharmony_ci
558c2ecf20Sopenharmony_cistatic pte_t *__alloc_for_ptecache(struct mm_struct *mm, int kernel)
568c2ecf20Sopenharmony_ci{
578c2ecf20Sopenharmony_ci	void *ret = NULL;
588c2ecf20Sopenharmony_ci	struct page *page;
598c2ecf20Sopenharmony_ci
608c2ecf20Sopenharmony_ci	if (!kernel) {
618c2ecf20Sopenharmony_ci		page = alloc_page(PGALLOC_GFP | __GFP_ACCOUNT);
628c2ecf20Sopenharmony_ci		if (!page)
638c2ecf20Sopenharmony_ci			return NULL;
648c2ecf20Sopenharmony_ci		if (!pgtable_pte_page_ctor(page)) {
658c2ecf20Sopenharmony_ci			__free_page(page);
668c2ecf20Sopenharmony_ci			return NULL;
678c2ecf20Sopenharmony_ci		}
688c2ecf20Sopenharmony_ci	} else {
698c2ecf20Sopenharmony_ci		page = alloc_page(PGALLOC_GFP);
708c2ecf20Sopenharmony_ci		if (!page)
718c2ecf20Sopenharmony_ci			return NULL;
728c2ecf20Sopenharmony_ci	}
738c2ecf20Sopenharmony_ci
748c2ecf20Sopenharmony_ci	atomic_set(&page->pt_frag_refcount, 1);
758c2ecf20Sopenharmony_ci
768c2ecf20Sopenharmony_ci	ret = page_address(page);
778c2ecf20Sopenharmony_ci	/*
788c2ecf20Sopenharmony_ci	 * if we support only one fragment just return the
798c2ecf20Sopenharmony_ci	 * allocated page.
808c2ecf20Sopenharmony_ci	 */
818c2ecf20Sopenharmony_ci	if (PTE_FRAG_NR == 1)
828c2ecf20Sopenharmony_ci		return ret;
838c2ecf20Sopenharmony_ci	spin_lock(&mm->page_table_lock);
848c2ecf20Sopenharmony_ci	/*
858c2ecf20Sopenharmony_ci	 * If we find pgtable_page set, we return
868c2ecf20Sopenharmony_ci	 * the allocated page with single fragement
878c2ecf20Sopenharmony_ci	 * count.
888c2ecf20Sopenharmony_ci	 */
898c2ecf20Sopenharmony_ci	if (likely(!pte_frag_get(&mm->context))) {
908c2ecf20Sopenharmony_ci		atomic_set(&page->pt_frag_refcount, PTE_FRAG_NR);
918c2ecf20Sopenharmony_ci		pte_frag_set(&mm->context, ret + PTE_FRAG_SIZE);
928c2ecf20Sopenharmony_ci	}
938c2ecf20Sopenharmony_ci	spin_unlock(&mm->page_table_lock);
948c2ecf20Sopenharmony_ci
958c2ecf20Sopenharmony_ci	return (pte_t *)ret;
968c2ecf20Sopenharmony_ci}
978c2ecf20Sopenharmony_ci
988c2ecf20Sopenharmony_cipte_t *pte_fragment_alloc(struct mm_struct *mm, int kernel)
998c2ecf20Sopenharmony_ci{
1008c2ecf20Sopenharmony_ci	pte_t *pte;
1018c2ecf20Sopenharmony_ci
1028c2ecf20Sopenharmony_ci	pte = get_pte_from_cache(mm);
1038c2ecf20Sopenharmony_ci	if (pte)
1048c2ecf20Sopenharmony_ci		return pte;
1058c2ecf20Sopenharmony_ci
1068c2ecf20Sopenharmony_ci	return __alloc_for_ptecache(mm, kernel);
1078c2ecf20Sopenharmony_ci}
1088c2ecf20Sopenharmony_ci
1098c2ecf20Sopenharmony_civoid pte_fragment_free(unsigned long *table, int kernel)
1108c2ecf20Sopenharmony_ci{
1118c2ecf20Sopenharmony_ci	struct page *page = virt_to_page(table);
1128c2ecf20Sopenharmony_ci
1138c2ecf20Sopenharmony_ci	if (PageReserved(page))
1148c2ecf20Sopenharmony_ci		return free_reserved_page(page);
1158c2ecf20Sopenharmony_ci
1168c2ecf20Sopenharmony_ci	BUG_ON(atomic_read(&page->pt_frag_refcount) <= 0);
1178c2ecf20Sopenharmony_ci	if (atomic_dec_and_test(&page->pt_frag_refcount)) {
1188c2ecf20Sopenharmony_ci		if (!kernel)
1198c2ecf20Sopenharmony_ci			pgtable_pte_page_dtor(page);
1208c2ecf20Sopenharmony_ci		__free_page(page);
1218c2ecf20Sopenharmony_ci	}
1228c2ecf20Sopenharmony_ci}
123