// SPDX-License-Identifier: GPL-2.0

/*
 * Handling page tables through page fragments.
 */

#include <linux/kernel.h>
#include <linux/gfp.h>
#include <linux/mm.h>
#include <linux/percpu.h>
#include <linux/hardirq.h>
#include <linux/hugetlb.h>
#include <asm/pgalloc.h>
#include <asm/tlbflush.h>
#include <asm/tlb.h>

/*
 * Drop the references still held by the cached fragment pointer when an
 * mm context is torn down.  The offset of the pointer within its page
 * encodes how many fragments were already handed out, so the references
 * for the fragments never handed out are released in one step.
 */
void pte_frag_destroy(void *pte_frag)
{
	int count;
	struct ptdesc *ptdesc;

	ptdesc = virt_to_ptdesc(pte_frag);
	/* drop all the pending references */
	count = ((unsigned long)pte_frag & ~PAGE_MASK) >> PTE_FRAG_SIZE_SHIFT;
	/* We allow PTE_FRAG_NR fragments from a PTE page */
	if (atomic_sub_and_test(PTE_FRAG_NR - count, &ptdesc->pt_frag_refcount)) {
		pagetable_pte_dtor(ptdesc);
		pagetable_free(ptdesc);
	}
}

/* Fast path: carve the next fragment out of the page cached in the mm context. */
static pte_t *get_pte_from_cache(struct mm_struct *mm)
{
	void *pte_frag, *ret;

	if (PTE_FRAG_NR == 1)
		return NULL;

	spin_lock(&mm->page_table_lock);
	ret = pte_frag_get(&mm->context);
	if (ret) {
		pte_frag = ret + PTE_FRAG_SIZE;
		/*
		 * If we have handed out all the fragments, clear the
		 * cached pointer so the next allocation gets a fresh page.
		 */
		if (((unsigned long)pte_frag & ~PAGE_MASK) == 0)
			pte_frag = NULL;
		pte_frag_set(&mm->context, pte_frag);
	}
	spin_unlock(&mm->page_table_lock);
	return (pte_t *)ret;
}

/*
 * Slow path: allocate a fresh page table page.  User page tables are
 * accounted to the mm and initialized through the PTE constructor.
 */
static pte_t *__alloc_for_ptecache(struct mm_struct *mm, int kernel)
{
	void *ret = NULL;
	struct ptdesc *ptdesc;

	if (!kernel) {
		ptdesc = pagetable_alloc(PGALLOC_GFP | __GFP_ACCOUNT, 0);
		if (!ptdesc)
			return NULL;
		if (!pagetable_pte_ctor(ptdesc)) {
			pagetable_free(ptdesc);
			return NULL;
		}
	} else {
		ptdesc = pagetable_alloc(PGALLOC_GFP, 0);
		if (!ptdesc)
			return NULL;
	}

	atomic_set(&ptdesc->pt_frag_refcount, 1);

	ret = ptdesc_address(ptdesc);
	/*
	 * If we support only one fragment per page, just return the
	 * allocated page.
	 */
	if (PTE_FRAG_NR == 1)
		return ret;
	spin_lock(&mm->page_table_lock);
	/*
	 * If no fragment page is cached yet, stash the remainder of this
	 * page for later allocations and take one reference per fragment.
	 * Otherwise a fragment page is already cached and this page is
	 * returned holding its single fragment count.
	 */
	if (likely(!pte_frag_get(&mm->context))) {
		atomic_set(&ptdesc->pt_frag_refcount, PTE_FRAG_NR);
		pte_frag_set(&mm->context, ret + PTE_FRAG_SIZE);
	}
	spin_unlock(&mm->page_table_lock);

	return (pte_t *)ret;
}

pte_t *pte_fragment_alloc(struct mm_struct *mm, int kernel)
{
	pte_t *pte;

	pte = get_pte_from_cache(mm);
	if (pte)
		return pte;

	return __alloc_for_ptecache(mm, kernel);
}

/* RCU callback: run the PTE destructor and free the page table page. */
static void pte_free_now(struct rcu_head *head)
{
	struct ptdesc *ptdesc;

	ptdesc = container_of(head, struct ptdesc, pt_rcu_head);
	pagetable_pte_dtor(ptdesc);
	pagetable_free(ptdesc);
}

/* Drop one fragment reference; the page is freed when the last one goes. */
void pte_fragment_free(unsigned long *table, int kernel)
{
	struct ptdesc *ptdesc = virt_to_ptdesc(table);

	if (pagetable_is_reserved(ptdesc))
		return free_reserved_ptdesc(ptdesc);

	BUG_ON(atomic_read(&ptdesc->pt_frag_refcount) <= 0);
	if (atomic_dec_and_test(&ptdesc->pt_frag_refcount)) {
		if (kernel)
			pagetable_free(ptdesc);
		else if (folio_test_clear_active(ptdesc_folio(ptdesc)))
			call_rcu(&ptdesc->pt_rcu_head, pte_free_now);
		else
			pte_free_now(&ptdesc->pt_rcu_head);
	}
}

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
/*
 * Defer freeing the page table page until after an RCU grace period:
 * setting PG_active here makes pte_fragment_free() route the final free
 * through call_rcu(), so lockless walkers still traversing the table
 * see valid memory until the grace period ends.
 */
void pte_free_defer(struct mm_struct *mm, pgtable_t pgtable)
{
	struct page *page;

	page = virt_to_page(pgtable);
	SetPageActive(page);
	pte_fragment_free((unsigned long *)pgtable, 0);
}
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */
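
/*
 * Illustrative sketch, not part of the original file and compiled out
 * with "#if 0" so it cannot affect a kernel build: a self-contained
 * userspace model of the fragment scheme above.  One buffer is carved
 * into FRAG_NR fragments, and a single atomic refcount (modelling
 * pt_frag_refcount) releases the backing allocation when the last
 * fragment is freed.  All names here (frag_page, frag_alloc, frag_free,
 * FRAG_NR, FRAG_SIZE) are hypothetical and exist only for this example.
 * It also simplifies: every fragment must be allocated and freed,
 * whereas the kernel's pte_frag_destroy() additionally drops the
 * references for fragments that were never handed out.
 */
#if 0
#include <stdatomic.h>
#include <stdio.h>
#include <stdlib.h>

#define FRAG_NR		16	/* stand-in for PTE_FRAG_NR */
#define FRAG_SIZE	256	/* stand-in for PTE_FRAG_SIZE */

struct frag_page {
	atomic_int refcount;			/* models pt_frag_refcount */
	int next;				/* next unused fragment index */
	unsigned char data[FRAG_NR * FRAG_SIZE];
};

/*
 * Hand out the next fragment.  Like __alloc_for_ptecache() above, the
 * page takes the full FRAG_NR reference count up front, so that each
 * later frag_free() can drop exactly one reference.
 */
static void *frag_alloc(struct frag_page *fp)
{
	if (fp->next >= FRAG_NR)
		return NULL;			/* page exhausted */
	if (fp->next == 0)
		atomic_store(&fp->refcount, FRAG_NR);
	return fp->data + FRAG_SIZE * fp->next++;
}

/* Drop one fragment reference; free the page when the last one goes. */
static void frag_free(struct frag_page *fp, void *frag)
{
	(void)frag;
	if (atomic_fetch_sub(&fp->refcount, 1) == 1) {
		printf("last fragment freed, releasing page\n");
		free(fp);
	}
}

int main(void)
{
	struct frag_page *fp = calloc(1, sizeof(*fp));
	void *frags[FRAG_NR];
	int i;

	if (!fp)
		return 1;
	for (i = 0; i < FRAG_NR; i++)
		frags[i] = frag_alloc(fp);
	for (i = 0; i < FRAG_NR; i++)
		frag_free(fp, frags[i]);
	return 0;
}
#endif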