arch/arm/mm/fault-armv.c - linux - Git at Google

 // SPDX-License-Identifier: GPL-2.0-only
 /*
  *  linux/arch/arm/mm/fault-armv.c
  *
  *  Copyright (C) 1995  Linus Torvalds
  *  Modifications for ARM processor (c) 1995-2002 Russell King
  */
 #include <linux/sched.h>
 #include <linux/kernel.h>
 #include <linux/mm.h>
 #include <linux/bitops.h>
 #include <linux/vmalloc.h>
 #include <linux/init.h>
 #include <linux/pagemap.h>
 #include <linux/gfp.h>

 #include <asm/bugs.h>
 #include <asm/cacheflush.h>
 #include <asm/cachetype.h>
 #include <asm/tlbflush.h>

 #include "mm.h"

 /*
  * Memory-type bits that do_adjust_pte() installs into aliased PTEs.
  * Starts out as bufferable; check_writebuffer_bugs() switches it to
  * uncached when its write-buffer test fails or cannot be run.
  */
 static pteval_t shared_pte_mask = L_PTE_MT_BUFFERABLE;

 #if __LINUX_ARM_ARCH__ < 6
 /*
  * We take the easy way out of this problem - we make the
  * PTE uncacheable.  However, we leave the write buffer on.
  *
  * Note that the pte lock held when calling update_mmu_cache must also
  * guard the pte (somewhere else in the same mm) that we modify here.
  * Therefore those configurations which might call adjust_pte (those
  * without CONFIG_CPU_CACHE_VIPT) cannot support split page_table_lock.
  */
 static int do_adjust_pte(struct vm_area_struct *vma, unsigned long address,
 	unsigned long pfn, pte_t *ptep)
 {
 	pte_t entry = *ptep;
 	/* Non-zero when the PTE is present; this is also the return value. */
 	const int present = pte_present(entry);
 	unsigned long phys;

 	/* Not mapped here: nothing to rewrite. */
 	if (!present)
 		return present;

 	/* Memory type already matches shared_pte_mask: leave the PTE alone. */
 	if ((pte_val(entry) & L_PTE_MT_MASK) == shared_pte_mask)
 		return present;

 	/* Flush the page from the caches before changing its memory type. */
 	phys = pfn << PAGE_SHIFT;
 	flush_cache_page(vma, address, pfn);
 	outer_flush_range(phys, phys + PAGE_SIZE);

 	/* Swap the memory-type field for shared_pte_mask and install it. */
 	pte_val(entry) = (pte_val(entry) & ~L_PTE_MT_MASK) | shared_pte_mask;
 	set_pte_at(vma->vm_mm, address, ptep, entry);
 	flush_tlb_page(vma, address);

 	return present;
 }

 #if defined(CONFIG_SPLIT_PTE_PTLOCKS)
 /*
  * Lock helpers used by adjust_pte() around do_adjust_pte().
  *
  * If we are using split PTE locks, then we need to take the page
  * table lock of the aliased PTE here.  Otherwise we are using the
  * shared mm->page_table_lock, which is already locked and therefore
  * cannot be taken again; in that case both helpers are empty.
  */
 static inline void do_pte_lock(spinlock_t *ptl)
 {
 	/*
 	 * Use nested version here to indicate that we are already
 	 * holding one similar spinlock.
 	 */
 	spin_lock_nested(ptl, SINGLE_DEPTH_NESTING);
 }

 /* Release a lock taken with do_pte_lock(). */
 static inline void do_pte_unlock(spinlock_t *ptl)
 {
 	spin_unlock(ptl);
 }
 #else /* !defined(CONFIG_SPLIT_PTE_PTLOCKS) */
 /* Single page_table_lock configuration: nothing to lock or unlock. */
 static inline void do_pte_lock(spinlock_t *ptl) {}
 static inline void do_pte_unlock(spinlock_t *ptl) {}
 #endif /* defined(CONFIG_SPLIT_PTE_PTLOCKS) */

 static int adjust_pte(struct vm_area_struct *vma, unsigned long address,
 	unsigned long pfn)
 {
 	spinlock_t *ptl;
 	pgd_t *pgd;
 	p4d_t *p4d;
 	pud_t *pud;
 	pmd_t *pmd;
 	pte_t *pte;
 	int ret;

 	pgd = pgd_offset(vma->vm_mm, address);
 	if (pgd_none_or_clear_bad(pgd))
 		return 0;

 	p4d = p4d_offset(pgd, address);
 	if (p4d_none_or_clear_bad(p4d))
 		return 0;

 	pud = pud_offset(p4d, address);
 	if (pud_none_or_clear_bad(pud))
 		return 0;

 	pmd = pmd_offset(pud, address);
 	if (pmd_none_or_clear_bad(pmd))
 		return 0;

 	/*
 	 * This is called while another page table is mapped, so we
 	 * must use the nested version.  This also means we need to
 	 * open-code the spin-locking.
 	 */
 	pte = pte_offset_map_nolock(vma->vm_mm, pmd, address, &ptl);
 	if (!pte)
 		return 0;

 	do_pte_lock(ptl);

 	ret = do_adjust_pte(vma, address, pfn, pte);

 	do_pte_unlock(ptl);
 	pte_unmap(pte);

 	return ret;
 }

 static void
 make_coherent(struct address_space *mapping, struct vm_area_struct *vma,
 	unsigned long addr, pte_t *ptep, unsigned long pfn)
 {
 	struct mm_struct *mm = vma->vm_mm;
 	struct vm_area_struct *mpnt;
 	unsigned long offset;
 	pgoff_t pgoff;
 	int aliases = 0;

 	pgoff = vma->vm_pgoff + ((addr - vma->vm_start) >> PAGE_SHIFT);

 	/*
 	 * If we have any shared mappings that are in the same mm
 	 * space, then we need to handle them specially to maintain
 	 * cache coherency.
 	 */
 	flush_dcache_mmap_lock(mapping);
 	vma_interval_tree_foreach(mpnt, &mapping->i_mmap, pgoff, pgoff) {
 		/*
 		 * If this VMA is not in our MM, we can ignore it.
 		 * Note that we intentionally mask out the VMA
 		 * that we are fixing up.
 		 */
 		if (mpnt->vm_mm != mm || mpnt == vma)
 			continue;
 		if (!(mpnt->vm_flags & VM_MAYSHARE))
 			continue;
 		offset = (pgoff - mpnt->vm_pgoff) << PAGE_SHIFT;
 		aliases += adjust_pte(mpnt, mpnt->vm_start + offset, pfn);
 	}
 	flush_dcache_mmap_unlock(mapping);
 	if (aliases)
 		do_adjust_pte(vma, addr, pfn, ptep);
 }

 /*
  * Take care of architecture specific things when placing a new PTE into
  * a page table, or changing an existing PTE.  Basically, there are two
  * things that we need to take care of:
  *
  *  1. If PG_dcache_clean is not set for the page, we need to ensure
  *     that any cache entries for the kernels virtual memory
  *     range are written back to the page.
  *  2. If we have multiple shared mappings of the same space in
  *     an object, we need to deal with the cache aliasing issues.
  *
  * Note that the pte lock will be held.
  */
 void update_mmu_cache_range(struct vm_fault *vmf, struct vm_area_struct *vma,
 		unsigned long addr, pte_t *ptep, unsigned int nr)
 {
 	const unsigned long pfn = pte_pfn(*ptep);
 	struct address_space *mapping;
 	struct folio *folio;

 	/*
 	 * Skip PFNs that fail pfn_valid(), and the zero page: it is never
 	 * written to, so it never has dirty cache lines to flush.
 	 */
 	if (!pfn_valid(pfn) || is_zero_pfn(pfn))
 		return;

 	folio = page_folio(pfn_to_page(pfn));
 	mapping = folio_flush_mapping(folio);

 	/* Flush only if PG_dcache_clean was clear; the test also sets it. */
 	if (!test_and_set_bit(PG_dcache_clean, &folio->flags))
 		__flush_dcache_folio(mapping, folio);

 	/* The alias and I-cache handling below applies only with a mapping. */
 	if (!mapping)
 		return;

 	if (cache_is_vivt()) {
 		make_coherent(mapping, vma, addr, ptep, pfn);
 		return;
 	}

 	if (vma->vm_flags & VM_EXEC)
 		__flush_icache_all();
 }
 #endif	/* __LINUX_ARM_ARCH__ < 6 */

 /*
  * Check whether the write buffer has physical address aliasing
  * issues.  If it has, we need to avoid them for the case where
  * we have several shared mappings of the same object in user
  * space.
  */
 static int __init check_writebuffer(unsigned long *p1, unsigned long *p2)
 {
 	/*
 	 * Probe sequence: store 1 through p1, store 0 through p2, read p1
 	 * back.  check_writebuffer_bugs() passes two mappings of the same
 	 * page, so the read-back is expected to see the 0.
 	 */
 	register unsigned long zero = 0, one = 1, val;

 	/* Interrupts stay off for the whole store/store/load sequence. */
 	local_irq_disable();
 	mb();
 	*p1 = one;
 	mb();
 	*p2 = zero;
 	mb();
 	val = *p1;
 	mb();
 	local_irq_enable();
 	/* Non-zero result: the read through p1 did not see the 0. */
 	return val != zero;
 }

 /*
  * Boot-time write-buffer coherency test.
  *
  * Maps one freshly allocated page twice with a bufferable memory type and
  * runs check_writebuffer() on the two mappings.  If the test fails, or if
  * the page or either mapping cannot be obtained, shared_pte_mask is set
  * to L_PTE_MT_UNCACHED.  The outcome is appended to the
  * "CPU: Testing write buffer coherency: " log line.
  */
 void __init check_writebuffer_bugs(void)
 {
 	struct page *page;
 	const char *reason;
 	unsigned long v = 1;	/* stays 1 unless the test runs and passes */

 	pr_info("CPU: Testing write buffer coherency: ");

 	page = alloc_page(GFP_KERNEL);
 	if (page) {
 		unsigned long *p1, *p2;
 		pgprot_t prot = __pgprot_modify(PAGE_KERNEL,
 					L_PTE_MT_MASK, L_PTE_MT_BUFFERABLE);

 		p1 = vmap(&page, 1, VM_IOREMAP, prot);
 		p2 = vmap(&page, 1, VM_IOREMAP, prot);

 		/*
 		 * The reason strings carry no newline of their own: the
 		 * "failed, %s\n" format below already terminates the line.
 		 */
 		if (p1 && p2) {
 			v = check_writebuffer(p1, p2);
 			reason = "enabling work-around";
 		} else {
 			reason = "unable to map memory";
 		}

 		vunmap(p1);
 		vunmap(p2);
 		put_page(page);
 	} else {
 		reason = "unable to grab page";
 	}

 	if (v) {
 		pr_cont("failed, %s\n", reason);
 		shared_pte_mask = L_PTE_MT_UNCACHED;
 	} else {
 		pr_cont("ok\n");
 	}
 }
	// SPDX-License-Identifier: GPL-2.0-only
	/*
	* linux/arch/arm/mm/fault-armv.c
	*
	* Copyright (C) 1995 Linus Torvalds
	* Modifications for ARM processor (c) 1995-2002 Russell King
	*/
	#include <linux/sched.h>
	#include <linux/kernel.h>
	#include <linux/mm.h>
	#include <linux/bitops.h>
	#include <linux/vmalloc.h>
	#include <linux/init.h>
	#include <linux/pagemap.h>
	#include <linux/gfp.h>

	#include <asm/bugs.h>
	#include <asm/cacheflush.h>
	#include <asm/cachetype.h>
	#include <asm/tlbflush.h>

	#include "mm.h"

	/*
	* Memory-type bits that do_adjust_pte() installs into aliased PTEs.
	* Starts out as bufferable; check_writebuffer_bugs() switches it to
	* uncached when its write-buffer test fails or cannot be run.
	*/
	static pteval_t shared_pte_mask = L_PTE_MT_BUFFERABLE;

	#if __LINUX_ARM_ARCH__ < 6
	/*
	* We take the easy way out of this problem - we make the
	* PTE uncacheable. However, we leave the write buffer on.
	*
	* Note that the pte lock held when calling update_mmu_cache must also
	* guard the pte (somewhere else in the same mm) that we modify here.
	* Therefore those configurations which might call adjust_pte (those
	* without CONFIG_CPU_CACHE_VIPT) cannot support split page_table_lock.
	*/
	static int do_adjust_pte(struct vm_area_struct *vma, unsigned long address,
		unsigned long pfn, pte_t *ptep)
	{
		pte_t entry = *ptep;
		int ret;

		/*
		 * If this page is present, it's actually being shared.
		 * The presence test result is also the return value.
		 */
		ret = pte_present(entry);

		/*
		 * Only a present PTE whose memory type differs from
		 * shared_pte_mask needs rewriting: flush the page from the
		 * caches, replace the memory-type field, install the PTE
		 * and flush its TLB entry.
		 */
		if (ret && (pte_val(entry) & L_PTE_MT_MASK) != shared_pte_mask) {
			flush_cache_page(vma, address, pfn);
			outer_flush_range((pfn << PAGE_SHIFT),
					  (pfn << PAGE_SHIFT) + PAGE_SIZE);
			pte_val(entry) &= ~L_PTE_MT_MASK;
			pte_val(entry) |= shared_pte_mask;
			set_pte_at(vma->vm_mm, address, ptep, entry);
			flush_tlb_page(vma, address);
		}

		return ret;
	}

	#if defined(CONFIG_SPLIT_PTE_PTLOCKS)
	/*
	* Lock helpers used by adjust_pte() around do_adjust_pte().
	*
	* If we are using split PTE locks, then we need to take the page
	* table lock of the aliased PTE here. Otherwise we are using the
	* shared mm->page_table_lock, which is already locked and therefore
	* cannot be taken again; in that case both helpers are empty.
	*/
	static inline void do_pte_lock(spinlock_t *ptl)
	{
	/*
	* Use nested version here to indicate that we are already
	* holding one similar spinlock.
	*/
	spin_lock_nested(ptl, SINGLE_DEPTH_NESTING);
	}

	/* Release a lock taken with do_pte_lock(). */
	static inline void do_pte_unlock(spinlock_t *ptl)
	{
	spin_unlock(ptl);
	}
	#else /* !defined(CONFIG_SPLIT_PTE_PTLOCKS) */
	/* Single page_table_lock configuration: nothing to lock or unlock. */
	static inline void do_pte_lock(spinlock_t *ptl) {}
	static inline void do_pte_unlock(spinlock_t *ptl) {}
	#endif /* defined(CONFIG_SPLIT_PTE_PTLOCKS) */

	static int adjust_pte(struct vm_area_struct *vma, unsigned long address,
	unsigned long pfn)
	{
	spinlock_t *ptl;
	pgd_t *pgd;
	p4d_t *p4d;
	pud_t *pud;
	pmd_t *pmd;
	pte_t *pte;
	int ret;

	pgd = pgd_offset(vma->vm_mm, address);
	if (pgd_none_or_clear_bad(pgd))
	return 0;

	p4d = p4d_offset(pgd, address);
	if (p4d_none_or_clear_bad(p4d))
	return 0;

	pud = pud_offset(p4d, address);
	if (pud_none_or_clear_bad(pud))
	return 0;

	pmd = pmd_offset(pud, address);
	if (pmd_none_or_clear_bad(pmd))
	return 0;

	/*
	* This is called while another page table is mapped, so we
	* must use the nested version. This also means we need to
	* open-code the spin-locking.
	*/
	pte = pte_offset_map_nolock(vma->vm_mm, pmd, address, &ptl);
	if (!pte)
	return 0;

	do_pte_lock(ptl);

	ret = do_adjust_pte(vma, address, pfn, pte);

	do_pte_unlock(ptl);
	pte_unmap(pte);

	return ret;
	}

	static void
	make_coherent(struct address_space mapping, struct vm_area_struct vma,
	unsigned long addr, pte_t *ptep, unsigned long pfn)
	{
	struct mm_struct *mm = vma->vm_mm;
	struct vm_area_struct *mpnt;
	unsigned long offset;
	pgoff_t pgoff;
	int aliases = 0;

	pgoff = vma->vm_pgoff + ((addr - vma->vm_start) >> PAGE_SHIFT);

	/*
	* If we have any shared mappings that are in the same mm
	* space, then we need to handle them specially to maintain
	* cache coherency.
	*/
	flush_dcache_mmap_lock(mapping);
	vma_interval_tree_foreach(mpnt, &mapping->i_mmap, pgoff, pgoff) {
	/*
	* If this VMA is not in our MM, we can ignore it.
	* Note that we intentionally mask out the VMA
	* that we are fixing up.
	*/
	if (mpnt->vm_mm != mm \|\| mpnt == vma)
	continue;
	if (!(mpnt->vm_flags & VM_MAYSHARE))
	continue;
	offset = (pgoff - mpnt->vm_pgoff) << PAGE_SHIFT;
	aliases += adjust_pte(mpnt, mpnt->vm_start + offset, pfn);
	}
	flush_dcache_mmap_unlock(mapping);
	if (aliases)
	do_adjust_pte(vma, addr, pfn, ptep);
	}

	/*
	* Take care of architecture specific things when placing a new PTE into
	* a page table, or changing an existing PTE. Basically, there are two
	* things that we need to take care of:
	*
	* 1. If PG_dcache_clean is not set for the page, we need to ensure
	* that any cache entries for the kernels virtual memory
	* range are written back to the page.
	* 2. If we have multiple shared mappings of the same space in
	* an object, we need to deal with the cache aliasing issues.
	*
	* Note that the pte lock will be held.
	*/
	void update_mmu_cache_range(struct vm_fault *vmf, struct vm_area_struct *vma,
			unsigned long addr, pte_t *ptep, unsigned int nr)
	{
		unsigned long pfn = pte_pfn(*ptep);
		struct address_space *mapping;
		struct folio *folio;

		/* PFNs that fail pfn_valid() are left alone. */
		if (!pfn_valid(pfn))
			return;

		/*
		 * The zero page is never written to, so never has any dirty
		 * cache lines, and therefore never needs to be flushed.
		 */
		if (is_zero_pfn(pfn))
			return;

		folio = page_folio(pfn_to_page(pfn));
		mapping = folio_flush_mapping(folio);

		/* Flush only if PG_dcache_clean was clear; the test sets it. */
		if (!test_and_set_bit(PG_dcache_clean, &folio->flags))
			__flush_dcache_folio(mapping, folio);

		/*
		 * With a mapping: fix up aliases on VIVT caches, otherwise
		 * flush the I-cache for executable VMAs.
		 */
		if (mapping) {
			if (cache_is_vivt())
				make_coherent(mapping, vma, addr, ptep, pfn);
			else if (vma->vm_flags & VM_EXEC)
				__flush_icache_all();
		}
	}
	#endif /* __LINUX_ARM_ARCH__ < 6 */

	/*
	* Check whether the write buffer has physical address aliasing
	* issues. If it has, we need to avoid them for the case where
	* we have several shared mappings of the same object in user
	* space.
	*/
	static int __init check_writebuffer(unsigned long *p1, unsigned long *p2)
	{
		/*
		 * Probe sequence: store 1 through p1, store 0 through p2,
		 * read p1 back. check_writebuffer_bugs() passes two mappings
		 * of the same page, so the read-back is expected to see 0.
		 */
		register unsigned long zero = 0, one = 1, val;

		/* Interrupts stay off for the whole store/store/load sequence. */
		local_irq_disable();
		mb();
		*p1 = one;
		mb();
		*p2 = zero;
		mb();
		val = *p1;
		mb();
		local_irq_enable();
		/* Non-zero result: the read through p1 did not see the 0. */
		return val != zero;
	}

	/*
	 * Boot-time write-buffer coherency test.
	 *
	 * Maps one freshly allocated page twice with a bufferable memory type
	 * and runs check_writebuffer() on the two mappings. If the test fails,
	 * or if the page or either mapping cannot be obtained, shared_pte_mask
	 * is set to L_PTE_MT_UNCACHED. The outcome is appended to the
	 * "CPU: Testing write buffer coherency: " log line.
	 */
	void __init check_writebuffer_bugs(void)
	{
		struct page *page;
		const char *reason;
		unsigned long v = 1;	/* stays 1 unless the test runs and passes */

		pr_info("CPU: Testing write buffer coherency: ");

		page = alloc_page(GFP_KERNEL);
		if (page) {
			unsigned long *p1, *p2;
			pgprot_t prot = __pgprot_modify(PAGE_KERNEL,
						L_PTE_MT_MASK, L_PTE_MT_BUFFERABLE);

			p1 = vmap(&page, 1, VM_IOREMAP, prot);
			p2 = vmap(&page, 1, VM_IOREMAP, prot);

			/*
			 * The reason strings carry no newline of their own:
			 * the "failed, %s\n" format below already terminates
			 * the line.
			 */
			if (p1 && p2) {
				v = check_writebuffer(p1, p2);
				reason = "enabling work-around";
			} else {
				reason = "unable to map memory";
			}

			vunmap(p1);
			vunmap(p2);
			put_page(page);
		} else {
			reason = "unable to grab page";
		}

		if (v) {
			pr_cont("failed, %s\n", reason);
			shared_pte_mask = L_PTE_MT_UNCACHED;
		} else {
			pr_cont("ok\n");
		}
	}