WSL2-Linux-Kernel/arch/riscv/mm/fault.c

// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Copyright (C) 2009 Sunplus Core Technology Co., Ltd.
 *  Lennox Wu <lennox.wu@sunplusct.com>
 *  Chen Liqin <liqin.chen@sunplusct.com>
 * Copyright (C) 2012 Regents of the University of California
 */


#include <linux/mm.h>
#include <linux/kernel.h>
#include <linux/interrupt.h>
#include <linux/perf_event.h>
#include <linux/signal.h>
#include <linux/uaccess.h>

#include <asm/pgalloc.h>
#include <asm/ptrace.h>
#include <asm/tlbflush.h>

#include "../kernel/head.h"

/*
 * do_page_fault() - entry point for page-fault exceptions.
 * @regs: trap-time register state. regs->cause holds the exception cause,
 *        regs->badaddr the faulting virtual address and regs->status the
 *        status register as saved at trap time.
 *
 * The fault is dispatched on the faulting address and the current context:
 *
 *  - An address inside [VMALLOC_START, VMALLOC_END] is handled without taking
 *    any lock, by copying the relevant entries from init_mm's page table into
 *    the page table referenced by CSR_SATP (see vmalloc_fault below).
 *  - A fault taken while the fault handler is disabled, or without an mm,
 *    goes straight to the exception-fixup / oops path (no_context).
 *  - Anything else is looked up in the mm's VMAs under mmap_sem, checked
 *    against the VMA permissions and handed to handle_mm_fault(), with at
 *    most one retry.
 *
 * User-mode failures are reported through do_trap() (SIGSEGV or SIGBUS).
 * Kernel-mode failures go through fixup_exception() and, if no fixup
 * applies, end in die()/do_exit().
 */
asmlinkage void do_page_fault(struct pt_regs *regs)
{
	struct task_struct *tsk;
	struct vm_area_struct *vma;
	struct mm_struct *mm;
	unsigned long addr, cause;
	unsigned int flags = FAULT_FLAG_ALLOW_RETRY | FAULT_FLAG_KILLABLE;
	int code = SEGV_MAPERR;
	vm_fault_t fault;

	cause = regs->cause;
	addr = regs->badaddr;

	tsk = current;
	mm = tsk->mm;

	/*
	 * Fault-in kernel-space virtual memory on-demand.
	 * The 'reference' page table is init_mm.pgd.
	 *
	 * NOTE! We MUST NOT take any locks for this case. We may
	 * be in an interrupt or a critical region, and should
	 * only copy the information from the master page table,
	 * nothing more.
	 */
	if (unlikely((addr >= VMALLOC_START) && (addr <= VMALLOC_END)))
		goto vmalloc_fault;

	/* Enable interrupts if they were enabled in the parent context. */
	if (likely(regs->status & SR_PIE))
		local_irq_enable();

	/*
	 * If we're in an interrupt, have no user context, or are running
	 * in an atomic region, then we must not take the fault.
	 */
	if (unlikely(faulthandler_disabled() || !mm))
		goto no_context;

	if (user_mode(regs))
		flags |= FAULT_FLAG_USER;

	perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS, 1, regs, addr);

retry:
	down_read(&mm->mmap_sem);
	vma = find_vma(mm, addr);
	if (unlikely(!vma))
		goto bad_area;
	if (likely(vma->vm_start <= addr))
		goto good_area;
	/*
	 * The address lies below the VMA that find_vma() returned: it is only
	 * acceptable if that VMA may grow downwards and can be expanded to
	 * cover the address.
	 */
	if (unlikely(!(vma->vm_flags & VM_GROWSDOWN)))
		goto bad_area;
	if (unlikely(expand_stack(vma, addr)))
		goto bad_area;

	/*
	 * Ok, we have a good vm_area for this memory access, so
	 * we can handle it.
	 */
good_area:
	/* From here on a failure is a permission problem, not a missing map. */
	code = SEGV_ACCERR;

	/* Check the access type against the permissions of the VMA. */
	switch (cause) {
	case EXC_INST_PAGE_FAULT:
		if (!(vma->vm_flags & VM_EXEC))
			goto bad_area;
		break;
	case EXC_LOAD_PAGE_FAULT:
		if (!(vma->vm_flags & VM_READ))
			goto bad_area;
		break;
	case EXC_STORE_PAGE_FAULT:
		if (!(vma->vm_flags & VM_WRITE))
			goto bad_area;
		flags |= FAULT_FLAG_WRITE;
		break;
	default:
		panic("%s: unhandled cause %lu", __func__, cause);
	}

	/*
	 * If for any reason at all we could not handle the fault,
	 * make sure we exit gracefully rather than endlessly redo
	 * the fault.
	 */
	fault = handle_mm_fault(vma, addr, flags);

	/*
	 * If we need to retry but a fatal signal is pending, handle the
	 * signal first. We do not need to release the mmap_sem because it
	 * would already be released in __lock_page_or_retry in mm/filemap.c.
	 *
	 * For a kernel-mode fault we must not simply return: nothing was
	 * done to the page tables, so returning to the faulting instruction
	 * would take the very same fault again without making progress.
	 * Treat it as a failed access and let the exception fixup (or the
	 * oops path) deal with it. no_context does not touch mmap_sem, which
	 * matches the lock having been dropped already.
	 */
	if (fault_signal_pending(fault, regs)) {
		if (!user_mode(regs))
			goto no_context;
		return;
	}

	if (unlikely(fault & VM_FAULT_ERROR)) {
		if (fault & VM_FAULT_OOM)
			goto out_of_memory;
		else if (fault & VM_FAULT_SIGBUS)
			goto do_sigbus;
		/*
		 * NOTE(review): any other VM_FAULT_ERROR bit ends up here and
		 * triggers BUG() -- confirm no such bit can legitimately be
		 * returned by handle_mm_fault() on this architecture.
		 */
		BUG();
	}

	/*
	 * Major/minor page fault accounting is only done on the
	 * initial attempt. If we go through a retry, it is extremely
	 * likely that the page will be found in page cache at that point.
	 */
	if (flags & FAULT_FLAG_ALLOW_RETRY) {
		if (fault & VM_FAULT_MAJOR) {
			tsk->maj_flt++;
			perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS_MAJ,
				      1, regs, addr);
		} else {
			tsk->min_flt++;
			perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS_MIN,
				      1, regs, addr);
		}
		if (fault & VM_FAULT_RETRY) {
			/*
			 * Clear FAULT_FLAG_ALLOW_RETRY to avoid any risk
			 * of starvation.
			 */
			flags &= ~(FAULT_FLAG_ALLOW_RETRY);
			flags |= FAULT_FLAG_TRIED;

			/*
			 * No need to up_read(&mm->mmap_sem) as we would
			 * have already released it in __lock_page_or_retry
			 * in mm/filemap.c.
			 */
			goto retry;
		}
	}

	up_read(&mm->mmap_sem);
	return;

	/*
	 * Something tried to access memory that isn't in our memory map.
	 * Fix it, but check if it's kernel or user first.
	 */
bad_area:
	up_read(&mm->mmap_sem);
	/* User mode accesses just cause a SIGSEGV */
	if (user_mode(regs)) {
		do_trap(regs, SIGSEGV, code, addr);
		return;
	}
	/* Kernel-mode access: fall through to the fixup / oops path. */

no_context:
	/* Are we prepared to handle this kernel fault? */
	if (fixup_exception(regs))
		return;

	/*
	 * Oops. The kernel tried to access some bad page. We'll have to
	 * terminate things with extreme prejudice.
	 */
	bust_spinlocks(1);
	pr_alert("Unable to handle kernel %s at virtual address " REG_FMT "\n",
		(addr < PAGE_SIZE) ? "NULL pointer dereference" :
		"paging request", addr);
	die(regs, "Oops");
	do_exit(SIGKILL);

	/*
	 * We ran out of memory, call the OOM killer, and return the userspace
	 * (which will retry the fault, or kill us if we got oom-killed).
	 */
out_of_memory:
	up_read(&mm->mmap_sem);
	if (!user_mode(regs))
		goto no_context;
	pagefault_out_of_memory();
	return;

do_sigbus:
	up_read(&mm->mmap_sem);
	/* Kernel mode? Handle exceptions or die */
	if (!user_mode(regs))
		goto no_context;
	do_trap(regs, SIGBUS, BUS_ADRERR, addr);
	return;

vmalloc_fault:
	{
		/*
		 * Unsuffixed pointers walk the page table referenced by
		 * CSR_SATP; the *_k pointers walk the reference table
		 * rooted at init_mm.pgd.
		 */
		pgd_t *pgd, *pgd_k;
		pud_t *pud, *pud_k;
		p4d_t *p4d, *p4d_k;
		pmd_t *pmd, *pmd_k;
		pte_t *pte_k;
		int index;

		/*
		 * User mode accesses just cause a SIGSEGV. mmap_sem is not
		 * held on this path, so bad_area (which unlocks it) must not
		 * be used here.
		 */
		if (user_mode(regs)) {
			do_trap(regs, SIGSEGV, code, addr);
			return;
		}

		/*
		 * Synchronize this task's top level page-table
		 * with the 'reference' page table.
		 *
		 * Do _not_ use "tsk->active_mm->pgd" here.
		 * We might be inside an interrupt in the middle
		 * of a task switch.
		 *
		 * NOTE(review): the raw CSR_SATP value is handed to
		 * pfn_to_virt() without masking off any non-PPN fields --
		 * confirm those bits are guaranteed to be zero or discarded
		 * by the conversion.
		 */
		index = pgd_index(addr);
		pgd = (pgd_t *)pfn_to_virt(csr_read(CSR_SATP)) + index;
		pgd_k = init_mm.pgd + index;

		if (!pgd_present(*pgd_k))
			goto no_context;
		set_pgd(pgd, *pgd_k);

		p4d = p4d_offset(pgd, addr);
		p4d_k = p4d_offset(pgd_k, addr);
		if (!p4d_present(*p4d_k))
			goto no_context;

		pud = pud_offset(p4d, addr);
		pud_k = pud_offset(p4d_k, addr);
		if (!pud_present(*pud_k))
			goto no_context;

		/*
		 * Since the vmalloc area is global, it is unnecessary
		 * to copy individual PTEs
		 */
		pmd = pmd_offset(pud, addr);
		pmd_k = pmd_offset(pud_k, addr);
		if (!pmd_present(*pmd_k))
			goto no_context;
		set_pmd(pmd, *pmd_k);

		/*
		 * Make sure the actual PTE exists as well to
		 * catch kernel vmalloc-area accesses to non-mapped
		 * addresses. If we don't do this, this will just
		 * silently loop forever.
		 */
		pte_k = pte_offset_kernel(pmd_k, addr);
		if (!pte_present(*pte_k))
			goto no_context;

		/*
		 * The kernel assumes that TLBs don't cache invalid
		 * entries, but in RISC-V, SFENCE.VMA specifies an
		 * ordering constraint, not a cache flush; it is
		 * necessary even after writing invalid entries.
		 */
		local_flush_tlb_page(addr);

		return;
	}
}
treewide: Replace GPLv2 boilerplate/reference with SPDX - rule 120 Based on 1 normalized pattern(s): this program is free software you can redistribute it and or modify it under the terms of the gnu general public license as published by the free software foundation either version 2 of the license or at your option any later version this program is distributed in the hope that it will be useful but without any warranty without even the implied warranty of merchantability or fitness for a particular purpose see the gnu general public license for more details you should have received a copy of the gnu general public license along with this program if not see the file copying or write to the free software foundation inc extracted by the scancode license scanner the SPDX license identifier GPL-2.0-or-later has been chosen to replace the boilerplate/reference in 12 file(s). Signed-off-by: Thomas Gleixner <tglx@linutronix.de> Reviewed-by: Richard Fontana <rfontana@redhat.com> Reviewed-by: Allison Randal <allison@lohutok.net> Cc: linux-spdx@vger.kernel.org Link: https://lkml.kernel.org/r/20190523091651.231300438@linutronix.de Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org> 2019-05-23 12:14:57 +03:00			`// SPDX-License-Identifier: GPL-2.0-or-later`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`/*`
			`* Copyright (C) 2009 Sunplus Core Technology Co., Ltd.`
			`* Lennox Wu <lennox.wu@sunplusct.com>`
			`* Chen Liqin <liqin.chen@sunplusct.com>`
			`* Copyright (C) 2012 Regents of the University of California`
			`*/`


			`#include <linux/mm.h>`
			`#include <linux/kernel.h>`
			`#include <linux/interrupt.h>`
			`#include <linux/perf_event.h>`
			`#include <linux/signal.h>`
			`#include <linux/uaccess.h>`

			`#include <asm/pgalloc.h>`
			`#include <asm/ptrace.h>`
riscv: mm: synchronize MMU after pte change Because RISC-V compliant implementations can cache invalid entries in TLB, an SFENCE.VMA is necessary after changes to the page table. This patch adds an SFENCE.vma for the vmalloc_fault path. Signed-off-by: ShihPo Hung <shihpo.hung@sifive.com> [paul.walmsley@sifive.com: reversed tab->whitespace conversion, wrapped comment lines] Signed-off-by: Paul Walmsley <paul.walmsley@sifive.com> Cc: Palmer Dabbelt <palmer@sifive.com> Cc: Albert Ou <aou@eecs.berkeley.edu> Cc: Paul Walmsley <paul.walmsley@sifive.com> Cc: linux-riscv@lists.infradead.org Cc: stable@vger.kernel.org 2019-06-17 07:26:17 +03:00			`#include <asm/tlbflush.h>`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00
riscv: add prototypes for assembly language functions from head.S Add prototypes for assembly language functions defined in head.S, and include these prototypes into C source files that call those functions. This patch resolves the following warnings from sparse: arch/riscv/kernel/setup.c:39:10: warning: symbol 'hart_lottery' was not declared. Should it be static? arch/riscv/kernel/setup.c:42:13: warning: symbol 'parse_dtb' was not declared. Should it be static? arch/riscv/kernel/smpboot.c:33:6: warning: symbol '__cpu_up_stack_pointer' was not declared. Should it be static? arch/riscv/kernel/smpboot.c:34:6: warning: symbol '__cpu_up_task_pointer' was not declared. Should it be static? arch/riscv/mm/fault.c:25:17: warning: symbol 'do_page_fault' was not declared. Should it be static? This change should have no functional impact. Signed-off-by: Paul Walmsley <paul.walmsley@sifive.com> 2019-10-18 01:00:17 +03:00			`#include "../kernel/head.h"`

RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`/*`
			`* This routine handles page faults. It determines the address and the`
			`* problem, and then passes it off to one of the appropriate routines.`
			`*/`
			`asmlinkage void do_page_fault(struct pt_regs *regs)`
			`{`
			`struct task_struct *tsk;`
			`struct vm_area_struct *vma;`
			`struct mm_struct *mm;`
			`unsigned long addr, cause;`
			`unsigned int flags = FAULT_FLAG_ALLOW_RETRY | FAULT_FLAG_KILLABLE;`
mm: convert return type of handle_mm_fault() caller to vm_fault_t Use new return type vm_fault_t for fault handler. For now, this is just documenting that the function returns a VM_FAULT value rather than an errno. Once all instances are converted, vm_fault_t will become a distinct type. Ref-> commit 1c8f422059ae ("mm: change return type to vm_fault_t") In this patch all the caller of handle_mm_fault() are changed to return vm_fault_t type. Link: http://lkml.kernel.org/r/20180617084810.GA6730@jordon-HP-15-Notebook-PC Signed-off-by: Souptick Joarder <jrdr.linux@gmail.com> Cc: Matthew Wilcox <willy@infradead.org> Cc: Richard Henderson <rth@twiddle.net> Cc: Tony Luck <tony.luck@intel.com> Cc: Matt Turner <mattst88@gmail.com> Cc: Vineet Gupta <vgupta@synopsys.com> Cc: Russell King <linux@armlinux.org.uk> Cc: Catalin Marinas <catalin.marinas@arm.com> Cc: Will Deacon <will.deacon@arm.com> Cc: Richard Kuo <rkuo@codeaurora.org> Cc: Geert Uytterhoeven <geert@linux-m68k.org> Cc: Michal Simek <monstr@monstr.eu> Cc: James Hogan <jhogan@kernel.org> Cc: Ley Foon Tan <lftan@altera.com> Cc: Jonas Bonn <jonas@southpole.se> Cc: James E.J. Bottomley <jejb@parisc-linux.org> Cc: Benjamin Herrenschmidt <benh@kernel.crashing.org> Cc: Palmer Dabbelt <palmer@sifive.com> Cc: Yoshinori Sato <ysato@users.sourceforge.jp> Cc: David S. Miller <davem@davemloft.net> Cc: Richard Weinberger <richard@nod.at> Cc: Guan Xuetao <gxt@pku.edu.cn> Cc: Thomas Gleixner <tglx@linutronix.de> Cc: "H. Peter Anvin" <hpa@zytor.com> Cc: "Levin, Alexander (Sasha Levin)" <alexander.levin@verizon.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2018-08-18 01:44:47 +03:00			`int code = SEGV_MAPERR;`
			`vm_fault_t fault;`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00
riscv: abstract out CSR names for supervisor vs machine mode Many of the privileged CSRs exist in a supervisor and machine version that are used very similarly. Provide versions of the CSR names and fields that map to either the S-mode or M-mode variant depending on a new CONFIG_RISCV_M_MODE kconfig symbol. Contains contributions from Damien Le Moal <Damien.LeMoal@wdc.com> and Paul Walmsley <paul.walmsley@sifive.com>. Signed-off-by: Christoph Hellwig <hch@lst.de> Acked-by: Thomas Gleixner <tglx@linutronix.de> # for drivers/clocksource, drivers/irqchip [paul.walmsley@sifive.com: updated to apply] Signed-off-by: Paul Walmsley <paul.walmsley@sifive.com> 2019-10-28 15:10:32 +03:00			`cause = regs->cause;`
			`addr = regs->badaddr;`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00
			`tsk = current;`
			`mm = tsk->mm;`

			`/*`
			`* Fault-in kernel-space virtual memory on-demand.`
			`* The 'reference' page table is init_mm.pgd.`
			`*`
			`* NOTE! We MUST NOT take any locks for this case. We may`
			`* be in an interrupt or a critical region, and should`
			`* only copy the information from the master page table,`
			`* nothing more.`
			`*/`
			`if (unlikely((addr >= VMALLOC_START) && (addr <= VMALLOC_END)))`
			`goto vmalloc_fault;`

			`/* Enable interrupts if they were enabled in the parent context. */`
riscv: abstract out CSR names for supervisor vs machine mode Many of the privileged CSRs exist in a supervisor and machine version that are used very similarly. Provide versions of the CSR names and fields that map to either the S-mode or M-mode variant depending on a new CONFIG_RISCV_M_MODE kconfig symbol. Contains contributions from Damien Le Moal <Damien.LeMoal@wdc.com> and Paul Walmsley <paul.walmsley@sifive.com>. Signed-off-by: Christoph Hellwig <hch@lst.de> Acked-by: Thomas Gleixner <tglx@linutronix.de> # for drivers/clocksource, drivers/irqchip [paul.walmsley@sifive.com: updated to apply] Signed-off-by: Paul Walmsley <paul.walmsley@sifive.com> 2019-10-28 15:10:32 +03:00			`if (likely(regs->status & SR_PIE))`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`local_irq_enable();`

			`/*`
			`* If we're in an interrupt, have no user context, or are running`
			`* in an atomic region, then we must not take the fault.`
			`*/`
			`if (unlikely(faulthandler_disabled() || !mm))`
			`goto no_context;`

			`if (user_mode(regs))`
			`flags |= FAULT_FLAG_USER;`

			`perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS, 1, regs, addr);`

			`retry:`
			`down_read(&mm->mmap_sem);`
			`vma = find_vma(mm, addr);`
			`if (unlikely(!vma))`
			`goto bad_area;`
			`if (likely(vma->vm_start <= addr))`
			`goto good_area;`
			`if (unlikely(!(vma->vm_flags & VM_GROWSDOWN)))`
			`goto bad_area;`
			`if (unlikely(expand_stack(vma, addr)))`
			`goto bad_area;`

			`/*`
			`* Ok, we have a good vm_area for this memory access, so`
			`* we can handle it.`
			`*/`
			`good_area:`
			`code = SEGV_ACCERR;`

			`switch (cause) {`
			`case EXC_INST_PAGE_FAULT:`
			`if (!(vma->vm_flags & VM_EXEC))`
			`goto bad_area;`
			`break;`
			`case EXC_LOAD_PAGE_FAULT:`
			`if (!(vma->vm_flags & VM_READ))`
			`goto bad_area;`
			`break;`
			`case EXC_STORE_PAGE_FAULT:`
			`if (!(vma->vm_flags & VM_WRITE))`
			`goto bad_area;`
			`flags |= FAULT_FLAG_WRITE;`
			`break;`
			`default:`
			`panic("%s: unhandled cause %lu", __func__, cause);`
			`}`

			`/*`
			`* If for any reason at all we could not handle the fault,`
			`* make sure we exit gracefully rather than endlessly redo`
			`* the fault.`
			`*/`
			`fault = handle_mm_fault(vma, addr, flags);`

			`/*`
			`* If we need to retry but a fatal signal is pending, handle the`
			`* signal first. We do not need to release the mmap_sem because it`
			`* would already be released in __lock_page_or_retry in mm/filemap.c.`
			`*/`
mm: introduce fault_signal_pending() For most architectures, we've got a quick path to detect fatal signal after a handle_mm_fault(). Introduce a helper for that quick path. It cleans the current codes a bit so we don't need to duplicate the same check across archs. More importantly, this will be an unified place that we handle the signal immediately right after an interrupted page fault, so it'll be much easier for us if we want to change the behavior of handling signals later on for all the archs. Note that currently only part of the archs are using this new helper, because some archs have their own way to handle signals. In the follow up patches, we'll try to apply this helper to all the rest of archs. Another note is that the "regs" parameter in the new helper is not used yet. It'll be used very soon. Now we kept it in this patch only to avoid touching all the archs again in the follow up patches. [peterx@redhat.com: fix sparse warnings] Link: http://lkml.kernel.org/r/20200311145921.GD479302@xz-x1 Signed-off-by: Peter Xu <peterx@redhat.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Tested-by: Brian Geffon <bgeffon@google.com> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Bobby Powers <bobbypowers@gmail.com> Cc: David Hildenbrand <david@redhat.com> Cc: Denis Plotnikov <dplotnikov@virtuozzo.com> Cc: "Dr . David Alan Gilbert" <dgilbert@redhat.com> Cc: Hugh Dickins <hughd@google.com> Cc: Jerome Glisse <jglisse@redhat.com> Cc: Johannes Weiner <hannes@cmpxchg.org> Cc: "Kirill A . 
Shutemov" <kirill@shutemov.name> Cc: Martin Cracauer <cracauer@cons.org> Cc: Marty McFadden <mcfadden8@llnl.gov> Cc: Matthew Wilcox <willy@infradead.org> Cc: Maya Gokhale <gokhale2@llnl.gov> Cc: Mel Gorman <mgorman@suse.de> Cc: Mike Kravetz <mike.kravetz@oracle.com> Cc: Mike Rapoport <rppt@linux.vnet.ibm.com> Cc: Pavel Emelyanov <xemul@openvz.org> Link: http://lkml.kernel.org/r/20200220155353.8676-4-peterx@redhat.com Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2020-04-02 07:08:06 +03:00			`if (fault_signal_pending(fault, regs))`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`return;`

			`if (unlikely(fault & VM_FAULT_ERROR)) {`
			`if (fault & VM_FAULT_OOM)`
			`goto out_of_memory;`
			`else if (fault & VM_FAULT_SIGBUS)`
			`goto do_sigbus;`
			`BUG();`
			`}`

			`/*`
			`* Major/minor page fault accounting is only done on the`
			`* initial attempt. If we go through a retry, it is extremely`
			`* likely that the page will be found in page cache at that point.`
			`*/`
			`if (flags & FAULT_FLAG_ALLOW_RETRY) {`
			`if (fault & VM_FAULT_MAJOR) {`
			`tsk->maj_flt++;`
			`perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS_MAJ,`
			`1, regs, addr);`
			`} else {`
			`tsk->min_flt++;`
			`perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS_MIN,`
			`1, regs, addr);`
			`}`
			`if (fault & VM_FAULT_RETRY) {`
			`/*`
			`* Clear FAULT_FLAG_ALLOW_RETRY to avoid any risk`
			`* of starvation.`
			`*/`
			`flags &= ~(FAULT_FLAG_ALLOW_RETRY);`
			`flags |= FAULT_FLAG_TRIED;`

			`/*`
			`* No need to up_read(&mm->mmap_sem) as we would`
			`* have already released it in __lock_page_or_retry`
			`* in mm/filemap.c.`
			`*/`
			`goto retry;`
			`}`
			`}`

			`up_read(&mm->mmap_sem);`
			`return;`

			`/*`
			`* Something tried to access memory that isn't in our memory map.`
			`* Fix it, but check if it's kernel or user first.`
			`*/`
			`bad_area:`
			`up_read(&mm->mmap_sem);`
			`/* User mode accesses just cause a SIGSEGV */`
			`if (user_mode(regs)) {`
signal/riscv: Remove tsk parameter from do_trap The do_trap function is always called with tsk == current. Make that obvious by removing the tsk parameter. This also makes it clear that do_trap calls force_sig_fault on the current task. Signed-off-by: "Eric W. Biederman" <ebiederm@xmission.com> 2019-02-06 04:10:48 +03:00			`do_trap(regs, SIGSEGV, code, addr);`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`return;`
			`}`

			`no_context:`
			`/* Are we prepared to handle this kernel fault? */`
			`if (fixup_exception(regs))`
			`return;`

			`/*`
			`* Oops. The kernel tried to access some bad page. We'll have to`
			`* terminate things with extreme prejudice.`
			`*/`
			`bust_spinlocks(1);`
			`pr_alert("Unable to handle kernel %s at virtual address " REG_FMT "\n",`
			`(addr < PAGE_SIZE) ? "NULL pointer dereference" :`
			`"paging request", addr);`
			`die(regs, "Oops");`
			`do_exit(SIGKILL);`

			`/*`
			`* We ran out of memory, call the OOM killer, and return the userspace`
			`* (which will retry the fault, or kill us if we got oom-killed).`
			`*/`
			`out_of_memory:`
			`up_read(&mm->mmap_sem);`
			`if (!user_mode(regs))`
			`goto no_context;`
			`pagefault_out_of_memory();`
			`return;`

			`do_sigbus:`
			`up_read(&mm->mmap_sem);`
			`/* Kernel mode? Handle exceptions or die */`
			`if (!user_mode(regs))`
			`goto no_context;`
signal/riscv: Remove tsk parameter from do_trap The do_trap function is always called with tsk == current. Make that obvious by removing the tsk parameter. This also makes it clear that do_trap calls force_sig_fault on the current task. Signed-off-by: "Eric W. Biederman" <ebiederm@xmission.com> 2019-02-06 04:10:48 +03:00			`do_trap(regs, SIGBUS, BUS_ADRERR, addr);`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`return;`

			`vmalloc_fault:`
			`{`
			`pgd_t *pgd, *pgd_k;`
			`pud_t *pud, *pud_k;`
			`p4d_t *p4d, *p4d_k;`
			`pmd_t *pmd, *pmd_k;`
			`pte_t *pte_k;`
			`int index;`

riscv: fix locking violation in page fault handler When a user mode process accesses an address in the vmalloc area do_page_fault tries to unlock the mmap semaphore when it isn't locked. Signed-off-by: Andreas Schwab <schwab@suse.de> [Palmer: Duplicated code instead of a goto] Signed-off-by: Palmer Dabbelt <palmer@sifive.com> 2019-05-07 10:36:46 +03:00			`/* User mode accesses just cause a SIGSEGV */`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`if (user_mode(regs))`
signal/riscv: Remove tsk parameter from do_trap The do_trap function is always called with tsk == current. Make that obvious by removing the tsk parameter. This also makes it clear that do_trap calls force_sig_fault on the current task. Signed-off-by: "Eric W. Biederman" <ebiederm@xmission.com> 2019-02-06 04:10:48 +03:00			`return do_trap(regs, SIGSEGV, code, addr);`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00
			`/*`
			`* Synchronize this task's top level page-table`
			`* with the 'reference' page table.`
			`*`
			`* Do _not_ use "tsk->active_mm->pgd" here.`
			`* We might be inside an interrupt in the middle`
			`* of a task switch.`
			`*/`
			`index = pgd_index(addr);`
RISC-V: Access CSRs using CSR numbers We should prefer accessing CSRs using their CSR numbers because: 1. It compiles fine with older toolchains. 2. We can use latest CSR names in #define macro names of CSR numbers as-per RISC-V spec. 3. We can access newly added CSRs even if toolchain does not recognize newly addes CSRs by name. Signed-off-by: Anup Patel <anup.patel@wdc.com> Reviewed-by: Christoph Hellwig <hch@lst.de> Signed-off-by: Palmer Dabbelt <palmer@sifive.com> 2019-04-25 11:38:41 +03:00			`pgd = (pgd_t *)pfn_to_virt(csr_read(CSR_SATP)) + index;`
RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`pgd_k = init_mm.pgd + index;`

			`if (!pgd_present(*pgd_k))`
			`goto no_context;`
			`set_pgd(pgd, *pgd_k);`

			`p4d = p4d_offset(pgd, addr);`
			`p4d_k = p4d_offset(pgd_k, addr);`
			`if (!p4d_present(*p4d_k))`
			`goto no_context;`

			`pud = pud_offset(p4d, addr);`
			`pud_k = pud_offset(p4d_k, addr);`
			`if (!pud_present(*pud_k))`
			`goto no_context;`

			`/*`
			`* Since the vmalloc area is global, it is unnecessary`
			`* to copy individual PTEs`
			`*/`
			`pmd = pmd_offset(pud, addr);`
			`pmd_k = pmd_offset(pud_k, addr);`
			`if (!pmd_present(*pmd_k))`
			`goto no_context;`
			`set_pmd(pmd, *pmd_k);`

			`/*`
			`* Make sure the actual PTE exists as well to`
			`* catch kernel vmalloc-area accesses to non-mapped`
			`* addresses. If we don't do this, this will just`
			`* silently loop forever.`
			`*/`
			`pte_k = pte_offset_kernel(pmd_k, addr);`
			`if (!pte_present(*pte_k))`
			`goto no_context;`
riscv: mm: synchronize MMU after pte change Because RISC-V compliant implementations can cache invalid entries in TLB, an SFENCE.VMA is necessary after changes to the page table. This patch adds an SFENCE.vma for the vmalloc_fault path. Signed-off-by: ShihPo Hung <shihpo.hung@sifive.com> [paul.walmsley@sifive.com: reversed tab->whitespace conversion, wrapped comment lines] Signed-off-by: Paul Walmsley <paul.walmsley@sifive.com> Cc: Palmer Dabbelt <palmer@sifive.com> Cc: Albert Ou <aou@eecs.berkeley.edu> Cc: Paul Walmsley <paul.walmsley@sifive.com> Cc: linux-riscv@lists.infradead.org Cc: stable@vger.kernel.org 2019-06-17 07:26:17 +03:00
			`/*`
			`* The kernel assumes that TLBs don't cache invalid`
			`* entries, but in RISC-V, SFENCE.VMA specifies an`
			`* ordering constraint, not a cache flush; it is`
			`* necessary even after writing invalid entries.`
			`*/`
			`local_flush_tlb_page(addr);`

RISC-V: Paging and MMU This patch contains code to manage the RISC-V MMU, including definitions of the page tables and the page walking code. Signed-off-by: Palmer Dabbelt <palmer@dabbelt.com> 2017-07-11 04:06:09 +03:00			`return;`
			`}`
			`}`