162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * S390 version 462306a36Sopenharmony_ci * Copyright IBM Corp. 1999 562306a36Sopenharmony_ci * Author(s): Hartmut Penner (hp@de.ibm.com) 662306a36Sopenharmony_ci * Ulrich Weigand (uweigand@de.ibm.com) 762306a36Sopenharmony_ci * 862306a36Sopenharmony_ci * Derived from "arch/i386/mm/fault.c" 962306a36Sopenharmony_ci * Copyright (C) 1995 Linus Torvalds 1062306a36Sopenharmony_ci */ 1162306a36Sopenharmony_ci 1262306a36Sopenharmony_ci#include <linux/kernel_stat.h> 1362306a36Sopenharmony_ci#include <linux/perf_event.h> 1462306a36Sopenharmony_ci#include <linux/signal.h> 1562306a36Sopenharmony_ci#include <linux/sched.h> 1662306a36Sopenharmony_ci#include <linux/sched/debug.h> 1762306a36Sopenharmony_ci#include <linux/kernel.h> 1862306a36Sopenharmony_ci#include <linux/errno.h> 1962306a36Sopenharmony_ci#include <linux/string.h> 2062306a36Sopenharmony_ci#include <linux/types.h> 2162306a36Sopenharmony_ci#include <linux/ptrace.h> 2262306a36Sopenharmony_ci#include <linux/mman.h> 2362306a36Sopenharmony_ci#include <linux/mm.h> 2462306a36Sopenharmony_ci#include <linux/compat.h> 2562306a36Sopenharmony_ci#include <linux/smp.h> 2662306a36Sopenharmony_ci#include <linux/kdebug.h> 2762306a36Sopenharmony_ci#include <linux/init.h> 2862306a36Sopenharmony_ci#include <linux/console.h> 2962306a36Sopenharmony_ci#include <linux/extable.h> 3062306a36Sopenharmony_ci#include <linux/hardirq.h> 3162306a36Sopenharmony_ci#include <linux/kprobes.h> 3262306a36Sopenharmony_ci#include <linux/uaccess.h> 3362306a36Sopenharmony_ci#include <linux/hugetlb.h> 3462306a36Sopenharmony_ci#include <linux/kfence.h> 3562306a36Sopenharmony_ci#include <asm/asm-extable.h> 3662306a36Sopenharmony_ci#include <asm/asm-offsets.h> 3762306a36Sopenharmony_ci#include <asm/diag.h> 3862306a36Sopenharmony_ci#include <asm/gmap.h> 3962306a36Sopenharmony_ci#include <asm/irq.h> 4062306a36Sopenharmony_ci#include <asm/mmu_context.h> 4162306a36Sopenharmony_ci#include <asm/facility.h> 4262306a36Sopenharmony_ci#include <asm/uv.h> 4362306a36Sopenharmony_ci#include "../kernel/entry.h" 4462306a36Sopenharmony_ci 4562306a36Sopenharmony_ci#define __FAIL_ADDR_MASK -4096L 4662306a36Sopenharmony_ci 4762306a36Sopenharmony_ci/* 4862306a36Sopenharmony_ci * Allocate private vm_fault_reason from top. Please make sure it won't 4962306a36Sopenharmony_ci * collide with vm_fault_reason. 5062306a36Sopenharmony_ci */ 5162306a36Sopenharmony_ci#define VM_FAULT_BADCONTEXT ((__force vm_fault_t)0x80000000) 5262306a36Sopenharmony_ci#define VM_FAULT_BADMAP ((__force vm_fault_t)0x40000000) 5362306a36Sopenharmony_ci#define VM_FAULT_BADACCESS ((__force vm_fault_t)0x20000000) 5462306a36Sopenharmony_ci#define VM_FAULT_SIGNAL ((__force vm_fault_t)0x10000000) 5562306a36Sopenharmony_ci#define VM_FAULT_PFAULT ((__force vm_fault_t)0x8000000) 5662306a36Sopenharmony_ci 5762306a36Sopenharmony_cienum fault_type { 5862306a36Sopenharmony_ci KERNEL_FAULT, 5962306a36Sopenharmony_ci USER_FAULT, 6062306a36Sopenharmony_ci GMAP_FAULT, 6162306a36Sopenharmony_ci}; 6262306a36Sopenharmony_ci 6362306a36Sopenharmony_cistatic unsigned long store_indication __read_mostly; 6462306a36Sopenharmony_ci 6562306a36Sopenharmony_cistatic int __init fault_init(void) 6662306a36Sopenharmony_ci{ 6762306a36Sopenharmony_ci if (test_facility(75)) 6862306a36Sopenharmony_ci store_indication = 0xc00; 6962306a36Sopenharmony_ci return 0; 7062306a36Sopenharmony_ci} 7162306a36Sopenharmony_ciearly_initcall(fault_init); 7262306a36Sopenharmony_ci 7362306a36Sopenharmony_ci/* 7462306a36Sopenharmony_ci * Find out which address space caused the exception. 7562306a36Sopenharmony_ci */ 7662306a36Sopenharmony_cistatic enum fault_type get_fault_type(struct pt_regs *regs) 7762306a36Sopenharmony_ci{ 7862306a36Sopenharmony_ci unsigned long trans_exc_code; 7962306a36Sopenharmony_ci 8062306a36Sopenharmony_ci trans_exc_code = regs->int_parm_long & 3; 8162306a36Sopenharmony_ci if (likely(trans_exc_code == 0)) { 8262306a36Sopenharmony_ci /* primary space exception */ 8362306a36Sopenharmony_ci if (user_mode(regs)) 8462306a36Sopenharmony_ci return USER_FAULT; 8562306a36Sopenharmony_ci if (!IS_ENABLED(CONFIG_PGSTE)) 8662306a36Sopenharmony_ci return KERNEL_FAULT; 8762306a36Sopenharmony_ci if (test_pt_regs_flag(regs, PIF_GUEST_FAULT)) 8862306a36Sopenharmony_ci return GMAP_FAULT; 8962306a36Sopenharmony_ci return KERNEL_FAULT; 9062306a36Sopenharmony_ci } 9162306a36Sopenharmony_ci if (trans_exc_code == 2) 9262306a36Sopenharmony_ci return USER_FAULT; 9362306a36Sopenharmony_ci if (trans_exc_code == 1) { 9462306a36Sopenharmony_ci /* access register mode, not used in the kernel */ 9562306a36Sopenharmony_ci return USER_FAULT; 9662306a36Sopenharmony_ci } 9762306a36Sopenharmony_ci /* home space exception -> access via kernel ASCE */ 9862306a36Sopenharmony_ci return KERNEL_FAULT; 9962306a36Sopenharmony_ci} 10062306a36Sopenharmony_ci 10162306a36Sopenharmony_cistatic unsigned long get_fault_address(struct pt_regs *regs) 10262306a36Sopenharmony_ci{ 10362306a36Sopenharmony_ci unsigned long trans_exc_code = regs->int_parm_long; 10462306a36Sopenharmony_ci 10562306a36Sopenharmony_ci return trans_exc_code & __FAIL_ADDR_MASK; 10662306a36Sopenharmony_ci} 10762306a36Sopenharmony_ci 10862306a36Sopenharmony_cistatic bool fault_is_write(struct pt_regs *regs) 10962306a36Sopenharmony_ci{ 11062306a36Sopenharmony_ci unsigned long trans_exc_code = regs->int_parm_long; 11162306a36Sopenharmony_ci 11262306a36Sopenharmony_ci return (trans_exc_code & store_indication) == 0x400; 11362306a36Sopenharmony_ci} 11462306a36Sopenharmony_ci 11562306a36Sopenharmony_cistatic int bad_address(void *p) 11662306a36Sopenharmony_ci{ 11762306a36Sopenharmony_ci unsigned long dummy; 11862306a36Sopenharmony_ci 11962306a36Sopenharmony_ci return get_kernel_nofault(dummy, (unsigned long *)p); 12062306a36Sopenharmony_ci} 12162306a36Sopenharmony_ci 12262306a36Sopenharmony_cistatic void dump_pagetable(unsigned long asce, unsigned long address) 12362306a36Sopenharmony_ci{ 12462306a36Sopenharmony_ci unsigned long *table = __va(asce & _ASCE_ORIGIN); 12562306a36Sopenharmony_ci 12662306a36Sopenharmony_ci pr_alert("AS:%016lx ", asce); 12762306a36Sopenharmony_ci switch (asce & _ASCE_TYPE_MASK) { 12862306a36Sopenharmony_ci case _ASCE_TYPE_REGION1: 12962306a36Sopenharmony_ci table += (address & _REGION1_INDEX) >> _REGION1_SHIFT; 13062306a36Sopenharmony_ci if (bad_address(table)) 13162306a36Sopenharmony_ci goto bad; 13262306a36Sopenharmony_ci pr_cont("R1:%016lx ", *table); 13362306a36Sopenharmony_ci if (*table & _REGION_ENTRY_INVALID) 13462306a36Sopenharmony_ci goto out; 13562306a36Sopenharmony_ci table = __va(*table & _REGION_ENTRY_ORIGIN); 13662306a36Sopenharmony_ci fallthrough; 13762306a36Sopenharmony_ci case _ASCE_TYPE_REGION2: 13862306a36Sopenharmony_ci table += (address & _REGION2_INDEX) >> _REGION2_SHIFT; 13962306a36Sopenharmony_ci if (bad_address(table)) 14062306a36Sopenharmony_ci goto bad; 14162306a36Sopenharmony_ci pr_cont("R2:%016lx ", *table); 14262306a36Sopenharmony_ci if (*table & _REGION_ENTRY_INVALID) 14362306a36Sopenharmony_ci goto out; 14462306a36Sopenharmony_ci table = __va(*table & _REGION_ENTRY_ORIGIN); 14562306a36Sopenharmony_ci fallthrough; 14662306a36Sopenharmony_ci case _ASCE_TYPE_REGION3: 14762306a36Sopenharmony_ci table += (address & _REGION3_INDEX) >> _REGION3_SHIFT; 14862306a36Sopenharmony_ci if (bad_address(table)) 14962306a36Sopenharmony_ci goto bad; 15062306a36Sopenharmony_ci pr_cont("R3:%016lx ", *table); 15162306a36Sopenharmony_ci if (*table & (_REGION_ENTRY_INVALID | _REGION3_ENTRY_LARGE)) 15262306a36Sopenharmony_ci goto out; 15362306a36Sopenharmony_ci table = __va(*table & _REGION_ENTRY_ORIGIN); 15462306a36Sopenharmony_ci fallthrough; 15562306a36Sopenharmony_ci case _ASCE_TYPE_SEGMENT: 15662306a36Sopenharmony_ci table += (address & _SEGMENT_INDEX) >> _SEGMENT_SHIFT; 15762306a36Sopenharmony_ci if (bad_address(table)) 15862306a36Sopenharmony_ci goto bad; 15962306a36Sopenharmony_ci pr_cont("S:%016lx ", *table); 16062306a36Sopenharmony_ci if (*table & (_SEGMENT_ENTRY_INVALID | _SEGMENT_ENTRY_LARGE)) 16162306a36Sopenharmony_ci goto out; 16262306a36Sopenharmony_ci table = __va(*table & _SEGMENT_ENTRY_ORIGIN); 16362306a36Sopenharmony_ci } 16462306a36Sopenharmony_ci table += (address & _PAGE_INDEX) >> _PAGE_SHIFT; 16562306a36Sopenharmony_ci if (bad_address(table)) 16662306a36Sopenharmony_ci goto bad; 16762306a36Sopenharmony_ci pr_cont("P:%016lx ", *table); 16862306a36Sopenharmony_ciout: 16962306a36Sopenharmony_ci pr_cont("\n"); 17062306a36Sopenharmony_ci return; 17162306a36Sopenharmony_cibad: 17262306a36Sopenharmony_ci pr_cont("BAD\n"); 17362306a36Sopenharmony_ci} 17462306a36Sopenharmony_ci 17562306a36Sopenharmony_cistatic void dump_fault_info(struct pt_regs *regs) 17662306a36Sopenharmony_ci{ 17762306a36Sopenharmony_ci unsigned long asce; 17862306a36Sopenharmony_ci 17962306a36Sopenharmony_ci pr_alert("Failing address: %016lx TEID: %016lx\n", 18062306a36Sopenharmony_ci regs->int_parm_long & __FAIL_ADDR_MASK, regs->int_parm_long); 18162306a36Sopenharmony_ci pr_alert("Fault in "); 18262306a36Sopenharmony_ci switch (regs->int_parm_long & 3) { 18362306a36Sopenharmony_ci case 3: 18462306a36Sopenharmony_ci pr_cont("home space "); 18562306a36Sopenharmony_ci break; 18662306a36Sopenharmony_ci case 2: 18762306a36Sopenharmony_ci pr_cont("secondary space "); 18862306a36Sopenharmony_ci break; 18962306a36Sopenharmony_ci case 1: 19062306a36Sopenharmony_ci pr_cont("access register "); 19162306a36Sopenharmony_ci break; 19262306a36Sopenharmony_ci case 0: 19362306a36Sopenharmony_ci pr_cont("primary space "); 19462306a36Sopenharmony_ci break; 19562306a36Sopenharmony_ci } 19662306a36Sopenharmony_ci pr_cont("mode while using "); 19762306a36Sopenharmony_ci switch (get_fault_type(regs)) { 19862306a36Sopenharmony_ci case USER_FAULT: 19962306a36Sopenharmony_ci asce = S390_lowcore.user_asce; 20062306a36Sopenharmony_ci pr_cont("user "); 20162306a36Sopenharmony_ci break; 20262306a36Sopenharmony_ci case GMAP_FAULT: 20362306a36Sopenharmony_ci asce = ((struct gmap *) S390_lowcore.gmap)->asce; 20462306a36Sopenharmony_ci pr_cont("gmap "); 20562306a36Sopenharmony_ci break; 20662306a36Sopenharmony_ci case KERNEL_FAULT: 20762306a36Sopenharmony_ci asce = S390_lowcore.kernel_asce; 20862306a36Sopenharmony_ci pr_cont("kernel "); 20962306a36Sopenharmony_ci break; 21062306a36Sopenharmony_ci default: 21162306a36Sopenharmony_ci unreachable(); 21262306a36Sopenharmony_ci } 21362306a36Sopenharmony_ci pr_cont("ASCE.\n"); 21462306a36Sopenharmony_ci dump_pagetable(asce, regs->int_parm_long & __FAIL_ADDR_MASK); 21562306a36Sopenharmony_ci} 21662306a36Sopenharmony_ci 21762306a36Sopenharmony_ciint show_unhandled_signals = 1; 21862306a36Sopenharmony_ci 21962306a36Sopenharmony_civoid report_user_fault(struct pt_regs *regs, long signr, int is_mm_fault) 22062306a36Sopenharmony_ci{ 22162306a36Sopenharmony_ci if ((task_pid_nr(current) > 1) && !show_unhandled_signals) 22262306a36Sopenharmony_ci return; 22362306a36Sopenharmony_ci if (!unhandled_signal(current, signr)) 22462306a36Sopenharmony_ci return; 22562306a36Sopenharmony_ci if (!printk_ratelimit()) 22662306a36Sopenharmony_ci return; 22762306a36Sopenharmony_ci printk(KERN_ALERT "User process fault: interruption code %04x ilc:%d ", 22862306a36Sopenharmony_ci regs->int_code & 0xffff, regs->int_code >> 17); 22962306a36Sopenharmony_ci print_vma_addr(KERN_CONT "in ", regs->psw.addr); 23062306a36Sopenharmony_ci printk(KERN_CONT "\n"); 23162306a36Sopenharmony_ci if (is_mm_fault) 23262306a36Sopenharmony_ci dump_fault_info(regs); 23362306a36Sopenharmony_ci show_regs(regs); 23462306a36Sopenharmony_ci} 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci/* 23762306a36Sopenharmony_ci * Send SIGSEGV to task. This is an external routine 23862306a36Sopenharmony_ci * to keep the stack usage of do_page_fault small. 23962306a36Sopenharmony_ci */ 24062306a36Sopenharmony_cistatic noinline void do_sigsegv(struct pt_regs *regs, int si_code) 24162306a36Sopenharmony_ci{ 24262306a36Sopenharmony_ci report_user_fault(regs, SIGSEGV, 1); 24362306a36Sopenharmony_ci force_sig_fault(SIGSEGV, si_code, 24462306a36Sopenharmony_ci (void __user *)(regs->int_parm_long & __FAIL_ADDR_MASK)); 24562306a36Sopenharmony_ci} 24662306a36Sopenharmony_ci 24762306a36Sopenharmony_cistatic noinline void do_no_context(struct pt_regs *regs, vm_fault_t fault) 24862306a36Sopenharmony_ci{ 24962306a36Sopenharmony_ci enum fault_type fault_type; 25062306a36Sopenharmony_ci unsigned long address; 25162306a36Sopenharmony_ci bool is_write; 25262306a36Sopenharmony_ci 25362306a36Sopenharmony_ci if (fixup_exception(regs)) 25462306a36Sopenharmony_ci return; 25562306a36Sopenharmony_ci fault_type = get_fault_type(regs); 25662306a36Sopenharmony_ci if ((fault_type == KERNEL_FAULT) && (fault == VM_FAULT_BADCONTEXT)) { 25762306a36Sopenharmony_ci address = get_fault_address(regs); 25862306a36Sopenharmony_ci is_write = fault_is_write(regs); 25962306a36Sopenharmony_ci if (kfence_handle_page_fault(address, is_write, regs)) 26062306a36Sopenharmony_ci return; 26162306a36Sopenharmony_ci } 26262306a36Sopenharmony_ci /* 26362306a36Sopenharmony_ci * Oops. The kernel tried to access some bad page. We'll have to 26462306a36Sopenharmony_ci * terminate things with extreme prejudice. 26562306a36Sopenharmony_ci */ 26662306a36Sopenharmony_ci if (fault_type == KERNEL_FAULT) 26762306a36Sopenharmony_ci printk(KERN_ALERT "Unable to handle kernel pointer dereference" 26862306a36Sopenharmony_ci " in virtual kernel address space\n"); 26962306a36Sopenharmony_ci else 27062306a36Sopenharmony_ci printk(KERN_ALERT "Unable to handle kernel paging request" 27162306a36Sopenharmony_ci " in virtual user address space\n"); 27262306a36Sopenharmony_ci dump_fault_info(regs); 27362306a36Sopenharmony_ci die(regs, "Oops"); 27462306a36Sopenharmony_ci} 27562306a36Sopenharmony_ci 27662306a36Sopenharmony_cistatic noinline void do_low_address(struct pt_regs *regs) 27762306a36Sopenharmony_ci{ 27862306a36Sopenharmony_ci /* Low-address protection hit in kernel mode means 27962306a36Sopenharmony_ci NULL pointer write access in kernel mode. */ 28062306a36Sopenharmony_ci if (regs->psw.mask & PSW_MASK_PSTATE) { 28162306a36Sopenharmony_ci /* Low-address protection hit in user mode 'cannot happen'. */ 28262306a36Sopenharmony_ci die (regs, "Low-address protection"); 28362306a36Sopenharmony_ci } 28462306a36Sopenharmony_ci 28562306a36Sopenharmony_ci do_no_context(regs, VM_FAULT_BADACCESS); 28662306a36Sopenharmony_ci} 28762306a36Sopenharmony_ci 28862306a36Sopenharmony_cistatic noinline void do_sigbus(struct pt_regs *regs) 28962306a36Sopenharmony_ci{ 29062306a36Sopenharmony_ci /* 29162306a36Sopenharmony_ci * Send a sigbus, regardless of whether we were in kernel 29262306a36Sopenharmony_ci * or user mode. 29362306a36Sopenharmony_ci */ 29462306a36Sopenharmony_ci force_sig_fault(SIGBUS, BUS_ADRERR, 29562306a36Sopenharmony_ci (void __user *)(regs->int_parm_long & __FAIL_ADDR_MASK)); 29662306a36Sopenharmony_ci} 29762306a36Sopenharmony_ci 29862306a36Sopenharmony_cistatic noinline void do_fault_error(struct pt_regs *regs, vm_fault_t fault) 29962306a36Sopenharmony_ci{ 30062306a36Sopenharmony_ci int si_code; 30162306a36Sopenharmony_ci 30262306a36Sopenharmony_ci switch (fault) { 30362306a36Sopenharmony_ci case VM_FAULT_BADACCESS: 30462306a36Sopenharmony_ci case VM_FAULT_BADMAP: 30562306a36Sopenharmony_ci /* Bad memory access. Check if it is kernel or user space. */ 30662306a36Sopenharmony_ci if (user_mode(regs)) { 30762306a36Sopenharmony_ci /* User mode accesses just cause a SIGSEGV */ 30862306a36Sopenharmony_ci si_code = (fault == VM_FAULT_BADMAP) ? 30962306a36Sopenharmony_ci SEGV_MAPERR : SEGV_ACCERR; 31062306a36Sopenharmony_ci do_sigsegv(regs, si_code); 31162306a36Sopenharmony_ci break; 31262306a36Sopenharmony_ci } 31362306a36Sopenharmony_ci fallthrough; 31462306a36Sopenharmony_ci case VM_FAULT_BADCONTEXT: 31562306a36Sopenharmony_ci case VM_FAULT_PFAULT: 31662306a36Sopenharmony_ci do_no_context(regs, fault); 31762306a36Sopenharmony_ci break; 31862306a36Sopenharmony_ci case VM_FAULT_SIGNAL: 31962306a36Sopenharmony_ci if (!user_mode(regs)) 32062306a36Sopenharmony_ci do_no_context(regs, fault); 32162306a36Sopenharmony_ci break; 32262306a36Sopenharmony_ci default: /* fault & VM_FAULT_ERROR */ 32362306a36Sopenharmony_ci if (fault & VM_FAULT_OOM) { 32462306a36Sopenharmony_ci if (!user_mode(regs)) 32562306a36Sopenharmony_ci do_no_context(regs, fault); 32662306a36Sopenharmony_ci else 32762306a36Sopenharmony_ci pagefault_out_of_memory(); 32862306a36Sopenharmony_ci } else if (fault & VM_FAULT_SIGSEGV) { 32962306a36Sopenharmony_ci /* Kernel mode? Handle exceptions or die */ 33062306a36Sopenharmony_ci if (!user_mode(regs)) 33162306a36Sopenharmony_ci do_no_context(regs, fault); 33262306a36Sopenharmony_ci else 33362306a36Sopenharmony_ci do_sigsegv(regs, SEGV_MAPERR); 33462306a36Sopenharmony_ci } else if (fault & VM_FAULT_SIGBUS) { 33562306a36Sopenharmony_ci /* Kernel mode? Handle exceptions or die */ 33662306a36Sopenharmony_ci if (!user_mode(regs)) 33762306a36Sopenharmony_ci do_no_context(regs, fault); 33862306a36Sopenharmony_ci else 33962306a36Sopenharmony_ci do_sigbus(regs); 34062306a36Sopenharmony_ci } else 34162306a36Sopenharmony_ci BUG(); 34262306a36Sopenharmony_ci break; 34362306a36Sopenharmony_ci } 34462306a36Sopenharmony_ci} 34562306a36Sopenharmony_ci 34662306a36Sopenharmony_ci/* 34762306a36Sopenharmony_ci * This routine handles page faults. It determines the address, 34862306a36Sopenharmony_ci * and the problem, and then passes it off to one of the appropriate 34962306a36Sopenharmony_ci * routines. 35062306a36Sopenharmony_ci * 35162306a36Sopenharmony_ci * interruption code (int_code): 35262306a36Sopenharmony_ci * 04 Protection -> Write-Protection (suppression) 35362306a36Sopenharmony_ci * 10 Segment translation -> Not present (nullification) 35462306a36Sopenharmony_ci * 11 Page translation -> Not present (nullification) 35562306a36Sopenharmony_ci * 3b Region third trans. -> Not present (nullification) 35662306a36Sopenharmony_ci */ 35762306a36Sopenharmony_cistatic inline vm_fault_t do_exception(struct pt_regs *regs, int access) 35862306a36Sopenharmony_ci{ 35962306a36Sopenharmony_ci struct gmap *gmap; 36062306a36Sopenharmony_ci struct task_struct *tsk; 36162306a36Sopenharmony_ci struct mm_struct *mm; 36262306a36Sopenharmony_ci struct vm_area_struct *vma; 36362306a36Sopenharmony_ci enum fault_type type; 36462306a36Sopenharmony_ci unsigned long address; 36562306a36Sopenharmony_ci unsigned int flags; 36662306a36Sopenharmony_ci vm_fault_t fault; 36762306a36Sopenharmony_ci bool is_write; 36862306a36Sopenharmony_ci 36962306a36Sopenharmony_ci tsk = current; 37062306a36Sopenharmony_ci /* 37162306a36Sopenharmony_ci * The instruction that caused the program check has 37262306a36Sopenharmony_ci * been nullified. Don't signal single step via SIGTRAP. 37362306a36Sopenharmony_ci */ 37462306a36Sopenharmony_ci clear_thread_flag(TIF_PER_TRAP); 37562306a36Sopenharmony_ci 37662306a36Sopenharmony_ci if (kprobe_page_fault(regs, 14)) 37762306a36Sopenharmony_ci return 0; 37862306a36Sopenharmony_ci 37962306a36Sopenharmony_ci mm = tsk->mm; 38062306a36Sopenharmony_ci address = get_fault_address(regs); 38162306a36Sopenharmony_ci is_write = fault_is_write(regs); 38262306a36Sopenharmony_ci 38362306a36Sopenharmony_ci /* 38462306a36Sopenharmony_ci * Verify that the fault happened in user space, that 38562306a36Sopenharmony_ci * we are not in an interrupt and that there is a 38662306a36Sopenharmony_ci * user context. 38762306a36Sopenharmony_ci */ 38862306a36Sopenharmony_ci fault = VM_FAULT_BADCONTEXT; 38962306a36Sopenharmony_ci type = get_fault_type(regs); 39062306a36Sopenharmony_ci switch (type) { 39162306a36Sopenharmony_ci case KERNEL_FAULT: 39262306a36Sopenharmony_ci goto out; 39362306a36Sopenharmony_ci case USER_FAULT: 39462306a36Sopenharmony_ci case GMAP_FAULT: 39562306a36Sopenharmony_ci if (faulthandler_disabled() || !mm) 39662306a36Sopenharmony_ci goto out; 39762306a36Sopenharmony_ci break; 39862306a36Sopenharmony_ci } 39962306a36Sopenharmony_ci 40062306a36Sopenharmony_ci perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS, 1, regs, address); 40162306a36Sopenharmony_ci flags = FAULT_FLAG_DEFAULT; 40262306a36Sopenharmony_ci if (user_mode(regs)) 40362306a36Sopenharmony_ci flags |= FAULT_FLAG_USER; 40462306a36Sopenharmony_ci if (is_write) 40562306a36Sopenharmony_ci access = VM_WRITE; 40662306a36Sopenharmony_ci if (access == VM_WRITE) 40762306a36Sopenharmony_ci flags |= FAULT_FLAG_WRITE; 40862306a36Sopenharmony_ci if (!(flags & FAULT_FLAG_USER)) 40962306a36Sopenharmony_ci goto lock_mmap; 41062306a36Sopenharmony_ci vma = lock_vma_under_rcu(mm, address); 41162306a36Sopenharmony_ci if (!vma) 41262306a36Sopenharmony_ci goto lock_mmap; 41362306a36Sopenharmony_ci if (!(vma->vm_flags & access)) { 41462306a36Sopenharmony_ci vma_end_read(vma); 41562306a36Sopenharmony_ci goto lock_mmap; 41662306a36Sopenharmony_ci } 41762306a36Sopenharmony_ci fault = handle_mm_fault(vma, address, flags | FAULT_FLAG_VMA_LOCK, regs); 41862306a36Sopenharmony_ci if (!(fault & (VM_FAULT_RETRY | VM_FAULT_COMPLETED))) 41962306a36Sopenharmony_ci vma_end_read(vma); 42062306a36Sopenharmony_ci if (!(fault & VM_FAULT_RETRY)) { 42162306a36Sopenharmony_ci count_vm_vma_lock_event(VMA_LOCK_SUCCESS); 42262306a36Sopenharmony_ci if (likely(!(fault & VM_FAULT_ERROR))) 42362306a36Sopenharmony_ci fault = 0; 42462306a36Sopenharmony_ci goto out; 42562306a36Sopenharmony_ci } 42662306a36Sopenharmony_ci count_vm_vma_lock_event(VMA_LOCK_RETRY); 42762306a36Sopenharmony_ci /* Quick path to respond to signals */ 42862306a36Sopenharmony_ci if (fault_signal_pending(fault, regs)) { 42962306a36Sopenharmony_ci fault = VM_FAULT_SIGNAL; 43062306a36Sopenharmony_ci goto out; 43162306a36Sopenharmony_ci } 43262306a36Sopenharmony_cilock_mmap: 43362306a36Sopenharmony_ci mmap_read_lock(mm); 43462306a36Sopenharmony_ci 43562306a36Sopenharmony_ci gmap = NULL; 43662306a36Sopenharmony_ci if (IS_ENABLED(CONFIG_PGSTE) && type == GMAP_FAULT) { 43762306a36Sopenharmony_ci gmap = (struct gmap *) S390_lowcore.gmap; 43862306a36Sopenharmony_ci current->thread.gmap_addr = address; 43962306a36Sopenharmony_ci current->thread.gmap_write_flag = !!(flags & FAULT_FLAG_WRITE); 44062306a36Sopenharmony_ci current->thread.gmap_int_code = regs->int_code & 0xffff; 44162306a36Sopenharmony_ci address = __gmap_translate(gmap, address); 44262306a36Sopenharmony_ci if (address == -EFAULT) { 44362306a36Sopenharmony_ci fault = VM_FAULT_BADMAP; 44462306a36Sopenharmony_ci goto out_up; 44562306a36Sopenharmony_ci } 44662306a36Sopenharmony_ci if (gmap->pfault_enabled) 44762306a36Sopenharmony_ci flags |= FAULT_FLAG_RETRY_NOWAIT; 44862306a36Sopenharmony_ci } 44962306a36Sopenharmony_ci 45062306a36Sopenharmony_ciretry: 45162306a36Sopenharmony_ci fault = VM_FAULT_BADMAP; 45262306a36Sopenharmony_ci vma = find_vma(mm, address); 45362306a36Sopenharmony_ci if (!vma) 45462306a36Sopenharmony_ci goto out_up; 45562306a36Sopenharmony_ci 45662306a36Sopenharmony_ci if (unlikely(vma->vm_start > address)) { 45762306a36Sopenharmony_ci if (!(vma->vm_flags & VM_GROWSDOWN)) 45862306a36Sopenharmony_ci goto out_up; 45962306a36Sopenharmony_ci vma = expand_stack(mm, address); 46062306a36Sopenharmony_ci if (!vma) 46162306a36Sopenharmony_ci goto out; 46262306a36Sopenharmony_ci } 46362306a36Sopenharmony_ci 46462306a36Sopenharmony_ci /* 46562306a36Sopenharmony_ci * Ok, we have a good vm_area for this memory access, so 46662306a36Sopenharmony_ci * we can handle it.. 46762306a36Sopenharmony_ci */ 46862306a36Sopenharmony_ci fault = VM_FAULT_BADACCESS; 46962306a36Sopenharmony_ci if (unlikely(!(vma->vm_flags & access))) 47062306a36Sopenharmony_ci goto out_up; 47162306a36Sopenharmony_ci 47262306a36Sopenharmony_ci /* 47362306a36Sopenharmony_ci * If for any reason at all we couldn't handle the fault, 47462306a36Sopenharmony_ci * make sure we exit gracefully rather than endlessly redo 47562306a36Sopenharmony_ci * the fault. 47662306a36Sopenharmony_ci */ 47762306a36Sopenharmony_ci fault = handle_mm_fault(vma, address, flags, regs); 47862306a36Sopenharmony_ci if (fault_signal_pending(fault, regs)) { 47962306a36Sopenharmony_ci fault = VM_FAULT_SIGNAL; 48062306a36Sopenharmony_ci if (flags & FAULT_FLAG_RETRY_NOWAIT) 48162306a36Sopenharmony_ci goto out_up; 48262306a36Sopenharmony_ci goto out; 48362306a36Sopenharmony_ci } 48462306a36Sopenharmony_ci 48562306a36Sopenharmony_ci /* The fault is fully completed (including releasing mmap lock) */ 48662306a36Sopenharmony_ci if (fault & VM_FAULT_COMPLETED) { 48762306a36Sopenharmony_ci if (gmap) { 48862306a36Sopenharmony_ci mmap_read_lock(mm); 48962306a36Sopenharmony_ci goto out_gmap; 49062306a36Sopenharmony_ci } 49162306a36Sopenharmony_ci fault = 0; 49262306a36Sopenharmony_ci goto out; 49362306a36Sopenharmony_ci } 49462306a36Sopenharmony_ci 49562306a36Sopenharmony_ci if (unlikely(fault & VM_FAULT_ERROR)) 49662306a36Sopenharmony_ci goto out_up; 49762306a36Sopenharmony_ci 49862306a36Sopenharmony_ci if (fault & VM_FAULT_RETRY) { 49962306a36Sopenharmony_ci if (IS_ENABLED(CONFIG_PGSTE) && gmap && 50062306a36Sopenharmony_ci (flags & FAULT_FLAG_RETRY_NOWAIT)) { 50162306a36Sopenharmony_ci /* 50262306a36Sopenharmony_ci * FAULT_FLAG_RETRY_NOWAIT has been set, mmap_lock has 50362306a36Sopenharmony_ci * not been released 50462306a36Sopenharmony_ci */ 50562306a36Sopenharmony_ci current->thread.gmap_pfault = 1; 50662306a36Sopenharmony_ci fault = VM_FAULT_PFAULT; 50762306a36Sopenharmony_ci goto out_up; 50862306a36Sopenharmony_ci } 50962306a36Sopenharmony_ci flags &= ~FAULT_FLAG_RETRY_NOWAIT; 51062306a36Sopenharmony_ci flags |= FAULT_FLAG_TRIED; 51162306a36Sopenharmony_ci mmap_read_lock(mm); 51262306a36Sopenharmony_ci goto retry; 51362306a36Sopenharmony_ci } 51462306a36Sopenharmony_ciout_gmap: 51562306a36Sopenharmony_ci if (IS_ENABLED(CONFIG_PGSTE) && gmap) { 51662306a36Sopenharmony_ci address = __gmap_link(gmap, current->thread.gmap_addr, 51762306a36Sopenharmony_ci address); 51862306a36Sopenharmony_ci if (address == -EFAULT) { 51962306a36Sopenharmony_ci fault = VM_FAULT_BADMAP; 52062306a36Sopenharmony_ci goto out_up; 52162306a36Sopenharmony_ci } 52262306a36Sopenharmony_ci if (address == -ENOMEM) { 52362306a36Sopenharmony_ci fault = VM_FAULT_OOM; 52462306a36Sopenharmony_ci goto out_up; 52562306a36Sopenharmony_ci } 52662306a36Sopenharmony_ci } 52762306a36Sopenharmony_ci fault = 0; 52862306a36Sopenharmony_ciout_up: 52962306a36Sopenharmony_ci mmap_read_unlock(mm); 53062306a36Sopenharmony_ciout: 53162306a36Sopenharmony_ci return fault; 53262306a36Sopenharmony_ci} 53362306a36Sopenharmony_ci 53462306a36Sopenharmony_civoid do_protection_exception(struct pt_regs *regs) 53562306a36Sopenharmony_ci{ 53662306a36Sopenharmony_ci unsigned long trans_exc_code; 53762306a36Sopenharmony_ci int access; 53862306a36Sopenharmony_ci vm_fault_t fault; 53962306a36Sopenharmony_ci 54062306a36Sopenharmony_ci trans_exc_code = regs->int_parm_long; 54162306a36Sopenharmony_ci /* 54262306a36Sopenharmony_ci * Protection exceptions are suppressing, decrement psw address. 54362306a36Sopenharmony_ci * The exception to this rule are aborted transactions, for these 54462306a36Sopenharmony_ci * the PSW already points to the correct location. 54562306a36Sopenharmony_ci */ 54662306a36Sopenharmony_ci if (!(regs->int_code & 0x200)) 54762306a36Sopenharmony_ci regs->psw.addr = __rewind_psw(regs->psw, regs->int_code >> 16); 54862306a36Sopenharmony_ci /* 54962306a36Sopenharmony_ci * Check for low-address protection. This needs to be treated 55062306a36Sopenharmony_ci * as a special case because the translation exception code 55162306a36Sopenharmony_ci * field is not guaranteed to contain valid data in this case. 55262306a36Sopenharmony_ci */ 55362306a36Sopenharmony_ci if (unlikely(!(trans_exc_code & 4))) { 55462306a36Sopenharmony_ci do_low_address(regs); 55562306a36Sopenharmony_ci return; 55662306a36Sopenharmony_ci } 55762306a36Sopenharmony_ci if (unlikely(MACHINE_HAS_NX && (trans_exc_code & 0x80))) { 55862306a36Sopenharmony_ci regs->int_parm_long = (trans_exc_code & ~PAGE_MASK) | 55962306a36Sopenharmony_ci (regs->psw.addr & PAGE_MASK); 56062306a36Sopenharmony_ci access = VM_EXEC; 56162306a36Sopenharmony_ci fault = VM_FAULT_BADACCESS; 56262306a36Sopenharmony_ci } else { 56362306a36Sopenharmony_ci access = VM_WRITE; 56462306a36Sopenharmony_ci fault = do_exception(regs, access); 56562306a36Sopenharmony_ci } 56662306a36Sopenharmony_ci if (unlikely(fault)) 56762306a36Sopenharmony_ci do_fault_error(regs, fault); 56862306a36Sopenharmony_ci} 56962306a36Sopenharmony_ciNOKPROBE_SYMBOL(do_protection_exception); 57062306a36Sopenharmony_ci 57162306a36Sopenharmony_civoid do_dat_exception(struct pt_regs *regs) 57262306a36Sopenharmony_ci{ 57362306a36Sopenharmony_ci int access; 57462306a36Sopenharmony_ci vm_fault_t fault; 57562306a36Sopenharmony_ci 57662306a36Sopenharmony_ci access = VM_ACCESS_FLAGS; 57762306a36Sopenharmony_ci fault = do_exception(regs, access); 57862306a36Sopenharmony_ci if (unlikely(fault)) 57962306a36Sopenharmony_ci do_fault_error(regs, fault); 58062306a36Sopenharmony_ci} 58162306a36Sopenharmony_ciNOKPROBE_SYMBOL(do_dat_exception); 58262306a36Sopenharmony_ci 58362306a36Sopenharmony_ci#if IS_ENABLED(CONFIG_PGSTE) 58462306a36Sopenharmony_ci 58562306a36Sopenharmony_civoid do_secure_storage_access(struct pt_regs *regs) 58662306a36Sopenharmony_ci{ 58762306a36Sopenharmony_ci unsigned long addr = regs->int_parm_long & __FAIL_ADDR_MASK; 58862306a36Sopenharmony_ci struct vm_area_struct *vma; 58962306a36Sopenharmony_ci struct mm_struct *mm; 59062306a36Sopenharmony_ci struct page *page; 59162306a36Sopenharmony_ci struct gmap *gmap; 59262306a36Sopenharmony_ci int rc; 59362306a36Sopenharmony_ci 59462306a36Sopenharmony_ci /* 59562306a36Sopenharmony_ci * bit 61 tells us if the address is valid, if it's not we 59662306a36Sopenharmony_ci * have a major problem and should stop the kernel or send a 59762306a36Sopenharmony_ci * SIGSEGV to the process. Unfortunately bit 61 is not 59862306a36Sopenharmony_ci * reliable without the misc UV feature so we need to check 59962306a36Sopenharmony_ci * for that as well. 60062306a36Sopenharmony_ci */ 60162306a36Sopenharmony_ci if (uv_has_feature(BIT_UV_FEAT_MISC) && 60262306a36Sopenharmony_ci !test_bit_inv(61, ®s->int_parm_long)) { 60362306a36Sopenharmony_ci /* 60462306a36Sopenharmony_ci * When this happens, userspace did something that it 60562306a36Sopenharmony_ci * was not supposed to do, e.g. branching into secure 60662306a36Sopenharmony_ci * memory. Trigger a segmentation fault. 60762306a36Sopenharmony_ci */ 60862306a36Sopenharmony_ci if (user_mode(regs)) { 60962306a36Sopenharmony_ci send_sig(SIGSEGV, current, 0); 61062306a36Sopenharmony_ci return; 61162306a36Sopenharmony_ci } 61262306a36Sopenharmony_ci 61362306a36Sopenharmony_ci /* 61462306a36Sopenharmony_ci * The kernel should never run into this case and we 61562306a36Sopenharmony_ci * have no way out of this situation. 61662306a36Sopenharmony_ci */ 61762306a36Sopenharmony_ci panic("Unexpected PGM 0x3d with TEID bit 61=0"); 61862306a36Sopenharmony_ci } 61962306a36Sopenharmony_ci 62062306a36Sopenharmony_ci switch (get_fault_type(regs)) { 62162306a36Sopenharmony_ci case GMAP_FAULT: 62262306a36Sopenharmony_ci mm = current->mm; 62362306a36Sopenharmony_ci gmap = (struct gmap *)S390_lowcore.gmap; 62462306a36Sopenharmony_ci mmap_read_lock(mm); 62562306a36Sopenharmony_ci addr = __gmap_translate(gmap, addr); 62662306a36Sopenharmony_ci mmap_read_unlock(mm); 62762306a36Sopenharmony_ci if (IS_ERR_VALUE(addr)) { 62862306a36Sopenharmony_ci do_fault_error(regs, VM_FAULT_BADMAP); 62962306a36Sopenharmony_ci break; 63062306a36Sopenharmony_ci } 63162306a36Sopenharmony_ci fallthrough; 63262306a36Sopenharmony_ci case USER_FAULT: 63362306a36Sopenharmony_ci mm = current->mm; 63462306a36Sopenharmony_ci mmap_read_lock(mm); 63562306a36Sopenharmony_ci vma = find_vma(mm, addr); 63662306a36Sopenharmony_ci if (!vma) { 63762306a36Sopenharmony_ci mmap_read_unlock(mm); 63862306a36Sopenharmony_ci do_fault_error(regs, VM_FAULT_BADMAP); 63962306a36Sopenharmony_ci break; 64062306a36Sopenharmony_ci } 64162306a36Sopenharmony_ci page = follow_page(vma, addr, FOLL_WRITE | FOLL_GET); 64262306a36Sopenharmony_ci if (IS_ERR_OR_NULL(page)) { 64362306a36Sopenharmony_ci mmap_read_unlock(mm); 64462306a36Sopenharmony_ci break; 64562306a36Sopenharmony_ci } 64662306a36Sopenharmony_ci if (arch_make_page_accessible(page)) 64762306a36Sopenharmony_ci send_sig(SIGSEGV, current, 0); 64862306a36Sopenharmony_ci put_page(page); 64962306a36Sopenharmony_ci mmap_read_unlock(mm); 65062306a36Sopenharmony_ci break; 65162306a36Sopenharmony_ci case KERNEL_FAULT: 65262306a36Sopenharmony_ci page = phys_to_page(addr); 65362306a36Sopenharmony_ci if (unlikely(!try_get_page(page))) 65462306a36Sopenharmony_ci break; 65562306a36Sopenharmony_ci rc = arch_make_page_accessible(page); 65662306a36Sopenharmony_ci put_page(page); 65762306a36Sopenharmony_ci if (rc) 65862306a36Sopenharmony_ci BUG(); 65962306a36Sopenharmony_ci break; 66062306a36Sopenharmony_ci default: 66162306a36Sopenharmony_ci do_fault_error(regs, VM_FAULT_BADMAP); 66262306a36Sopenharmony_ci WARN_ON_ONCE(1); 66362306a36Sopenharmony_ci } 66462306a36Sopenharmony_ci} 66562306a36Sopenharmony_ciNOKPROBE_SYMBOL(do_secure_storage_access); 66662306a36Sopenharmony_ci 66762306a36Sopenharmony_civoid do_non_secure_storage_access(struct pt_regs *regs) 66862306a36Sopenharmony_ci{ 66962306a36Sopenharmony_ci unsigned long gaddr = regs->int_parm_long & __FAIL_ADDR_MASK; 67062306a36Sopenharmony_ci struct gmap *gmap = (struct gmap *)S390_lowcore.gmap; 67162306a36Sopenharmony_ci 67262306a36Sopenharmony_ci if (get_fault_type(regs) != GMAP_FAULT) { 67362306a36Sopenharmony_ci do_fault_error(regs, VM_FAULT_BADMAP); 67462306a36Sopenharmony_ci WARN_ON_ONCE(1); 67562306a36Sopenharmony_ci return; 67662306a36Sopenharmony_ci } 67762306a36Sopenharmony_ci 67862306a36Sopenharmony_ci if (gmap_convert_to_secure(gmap, gaddr) == -EINVAL) 67962306a36Sopenharmony_ci send_sig(SIGSEGV, current, 0); 68062306a36Sopenharmony_ci} 68162306a36Sopenharmony_ciNOKPROBE_SYMBOL(do_non_secure_storage_access); 68262306a36Sopenharmony_ci 68362306a36Sopenharmony_civoid do_secure_storage_violation(struct pt_regs *regs) 68462306a36Sopenharmony_ci{ 68562306a36Sopenharmony_ci unsigned long gaddr = regs->int_parm_long & __FAIL_ADDR_MASK; 68662306a36Sopenharmony_ci struct gmap *gmap = (struct gmap *)S390_lowcore.gmap; 68762306a36Sopenharmony_ci 68862306a36Sopenharmony_ci /* 68962306a36Sopenharmony_ci * If the VM has been rebooted, its address space might still contain 69062306a36Sopenharmony_ci * secure pages from the previous boot. 69162306a36Sopenharmony_ci * Clear the page so it can be reused. 69262306a36Sopenharmony_ci */ 69362306a36Sopenharmony_ci if (!gmap_destroy_page(gmap, gaddr)) 69462306a36Sopenharmony_ci return; 69562306a36Sopenharmony_ci /* 69662306a36Sopenharmony_ci * Either KVM messed up the secure guest mapping or the same 69762306a36Sopenharmony_ci * page is mapped into multiple secure guests. 69862306a36Sopenharmony_ci * 69962306a36Sopenharmony_ci * This exception is only triggered when a guest 2 is running 70062306a36Sopenharmony_ci * and can therefore never occur in kernel context. 70162306a36Sopenharmony_ci */ 70262306a36Sopenharmony_ci printk_ratelimited(KERN_WARNING 70362306a36Sopenharmony_ci "Secure storage violation in task: %s, pid %d\n", 70462306a36Sopenharmony_ci current->comm, current->pid); 70562306a36Sopenharmony_ci send_sig(SIGSEGV, current, 0); 70662306a36Sopenharmony_ci} 70762306a36Sopenharmony_ci 70862306a36Sopenharmony_ci#endif /* CONFIG_PGSTE */ 709