Merge branch 'siginfo-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/ebiederm/user-namespace

author Linus Torvalds <torvalds@linux-foundation.org>

Wed, 24 Oct 2018 10:22:39 +0000 (11:22 +0100)

committer Linus Torvalds <torvalds@linux-foundation.org>

Wed, 24 Oct 2018 10:22:39 +0000 (11:22 +0100)
author Linus Torvalds <torvalds@linux-foundation.org>
Wed, 24 Oct 2018 10:22:39 +0000 (11:22 +0100)
committer Linus Torvalds <torvalds@linux-foundation.org>
Wed, 24 Oct 2018 10:22:39 +0000 (11:22 +0100)
diff --cc arch/arm/vfp/vfpmodule.c
Simple merge
diff --cc arch/arm64/kernel/traps.c

index 4066da7,856b32a..5f4d9ac
--- 1/arch/arm64/kernel/traps.c
--- 2/arch/arm64/kernel/traps.c
+++ b/arch/arm64/kernel/traps.c
@@@ -353,12 -366,6 +368,9 @@@ void force_signal_inject(int signal, in
         const char *desc;
         struct pt_regs *regs = current_pt_regs();
   
-       clear_siginfo(&info);
- 
+ +      if (WARN_ON(!user_mode(regs)))
+ +              return;
+ +
         switch (signal) {
         case SIGILL:
                 desc = "undefined instruction";
diff --cc arch/arm64/mm/fault.c

index d0e638e,f0ccb20..7d9571f
--- 1/arch/arm64/mm/fault.c
--- 2/arch/arm64/mm/fault.c
+++ b/arch/arm64/mm/fault.c
@@@ -789,17 -767,11 +773,11 @@@ asmlinkage void __exception do_sp_pc_ab
         if (user_mode(regs)) {
                 if (instruction_pointer(regs) > TASK_SIZE)
                         arm64_apply_bp_hardening();
- -              local_irq_enable();
+ +              local_daif_restore(DAIF_PROCCTX);
         }
   
-       clear_siginfo(&info);
-       info.si_signo = SIGBUS;
-       info.si_errno = 0;
-       info.si_code  = BUS_ADRALN;
-       info.si_addr  = (void __user *)addr;
-       arm64_notify_die("SP/PC alignment exception", regs, &info, esr);
+       arm64_notify_die("SP/PC alignment exception", regs,
+                        SIGBUS, BUS_ADRALN, (void __user *)addr, esr);
   }
   
   int __init early_brk64(unsigned long addr, unsigned int esr,
diff --cc arch/powerpc/kernel/process.c
Simple merge
diff --cc arch/x86/include/asm/ptrace.h
Simple merge
diff --cc arch/x86/kernel/ptrace.c
Simple merge
diff --cc arch/x86/kernel/traps.c

index 5bd0a99,34a327f..8f6dcd8
--- 1/arch/x86/kernel/traps.c
--- 2/arch/x86/kernel/traps.c
+++ b/arch/x86/kernel/traps.c
@@@ -202,11 -202,8 +202,8 @@@ do_trap_no_signal(struct task_struct *t
                                                 error_code, trapnr))
                                 return 0;
                 }
-               return -1;
-       }
- 
-       if (!user_mode(regs)) {
+       } else if (!user_mode(regs)) {
- -              if (fixup_exception(regs, trapnr))
+ +              if (fixup_exception(regs, trapnr, error_code, 0))
                         return 0;
   
                 tsk->thread.error_code = error_code;
@@@ -560,19 -540,9 +544,19 @@@ do_general_protection(struct pt_regs *r
   
                 tsk->thread.error_code = error_code;
                 tsk->thread.trap_nr = X86_TRAP_GP;
-               if (notify_die(DIE_GPF, "general protection fault", regs, error_code,
+ +
+ +              /*
+ +               * To be potentially processing a kprobe fault and to
+ +               * trust the result from kprobe_running(), we have to
+ +               * be non-preemptible.
+ +               */
+ +              if (!preemptible() && kprobe_running() &&
+ +                  kprobe_fault_handler(regs, X86_TRAP_GP))
+ +                      return;
+ +
+               if (notify_die(DIE_GPF, desc, regs, error_code,
                                X86_TRAP_GP, SIGSEGV) != NOTIFY_STOP)
-                       die("general protection fault", regs, error_code);
+                       die(desc, regs, error_code);
                 return;
         }
   
diff --cc arch/x86/kvm/mmu.c
Simple merge
diff --cc arch/x86/mm/fault.c

index 2b1519b,8d77700..b24eb4e
--- 1/arch/x86/mm/fault.c
--- 2/arch/x86/mm/fault.c
+++ b/arch/x86/mm/fault.c
@@@ -1237,74 -1187,41 +1190,73 @@@ do_kern_addr_fault(struct pt_regs *regs
          * only copy the information from the master page table,
          * nothing more.
          *
- -       * This verifies that the fault happens in kernel space
- -       * (error_code & 4) == 0, and that the fault was not a
- -       * protection error (error_code & 9) == 0.
+ +       * Before doing this on-demand faulting, ensure that the
+ +       * fault is not any of the following:
+ +       * 1. A fault on a PTE with a reserved bit set.
+ +       * 2. A fault caused by a user-mode access.  (Do not demand-
+ +       *    fault kernel memory due to user-mode accesses).
+ +       * 3. A fault caused by a page-level protection violation.
+ +       *    (A demand fault would be on a non-present page which
+ +       *     would have X86_PF_PROT==0).
          */
- -      if (unlikely(fault_in_kernel_space(address))) {
- -              if (!(error_code & (X86_PF_RSVD | X86_PF_USER | X86_PF_PROT))) {
- -                      if (vmalloc_fault(address) >= 0)
- -                              return;
- -              }
- -
- -              /* Can handle a stale RO->RW TLB: */
- -              if (spurious_fault(error_code, address))
+ +      if (!(hw_error_code & (X86_PF_RSVD | X86_PF_USER | X86_PF_PROT))) {
+ +              if (vmalloc_fault(address) >= 0)
                         return;
+ +      }
   
- -              /* kprobes don't want to hook the spurious faults: */
- -              if (kprobes_fault(regs))
- -                      return;
- -              /*
- -               * Don't take the mm semaphore here. If we fixup a prefetch
- -               * fault we could otherwise deadlock:
- -               */
- -              bad_area_nosemaphore(regs, error_code, address);
+ +      /* Was the fault spurious, caused by lazy TLB invalidation? */
+ +      if (spurious_kernel_fault(hw_error_code, address))
+ +              return;
   
+ +      /* kprobes don't want to hook the spurious faults: */
+ +      if (kprobes_fault(regs))
                 return;
- -      }
+ +
+ +      /*
+ +       * Note, despite being a "bad area", there are quite a few
+ +       * acceptable reasons to get here, such as erratum fixups
+ +       * and handling kernel code that can fault, like get_user().
+ +       *
+ +       * Don't take the mm semaphore here. If we fixup a prefetch
+ +       * fault we could otherwise deadlock:
+ +       */
-       bad_area_nosemaphore(regs, hw_error_code, address, NULL);
++      bad_area_nosemaphore(regs, hw_error_code, address);
+ +}
+ +NOKPROBE_SYMBOL(do_kern_addr_fault);
+ +
+ +/* Handle faults in the user portion of the address space */
+ +static inline
+ +void do_user_addr_fault(struct pt_regs *regs,
+ +                      unsigned long hw_error_code,
+ +                      unsigned long address)
+ +{
+ +      unsigned long sw_error_code;
+ +      struct vm_area_struct *vma;
+ +      struct task_struct *tsk;
+ +      struct mm_struct *mm;
+ +      vm_fault_t fault, major = 0;
+ +      unsigned int flags = FAULT_FLAG_ALLOW_RETRY | FAULT_FLAG_KILLABLE;
-       u32 pkey;
+ +
+ +      tsk = current;
+ +      mm = tsk->mm;
   
         /* kprobes don't want to hook the spurious faults: */
         if (unlikely(kprobes_fault(regs)))
                 return;
   
- -      if (unlikely(error_code & X86_PF_RSVD))
- -              pgtable_bad(regs, error_code, address);
+ +      /*
+ +       * Reserved bits are never expected to be set on
+ +       * entries in the user portion of the page tables.
+ +       */
+ +      if (unlikely(hw_error_code & X86_PF_RSVD))
+ +              pgtable_bad(regs, hw_error_code, address);
   
- -      if (unlikely(smap_violation(error_code, regs))) {
- -              bad_area_nosemaphore(regs, error_code, address);
+ +      /*
+ +       * Check for invalid kernel (supervisor) access to user
+ +       * pages in the user address space.
+ +       */
+ +      if (unlikely(smap_violation(hw_error_code, regs))) {
-               bad_area_nosemaphore(regs, hw_error_code, address, NULL);
++              bad_area_nosemaphore(regs, hw_error_code, address);
                 return;
         }
   
@@@ -1313,7 -1230,7 +1265,7 @@@
          * in a region with pagefaults disabled then we must not take the fault
          */
         if (unlikely(faulthandler_disabled() || !mm)) {
-               bad_area_nosemaphore(regs, hw_error_code, address, NULL);
- -              bad_area_nosemaphore(regs, error_code, address);
++              bad_area_nosemaphore(regs, hw_error_code, address);
                 return;
         }
   
@@@ -1361,49 -1252,31 +1313,49 @@@
   
         perf_sw_event(PERF_COUNT_SW_PAGE_FAULTS, 1, regs, address);
   
- -      if (error_code & X86_PF_WRITE)
+ +      if (sw_error_code & X86_PF_WRITE)
                 flags |= FAULT_FLAG_WRITE;
- -      if (error_code & X86_PF_INSTR)
+ +      if (sw_error_code & X86_PF_INSTR)
                 flags |= FAULT_FLAG_INSTRUCTION;
   
+ +#ifdef CONFIG_X86_64
+ +      /*
+ +       * Instruction fetch faults in the vsyscall page might need
+ +       * emulation.  The vsyscall page is at a high address
+ +       * (>PAGE_OFFSET), but is considered to be part of the user
+ +       * address space.
+ +       *
+ +       * The vsyscall page does not have a "real" VMA, so do this
+ +       * emulation before we go searching for VMAs.
+ +       */
+ +      if ((sw_error_code & X86_PF_INSTR) && is_vsyscall_vaddr(address)) {
+ +              if (emulate_vsyscall(regs, address))
+ +                      return;
+ +      }
+ +#endif
+ +
         /*
- -       * When running in the kernel we expect faults to occur only to
- -       * addresses in user space.  All other faults represent errors in
- -       * the kernel and should generate an OOPS.  Unfortunately, in the
- -       * case of an erroneous fault occurring in a code path which already
- -       * holds mmap_sem we will deadlock attempting to validate the fault
- -       * against the address space.  Luckily the kernel only validly
- -       * references user space from well defined areas of code, which are
- -       * listed in the exceptions table.
+ +       * Kernel-mode access to the user address space should only occur
+ +       * on well-defined single instructions listed in the exception
+ +       * tables.  But, an erroneous kernel fault occurring outside one of
+ +       * those areas which also holds mmap_sem might deadlock attempting
+ +       * to validate the fault against the address space.
          *
- -       * As the vast majority of faults will be valid we will only perform
- -       * the source reference check when there is a possibility of a
- -       * deadlock. Attempt to lock the address space, if we cannot we then
- -       * validate the source. If this is invalid we can skip the address
- -       * space check, thus avoiding the deadlock:
+ +       * Only do the expensive exception table search when we might be at
+ +       * risk of a deadlock.  This happens if we
+ +       * 1. Failed to acquire mmap_sem, and
+ +       * 2. The access did not originate in userspace.  Note: either the
+ +       *    hardware or earlier page fault code may set X86_PF_USER
+ +       *    in sw_error_code.
          */
         if (unlikely(!down_read_trylock(&mm->mmap_sem))) {
- -              if (!(error_code & X86_PF_USER) &&
+ +              if (!(sw_error_code & X86_PF_USER) &&
                     !search_exception_tables(regs->ip)) {
- -                      bad_area_nosemaphore(regs, error_code, address);
+ +                      /*
+ +                       * Fault from code in kernel from
+ +                       * which we do not expect faults.
+ +                       */
-                       bad_area_nosemaphore(regs, sw_error_code, address, NULL);
++                      bad_area_nosemaphore(regs, sw_error_code, address);
                         return;
                 }
   retry:
@@@ -1499,7 -1369,7 +1448,7 @@@ good_area
   
         up_read(&mm->mmap_sem);
         if (unlikely(fault & VM_FAULT_ERROR)) {
-               mm_fault_error(regs, sw_error_code, address, &pkey, fault);
- -              mm_fault_error(regs, error_code, address, fault);
++              mm_fault_error(regs, sw_error_code, address, fault);
                 return;
         }
   
diff --cc drivers/tty/tty_io.c
Simple merge
diff --cc drivers/usb/core/devio.c
Simple merge
diff --cc drivers/usb/gadget/function/f_mass_storage.c
Simple merge
diff --cc include/linux/compat.h
Simple merge
diff --cc include/linux/ptrace.h
Simple merge
diff --cc include/linux/sched.h
Simple merge
diff --cc kernel/ptrace.c
Simple merge
diff --cc kernel/signal.c
Simple merge
diff --cc mm/oom_kill.c
Simple merge
diff --cc virt/kvm/arm/mmu.c
Simple merge
author	Linus Torvalds <torvalds@linux-foundation.org>
	Wed, 24 Oct 2018 10:22:39 +0000 (11:22 +0100)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Wed, 24 Oct 2018 10:22:39 +0000 (11:22 +0100)
		1	2
arch/arm/vfp/vfpmodule.c	patch |	diff1 |	diff2 |	blob | history
arch/arm64/kernel/traps.c	patch |	diff1 |	diff2 |	blob | history
arch/arm64/mm/fault.c	patch |	diff1 |	diff2 |	blob | history
arch/powerpc/kernel/process.c	patch |	diff1 |	diff2 |	blob | history
arch/x86/include/asm/ptrace.h	patch |	diff1 |	diff2 |	blob | history
arch/x86/kernel/ptrace.c	patch |	diff1 |	diff2 |	blob | history
arch/x86/kernel/traps.c	patch |	diff1 |	diff2 |	blob | history
arch/x86/kvm/mmu.c	patch |	diff1 |	diff2 |	blob | history
arch/x86/mm/fault.c	patch |	diff1 |	diff2 |	blob | history
drivers/tty/tty_io.c	patch |	diff1 |	diff2 |	blob | history
drivers/usb/core/devio.c	patch |	diff1 |	diff2 |	blob | history
drivers/usb/gadget/function/f_mass_storage.c	patch |	diff1 |	diff2 |	blob | history
include/linux/compat.h	patch |	diff1 |	diff2 |	blob | history
include/linux/ptrace.h	patch |	diff1 |	diff2 |	blob | history
include/linux/sched.h	patch |	diff1 |	diff2 |	blob | history
kernel/ptrace.c	patch |	diff1 |	diff2 |	blob | history
kernel/signal.c	patch |	diff1 |	diff2 |	blob | history
mm/oom_kill.c	patch |	diff1 |	diff2 |	blob | history
virt/kvm/arm/mmu.c	patch |	diff1 |	diff2 |	blob | history