mirror of
https://github.com/hardkernel/linux.git
synced 2026-06-07 11:26:02 +09:00
FROMLIST: x86/mm: attempt speculative mm faults first
Attempt speculative mm fault handling first, and fall back to the existing (non-speculative) code if that fails. The speculative handling closely mirrors the non-speculative logic. This includes some x86 specific bits such as the access_error() call. This is why we chose to implement the speculative handling in arch/x86 rather than in common code. The vma is first looked up and copied, under protection of the rcu read lock. The mmap lock sequence count is used to verify the integrity of the copied vma, and passed to do_handle_mm_fault() to allow checking against races with mmap writers when finalizing the fault. Signed-off-by: Michel Lespinasse <michel@lespinasse.org> Link: https://lore.kernel.org/all/20220128131006.67712-14-michel@lespinasse.org/ Bug: 161210518 Signed-off-by: Suren Baghdasaryan <surenb@google.com> Change-Id: I2c078a173ee39f35af16daeee8c6a1466d10c3e8
This commit is contained in:
committed by
Todd Kjos
parent
0823d516af
commit
4dea585cfe
@@ -1226,6 +1226,10 @@ void do_user_addr_fault(struct pt_regs *regs,
|
||||
struct mm_struct *mm;
|
||||
vm_fault_t fault;
|
||||
unsigned int flags = FAULT_FLAG_DEFAULT;
|
||||
#ifdef CONFIG_SPECULATIVE_PAGE_FAULT
|
||||
struct vm_area_struct pvma;
|
||||
unsigned long seq;
|
||||
#endif
|
||||
|
||||
tsk = current;
|
||||
mm = tsk->mm;
|
||||
@@ -1323,6 +1327,43 @@ void do_user_addr_fault(struct pt_regs *regs,
|
||||
}
|
||||
#endif
|
||||
|
||||
#ifdef CONFIG_SPECULATIVE_PAGE_FAULT
|
||||
count_vm_event(SPF_ATTEMPT);
|
||||
seq = mmap_seq_read_start(mm);
|
||||
if (seq & 1)
|
||||
goto spf_abort;
|
||||
rcu_read_lock();
|
||||
vma = __find_vma(mm, address);
|
||||
if (!vma || vma->vm_start > address) {
|
||||
rcu_read_unlock();
|
||||
goto spf_abort;
|
||||
}
|
||||
pvma = *vma;
|
||||
rcu_read_unlock();
|
||||
if (!mmap_seq_read_check(mm, seq))
|
||||
goto spf_abort;
|
||||
vma = &pvma;
|
||||
if (unlikely(access_error(error_code, vma)))
|
||||
goto spf_abort;
|
||||
fault = do_handle_mm_fault(vma, address,
|
||||
flags | FAULT_FLAG_SPECULATIVE, seq, regs);
|
||||
|
||||
if (!(fault & VM_FAULT_RETRY))
|
||||
goto done;
|
||||
|
||||
/* Quick path to respond to signals */
|
||||
if (fault_signal_pending(fault, regs)) {
|
||||
if (!user_mode(regs))
|
||||
kernelmode_fixup_or_oops(regs, error_code, address,
|
||||
SIGBUS, BUS_ADRERR,
|
||||
ARCH_DEFAULT_PKEY);
|
||||
return;
|
||||
}
|
||||
|
||||
spf_abort:
|
||||
count_vm_event(SPF_ABORT);
|
||||
#endif
|
||||
|
||||
/*
|
||||
* Kernel-mode access to the user address space should only occur
|
||||
* on well-defined single instructions listed in the exception
|
||||
@@ -1420,6 +1461,9 @@ good_area:
|
||||
}
|
||||
|
||||
mmap_read_unlock(mm);
|
||||
#ifdef CONFIG_SPECULATIVE_PAGE_FAULT
|
||||
done:
|
||||
#endif
|
||||
if (likely(!(fault & VM_FAULT_ERROR)))
|
||||
return;
|
||||
|
||||
|
||||
@@ -322,6 +322,11 @@ struct anon_vma_name {
|
||||
* per VM-area/task. A VM area is any part of the process virtual memory
|
||||
* space that has a special rule for the page-fault handlers (ie a shared
|
||||
* library, the executable area etc).
|
||||
*
|
||||
* Note that speculative page faults make an on-stack copy of the VMA,
|
||||
* so the structure size matters.
|
||||
* (TODO - it would be preferable to copy only the required vma attributes
|
||||
* rather than the entire vma).
|
||||
*/
|
||||
struct vm_area_struct {
|
||||
/* The first cache line has the info for VMA tree walking. */
|
||||
|
||||
@@ -130,6 +130,10 @@ enum vm_event_item { PGPGIN, PGPGOUT, PSWPIN, PSWPOUT,
|
||||
#ifdef CONFIG_X86
|
||||
DIRECT_MAP_LEVEL2_SPLIT,
|
||||
DIRECT_MAP_LEVEL3_SPLIT,
|
||||
#endif
|
||||
#ifdef CONFIG_SPECULATIVE_PAGE_FAULT
|
||||
SPF_ATTEMPT,
|
||||
SPF_ABORT,
|
||||
#endif
|
||||
NR_VM_EVENT_ITEMS
|
||||
};
|
||||
|
||||
@@ -1379,6 +1379,10 @@ const char * const vmstat_text[] = {
|
||||
"direct_map_level2_splits",
|
||||
"direct_map_level3_splits",
|
||||
#endif
|
||||
#ifdef CONFIG_SPECULATIVE_PAGE_FAULT
|
||||
"spf_attempt",
|
||||
"spf_abort",
|
||||
#endif
|
||||
#endif /* CONFIG_VM_EVENT_COUNTERS || CONFIG_MEMCG */
|
||||
};
|
||||
#endif /* CONFIG_PROC_FS || CONFIG_SYSFS || CONFIG_NUMA || CONFIG_MEMCG */
|
||||
|
||||
Reference in New Issue
Block a user