216 lines
6.9 KiB
Diff
216 lines
6.9 KiB
Diff
From b3eb743c32515bf8fca7b619dd2a2c64b5812dd8 Mon Sep 17 00:00:00 2001
|
|
From: Rik van Riel <riel@surriel.com>
|
|
Date: Tue, 25 Feb 2025 22:00:43 -0500
|
|
Subject: x86/mm: Handle global ASID context switch and TLB flush
|
|
|
|
Do context switch and TLB flush support for processes that use a global
|
|
ASID and PCID across all CPUs.
|
|
|
|
At both context switch time and TLB flush time, it needs to be checked whether
|
|
a task is switching to a global ASID, and, if so, reload the TLB with the new
|
|
ASID as appropriate.
|
|
|
|
In both code paths, the TLB flush is avoided if a global ASID is used, because
|
|
the global ASIDs are always kept up to date across CPUs, even when the
|
|
process is not running on a CPU.
|
|
|
|
[ bp:
|
|
- Massage
|
|
- :%s/\<static_cpu_has\>/cpu_feature_enabled/cgi
|
|
]
|
|
|
|
Signed-off-by: Rik van Riel <riel@surriel.com>
|
|
Signed-off-by: Borislav Petkov (AMD) <bp@alien8.de>
|
|
Link: https://lore.kernel.org/r/20250226030129.530345-9-riel@surriel.com
|
|
---
|
|
arch/x86/include/asm/tlbflush.h | 14 ++++++
|
|
arch/x86/mm/tlb.c | 77 ++++++++++++++++++++++++++++++---
|
|
2 files changed, 84 insertions(+), 7 deletions(-)
|
|
|
|
--- a/arch/x86/include/asm/tlbflush.h
|
|
+++ b/arch/x86/include/asm/tlbflush.h
|
|
@@ -240,6 +240,11 @@ static inline bool is_dyn_asid(u16 asid)
|
|
return asid < TLB_NR_DYN_ASIDS;
|
|
}
|
|
|
|
+static inline bool is_global_asid(u16 asid)
|
|
+{
|
|
+ return !is_dyn_asid(asid);
|
|
+}
|
|
+
|
|
#ifdef CONFIG_BROADCAST_TLB_FLUSH
|
|
static inline u16 mm_global_asid(struct mm_struct *mm)
|
|
{
|
|
@@ -266,9 +271,18 @@ static inline void mm_assign_global_asid
|
|
mm->context.asid_transition = true;
|
|
smp_store_release(&mm->context.global_asid, asid);
|
|
}
|
|
+
|
|
+static inline bool mm_in_asid_transition(struct mm_struct *mm)
|
|
+{
|
|
+ if (!cpu_feature_enabled(X86_FEATURE_INVLPGB))
|
|
+ return false;
|
|
+
|
|
+ return mm && READ_ONCE(mm->context.asid_transition);
|
|
+}
|
|
#else
|
|
static inline u16 mm_global_asid(struct mm_struct *mm) { return 0; }
|
|
static inline void mm_assign_global_asid(struct mm_struct *mm, u16 asid) { }
|
|
+static inline bool mm_in_asid_transition(struct mm_struct *mm) { return false; }
|
|
#endif /* CONFIG_BROADCAST_TLB_FLUSH */
|
|
|
|
#ifdef CONFIG_PARAVIRT
|
|
--- a/arch/x86/mm/tlb.c
|
|
+++ b/arch/x86/mm/tlb.c
|
|
@@ -227,6 +227,20 @@ static void choose_new_asid(struct mm_st
|
|
return;
|
|
}
|
|
|
|
+ /*
|
|
+ * TLB consistency for global ASIDs is maintained with hardware assisted
|
|
+ * remote TLB flushing. Global ASIDs are always up to date.
|
|
+ */
|
|
+ if (cpu_feature_enabled(X86_FEATURE_INVLPGB)) {
|
|
+ u16 global_asid = mm_global_asid(next);
|
|
+
|
|
+ if (global_asid) {
|
|
+ *new_asid = global_asid;
|
|
+ *need_flush = false;
|
|
+ return;
|
|
+ }
|
|
+ }
|
|
+
|
|
if (this_cpu_read(cpu_tlbstate.invalidate_other))
|
|
clear_asid_other();
|
|
|
|
@@ -400,6 +414,23 @@ void mm_free_global_asid(struct mm_struc
|
|
}
|
|
|
|
/*
|
|
+ * Is the mm transitioning from a CPU-local ASID to a global ASID?
|
|
+ */
|
|
+static bool mm_needs_global_asid(struct mm_struct *mm, u16 asid)
|
|
+{
|
|
+ u16 global_asid = mm_global_asid(mm);
|
|
+
|
|
+ if (!cpu_feature_enabled(X86_FEATURE_INVLPGB))
|
|
+ return false;
|
|
+
|
|
+ /* Process is transitioning to a global ASID */
|
|
+ if (global_asid && asid != global_asid)
|
|
+ return true;
|
|
+
|
|
+ return false;
|
|
+}
|
|
+
|
|
+/*
|
|
* Given an ASID, flush the corresponding user ASID. We can delay this
|
|
* until the next time we switch to it.
|
|
*
|
|
@@ -704,7 +735,8 @@ void switch_mm_irqs_off(struct mm_struct
|
|
*/
|
|
if (prev == next) {
|
|
/* Not actually switching mm's */
|
|
- VM_WARN_ON(this_cpu_read(cpu_tlbstate.ctxs[prev_asid].ctx_id) !=
|
|
+ VM_WARN_ON(is_dyn_asid(prev_asid) &&
|
|
+ this_cpu_read(cpu_tlbstate.ctxs[prev_asid].ctx_id) !=
|
|
next->context.ctx_id);
|
|
|
|
/*
|
|
@@ -721,6 +753,20 @@ void switch_mm_irqs_off(struct mm_struct
|
|
!cpumask_test_cpu(cpu, mm_cpumask(next))))
|
|
cpumask_set_cpu(cpu, mm_cpumask(next));
|
|
|
|
+ /* Check if the current mm is transitioning to a global ASID */
|
|
+ if (mm_needs_global_asid(next, prev_asid)) {
|
|
+ next_tlb_gen = atomic64_read(&next->context.tlb_gen);
|
|
+ choose_new_asid(next, next_tlb_gen, &new_asid, &need_flush);
|
|
+ goto reload_tlb;
|
|
+ }
|
|
+
|
|
+ /*
|
|
+ * Broadcast TLB invalidation keeps this ASID up to date
|
|
+ * all the time.
|
|
+ */
|
|
+ if (is_global_asid(prev_asid))
|
|
+ return;
|
|
+
|
|
/*
|
|
* If the CPU is not in lazy TLB mode, we are just switching
|
|
* from one thread in a process to another thread in the same
|
|
@@ -755,6 +801,13 @@ void switch_mm_irqs_off(struct mm_struct
|
|
cond_mitigation(tsk);
|
|
|
|
/*
|
|
+ * Let nmi_uaccess_okay() and finish_asid_transition()
|
|
+ * know that CR3 is changing.
|
|
+ */
|
|
+ this_cpu_write(cpu_tlbstate.loaded_mm, LOADED_MM_SWITCHING);
|
|
+ barrier();
|
|
+
|
|
+ /*
|
|
* Leave this CPU in prev's mm_cpumask. Atomic writes to
|
|
* mm_cpumask can be expensive under contention. The CPU
|
|
* will be removed lazily at TLB flush time.
|
|
@@ -768,14 +821,12 @@ void switch_mm_irqs_off(struct mm_struct
|
|
next_tlb_gen = atomic64_read(&next->context.tlb_gen);
|
|
|
|
choose_new_asid(next, next_tlb_gen, &new_asid, &need_flush);
|
|
-
|
|
- /* Let nmi_uaccess_okay() know that we're changing CR3. */
|
|
- this_cpu_write(cpu_tlbstate.loaded_mm, LOADED_MM_SWITCHING);
|
|
- barrier();
|
|
}
|
|
|
|
+reload_tlb:
|
|
new_lam = mm_lam_cr3_mask(next);
|
|
if (need_flush) {
|
|
+ VM_WARN_ON_ONCE(is_global_asid(new_asid));
|
|
this_cpu_write(cpu_tlbstate.ctxs[new_asid].ctx_id, next->context.ctx_id);
|
|
this_cpu_write(cpu_tlbstate.ctxs[new_asid].tlb_gen, next_tlb_gen);
|
|
load_new_mm_cr3(next->pgd, new_asid, new_lam, true);
|
|
@@ -894,7 +945,7 @@ static void flush_tlb_func(void *info)
|
|
const struct flush_tlb_info *f = info;
|
|
struct mm_struct *loaded_mm = this_cpu_read(cpu_tlbstate.loaded_mm);
|
|
u32 loaded_mm_asid = this_cpu_read(cpu_tlbstate.loaded_mm_asid);
|
|
- u64 local_tlb_gen = this_cpu_read(cpu_tlbstate.ctxs[loaded_mm_asid].tlb_gen);
|
|
+ u64 local_tlb_gen;
|
|
bool local = smp_processor_id() == f->initiating_cpu;
|
|
unsigned long nr_invalidate = 0;
|
|
u64 mm_tlb_gen;
|
|
@@ -917,6 +968,16 @@ static void flush_tlb_func(void *info)
|
|
if (unlikely(loaded_mm == &init_mm))
|
|
return;
|
|
|
|
+ /* Reload the ASID if transitioning into or out of a global ASID */
|
|
+ if (mm_needs_global_asid(loaded_mm, loaded_mm_asid)) {
|
|
+ switch_mm_irqs_off(NULL, loaded_mm, NULL);
|
|
+ loaded_mm_asid = this_cpu_read(cpu_tlbstate.loaded_mm_asid);
|
|
+ }
|
|
+
|
|
+ /* Broadcast ASIDs are always kept up to date with INVLPGB. */
|
|
+ if (is_global_asid(loaded_mm_asid))
|
|
+ return;
|
|
+
|
|
VM_WARN_ON(this_cpu_read(cpu_tlbstate.ctxs[loaded_mm_asid].ctx_id) !=
|
|
loaded_mm->context.ctx_id);
|
|
|
|
@@ -934,6 +995,8 @@ static void flush_tlb_func(void *info)
|
|
return;
|
|
}
|
|
|
|
+ local_tlb_gen = this_cpu_read(cpu_tlbstate.ctxs[loaded_mm_asid].tlb_gen);
|
|
+
|
|
if (unlikely(f->new_tlb_gen != TLB_GENERATION_INVALID &&
|
|
f->new_tlb_gen <= local_tlb_gen)) {
|
|
/*
|
|
@@ -1101,7 +1164,7 @@ STATIC_NOPV void native_flush_tlb_multi(
|
|
* up on the new contents of what used to be page tables, while
|
|
* doing a speculative memory access.
|
|
*/
|
|
- if (info->freed_tables)
|
|
+ if (info->freed_tables || mm_in_asid_transition(info->mm))
|
|
on_each_cpu_mask(cpumask, flush_tlb_func, (void *)info, true);
|
|
else
|
|
on_each_cpu_cond_mask(should_flush_tlb, flush_tlb_func,
|