Commit 9b19700e authored by Ard Biesheuvel, committed by Will Deacon

arm64: fpsimd: Drop unneeded 'busy' flag

Kernel mode NEON will preserve the user mode FPSIMD state by saving it
into the task struct before clobbering the registers. In order to avoid
the need for preserving kernel mode state too, we disallow nested use of
kernel mode NEON, i.e., use in softirq context while the interrupted
task context was using kernel mode NEON too.

Originally, this policy was implemented using a per-CPU flag which was
exposed via may_use_simd(), requiring the users of the kernel mode NEON
to deal with the possibility that it might return false, and to maintain both NEON
and non-NEON code paths. This policy was changed by commit
13150149 ("arm64: fpsimd: run kernel mode NEON with softirqs
disabled"), and now, softirq processing is disabled entirely instead,
and so may_use_simd() can never fail when called from task or softirq
context.

This means we can drop the fpsimd_context_busy flag entirely, and
instead, ensure that we disable softirq processing in places where we
formerly relied on the flag for preventing races in the FPSIMD preserve
routines.
Signed-off-by: Ard Biesheuvel <ardb@kernel.org>
Reviewed-by: Mark Brown <broonie@kernel.org>
Tested-by: Geert Uytterhoeven <geert+renesas@glider.be>
Link: https://lore.kernel.org/r/20231208113218.3001940-7-ardb@google.com
[will: Folded in fix from CAMj1kXFhzbJRyWHELCivQW1yJaF=p07LLtbuyXYX3G1WtsdyQg@mail.gmail.com]
Signed-off-by: Will Deacon <will@kernel.org>
parent 2cc14f52
...@@ -12,8 +12,6 @@ ...@@ -12,8 +12,6 @@
#include <linux/preempt.h> #include <linux/preempt.h>
#include <linux/types.h> #include <linux/types.h>
DECLARE_PER_CPU(bool, fpsimd_context_busy);
#ifdef CONFIG_KERNEL_MODE_NEON #ifdef CONFIG_KERNEL_MODE_NEON
/* /*
...@@ -28,17 +26,10 @@ static __must_check inline bool may_use_simd(void) ...@@ -28,17 +26,10 @@ static __must_check inline bool may_use_simd(void)
/* /*
* We must make sure that the SVE has been initialized properly * We must make sure that the SVE has been initialized properly
* before using the SIMD in kernel. * before using the SIMD in kernel.
* fpsimd_context_busy is only set while preemption is disabled,
* and is clear whenever preemption is enabled. Since
* this_cpu_read() is atomic w.r.t. preemption, fpsimd_context_busy
* cannot change under our feet -- if it's set we cannot be
* migrated, and if it's clear we cannot be migrated to a CPU
* where it is set.
*/ */
return !WARN_ON(!system_capabilities_finalized()) && return !WARN_ON(!system_capabilities_finalized()) &&
system_supports_fpsimd() && system_supports_fpsimd() &&
!in_hardirq() && !irqs_disabled() && !in_nmi() && !in_hardirq() && !irqs_disabled() && !in_nmi();
!this_cpu_read(fpsimd_context_busy);
} }
#else /* ! CONFIG_KERNEL_MODE_NEON */ #else /* ! CONFIG_KERNEL_MODE_NEON */
......
...@@ -85,13 +85,13 @@ ...@@ -85,13 +85,13 @@
* softirq kicks in. Upon vcpu_put(), KVM will save the vcpu FP state and * softirq kicks in. Upon vcpu_put(), KVM will save the vcpu FP state and
* flag the register state as invalid. * flag the register state as invalid.
* *
* In order to allow softirq handlers to use FPSIMD, kernel_neon_begin() may * In order to allow softirq handlers to use FPSIMD, kernel_neon_begin() may be
* save the task's FPSIMD context back to task_struct from softirq context. * called from softirq context, which will save the task's FPSIMD context back
* To prevent this from racing with the manipulation of the task's FPSIMD state * to task_struct. To prevent this from racing with the manipulation of the
* from task context and thereby corrupting the state, it is necessary to * task's FPSIMD state from task context and thereby corrupting the state, it
* protect any manipulation of a task's fpsimd_state or TIF_FOREIGN_FPSTATE * is necessary to protect any manipulation of a task's fpsimd_state or
* flag with {, __}get_cpu_fpsimd_context(). This will still allow softirqs to * TIF_FOREIGN_FPSTATE flag with get_cpu_fpsimd_context(), which will suspend
* run but prevent them to use FPSIMD. * softirq servicing entirely until put_cpu_fpsimd_context() is called.
* *
* For a certain task, the sequence may look something like this: * For a certain task, the sequence may look something like this:
* - the task gets scheduled in; if both the task's fpsimd_cpu field * - the task gets scheduled in; if both the task's fpsimd_cpu field
...@@ -209,27 +209,14 @@ static inline void sme_free(struct task_struct *t) { } ...@@ -209,27 +209,14 @@ static inline void sme_free(struct task_struct *t) { }
#endif #endif
DEFINE_PER_CPU(bool, fpsimd_context_busy);
EXPORT_PER_CPU_SYMBOL(fpsimd_context_busy);
static void fpsimd_bind_task_to_cpu(void); static void fpsimd_bind_task_to_cpu(void);
static void __get_cpu_fpsimd_context(void)
{
bool busy = __this_cpu_xchg(fpsimd_context_busy, true);
WARN_ON(busy);
}
/* /*
* Claim ownership of the CPU FPSIMD context for use by the calling context. * Claim ownership of the CPU FPSIMD context for use by the calling context.
* *
* The caller may freely manipulate the FPSIMD context metadata until * The caller may freely manipulate the FPSIMD context metadata until
* put_cpu_fpsimd_context() is called. * put_cpu_fpsimd_context() is called.
* *
* The double-underscore version must only be called if you know the task
* can't be preempted.
*
* On RT kernels local_bh_disable() is not sufficient because it only * On RT kernels local_bh_disable() is not sufficient because it only
* serializes soft interrupt related sections via a local lock, but stays * serializes soft interrupt related sections via a local lock, but stays
* preemptible. Disabling preemption is the right choice here as bottom * preemptible. Disabling preemption is the right choice here as bottom
...@@ -242,14 +229,6 @@ static void get_cpu_fpsimd_context(void) ...@@ -242,14 +229,6 @@ static void get_cpu_fpsimd_context(void)
local_bh_disable(); local_bh_disable();
else else
preempt_disable(); preempt_disable();
__get_cpu_fpsimd_context();
}
static void __put_cpu_fpsimd_context(void)
{
bool busy = __this_cpu_xchg(fpsimd_context_busy, false);
WARN_ON(!busy); /* No matching get_cpu_fpsimd_context()? */
} }
/* /*
...@@ -261,18 +240,12 @@ static void __put_cpu_fpsimd_context(void) ...@@ -261,18 +240,12 @@ static void __put_cpu_fpsimd_context(void)
*/ */
static void put_cpu_fpsimd_context(void) static void put_cpu_fpsimd_context(void)
{ {
__put_cpu_fpsimd_context();
if (!IS_ENABLED(CONFIG_PREEMPT_RT)) if (!IS_ENABLED(CONFIG_PREEMPT_RT))
local_bh_enable(); local_bh_enable();
else else
preempt_enable(); preempt_enable();
} }
static bool have_cpu_fpsimd_context(void)
{
return !preemptible() && __this_cpu_read(fpsimd_context_busy);
}
unsigned int task_get_vl(const struct task_struct *task, enum vec_type type) unsigned int task_get_vl(const struct task_struct *task, enum vec_type type)
{ {
return task->thread.vl[type]; return task->thread.vl[type];
...@@ -383,7 +356,7 @@ static void task_fpsimd_load(void) ...@@ -383,7 +356,7 @@ static void task_fpsimd_load(void)
bool restore_ffr; bool restore_ffr;
WARN_ON(!system_supports_fpsimd()); WARN_ON(!system_supports_fpsimd());
WARN_ON(!have_cpu_fpsimd_context()); WARN_ON(preemptible());
if (system_supports_sve() || system_supports_sme()) { if (system_supports_sve() || system_supports_sme()) {
switch (current->thread.fp_type) { switch (current->thread.fp_type) {
...@@ -467,7 +440,7 @@ static void fpsimd_save(void) ...@@ -467,7 +440,7 @@ static void fpsimd_save(void)
unsigned int vl; unsigned int vl;
WARN_ON(!system_supports_fpsimd()); WARN_ON(!system_supports_fpsimd());
WARN_ON(!have_cpu_fpsimd_context()); WARN_ON(preemptible());
if (test_thread_flag(TIF_FOREIGN_FPSTATE)) if (test_thread_flag(TIF_FOREIGN_FPSTATE))
return; return;
...@@ -1507,7 +1480,7 @@ void fpsimd_thread_switch(struct task_struct *next) ...@@ -1507,7 +1480,7 @@ void fpsimd_thread_switch(struct task_struct *next)
if (!system_supports_fpsimd()) if (!system_supports_fpsimd())
return; return;
__get_cpu_fpsimd_context(); WARN_ON_ONCE(!irqs_disabled());
/* Save unsaved fpsimd state, if any: */ /* Save unsaved fpsimd state, if any: */
fpsimd_save(); fpsimd_save();
...@@ -1523,8 +1496,6 @@ void fpsimd_thread_switch(struct task_struct *next) ...@@ -1523,8 +1496,6 @@ void fpsimd_thread_switch(struct task_struct *next)
update_tsk_thread_flag(next, TIF_FOREIGN_FPSTATE, update_tsk_thread_flag(next, TIF_FOREIGN_FPSTATE,
wrong_task || wrong_cpu); wrong_task || wrong_cpu);
__put_cpu_fpsimd_context();
} }
static void fpsimd_flush_thread_vl(enum vec_type type) static void fpsimd_flush_thread_vl(enum vec_type type)
...@@ -1826,13 +1797,15 @@ static void fpsimd_flush_cpu_state(void) ...@@ -1826,13 +1797,15 @@ static void fpsimd_flush_cpu_state(void)
*/ */
void fpsimd_save_and_flush_cpu_state(void) void fpsimd_save_and_flush_cpu_state(void)
{ {
unsigned long flags;
if (!system_supports_fpsimd()) if (!system_supports_fpsimd())
return; return;
WARN_ON(preemptible()); WARN_ON(preemptible());
__get_cpu_fpsimd_context(); local_irq_save(flags);
fpsimd_save(); fpsimd_save();
fpsimd_flush_cpu_state(); fpsimd_flush_cpu_state();
__put_cpu_fpsimd_context(); local_irq_restore(flags);
} }
#ifdef CONFIG_KERNEL_MODE_NEON #ifdef CONFIG_KERNEL_MODE_NEON
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment