Skip to content

Commit 82e0191

Browse files
Suzuki K Poulose authored and ctmarinas committed
arm64: Support systems without FP/ASIMD
The arm64 kernel assumes that FP/ASIMD units are always present and accesses the FP/ASIMD-specific registers unconditionally. This can cause problems when they are absent. This patch adds support for the kernel to handle systems without FP/ASIMD by skipping the register accesses within the kernel. For KVM, we trap guest accesses to FP/ASIMD and inject an undefined instruction exception into the VM. Callers of the exported kernel_neon_begin_partial() should make sure that FP/ASIMD is supported. Cc: Will Deacon <[email protected]> Cc: Christoffer Dall <[email protected]> Cc: Ard Biesheuvel <[email protected]> Signed-off-by: Suzuki K Poulose <[email protected]> Reviewed-by: Marc Zyngier <[email protected]> [[email protected]: add comment on the ARM64_HAS_NO_FPSIMD conflict and the new location] Signed-off-by: Catalin Marinas <[email protected]>
1 parent a4023f6 commit 82e0191

File tree

7 files changed

+65
-4
lines changed

7 files changed

+65
-4
lines changed

arch/arm64/include/asm/cpufeature.h

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,8 +38,13 @@
3838
#define ARM64_HAS_32BIT_EL0 13
3939
#define ARM64_HYP_OFFSET_LOW 14
4040
#define ARM64_MISMATCHED_CACHE_LINE_SIZE 15
41+
/*
42+
* The macro below will be moved to asm/cpucaps.h together with the
43+
* ARM64_NCAPS update.
44+
*/
45+
#define ARM64_HAS_NO_FPSIMD 16
4146

42-
#define ARM64_NCAPS 16
47+
#define ARM64_NCAPS 17
4348

4449
#ifndef __ASSEMBLY__
4550

@@ -231,6 +236,11 @@ static inline bool system_supports_mixed_endian_el0(void)
231236
return id_aa64mmfr0_mixed_endian_el0(read_system_reg(SYS_ID_AA64MMFR0_EL1));
232237
}
233238

239+
static inline bool system_supports_fpsimd(void)
240+
{
241+
return !cpus_have_const_cap(ARM64_HAS_NO_FPSIMD);
242+
}
243+
234244
#endif /* __ASSEMBLY__ */
235245

236246
#endif

arch/arm64/include/asm/neon.h

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,8 +9,9 @@
99
*/
1010

1111
#include <linux/types.h>
12+
#include <asm/fpsimd.h>
1213

13-
#define cpu_has_neon() (1)
14+
#define cpu_has_neon() system_supports_fpsimd()
1415

1516
#define kernel_neon_begin() kernel_neon_begin_partial(32)
1617

arch/arm64/kernel/cpufeature.c

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -746,6 +746,14 @@ static bool hyp_offset_low(const struct arm64_cpu_capabilities *entry,
746746
return idmap_addr > GENMASK(VA_BITS - 2, 0) && !is_kernel_in_hyp_mode();
747747
}
748748

749+
static bool has_no_fpsimd(const struct arm64_cpu_capabilities *entry, int __unused)
750+
{
751+
u64 pfr0 = read_system_reg(SYS_ID_AA64PFR0_EL1);
752+
753+
return cpuid_feature_extract_signed_field(pfr0,
754+
ID_AA64PFR0_FP_SHIFT) < 0;
755+
}
756+
749757
static const struct arm64_cpu_capabilities arm64_features[] = {
750758
{
751759
.desc = "GIC system register CPU interface",
@@ -829,6 +837,13 @@ static const struct arm64_cpu_capabilities arm64_features[] = {
829837
.def_scope = SCOPE_SYSTEM,
830838
.matches = hyp_offset_low,
831839
},
840+
{
841+
/* FP/SIMD is not implemented */
842+
.capability = ARM64_HAS_NO_FPSIMD,
843+
.def_scope = SCOPE_SYSTEM,
844+
.min_field_value = 0,
845+
.matches = has_no_fpsimd,
846+
},
832847
{},
833848
};
834849

arch/arm64/kernel/fpsimd.c

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -127,6 +127,8 @@ void do_fpsimd_exc(unsigned int esr, struct pt_regs *regs)
127127

128128
void fpsimd_thread_switch(struct task_struct *next)
129129
{
130+
if (!system_supports_fpsimd())
131+
return;
130132
/*
131133
* Save the current FPSIMD state to memory, but only if whatever is in
132134
* the registers is in fact the most recent userland FPSIMD state of
@@ -157,6 +159,8 @@ void fpsimd_thread_switch(struct task_struct *next)
157159

158160
void fpsimd_flush_thread(void)
159161
{
162+
if (!system_supports_fpsimd())
163+
return;
160164
memset(&current->thread.fpsimd_state, 0, sizeof(struct fpsimd_state));
161165
fpsimd_flush_task_state(current);
162166
set_thread_flag(TIF_FOREIGN_FPSTATE);
@@ -168,6 +172,8 @@ void fpsimd_flush_thread(void)
168172
*/
169173
void fpsimd_preserve_current_state(void)
170174
{
175+
if (!system_supports_fpsimd())
176+
return;
171177
preempt_disable();
172178
if (!test_thread_flag(TIF_FOREIGN_FPSTATE))
173179
fpsimd_save_state(&current->thread.fpsimd_state);
@@ -181,6 +187,8 @@ void fpsimd_preserve_current_state(void)
181187
*/
182188
void fpsimd_restore_current_state(void)
183189
{
190+
if (!system_supports_fpsimd())
191+
return;
184192
preempt_disable();
185193
if (test_and_clear_thread_flag(TIF_FOREIGN_FPSTATE)) {
186194
struct fpsimd_state *st = &current->thread.fpsimd_state;
@@ -199,6 +207,8 @@ void fpsimd_restore_current_state(void)
199207
*/
200208
void fpsimd_update_current_state(struct fpsimd_state *state)
201209
{
210+
if (!system_supports_fpsimd())
211+
return;
202212
preempt_disable();
203213
fpsimd_load_state(state);
204214
if (test_and_clear_thread_flag(TIF_FOREIGN_FPSTATE)) {
@@ -228,6 +238,8 @@ static DEFINE_PER_CPU(struct fpsimd_partial_state, softirq_fpsimdstate);
228238
*/
229239
void kernel_neon_begin_partial(u32 num_regs)
230240
{
241+
if (WARN_ON(!system_supports_fpsimd()))
242+
return;
231243
if (in_interrupt()) {
232244
struct fpsimd_partial_state *s = this_cpu_ptr(
233245
in_irq() ? &hardirq_fpsimdstate : &softirq_fpsimdstate);
@@ -252,6 +264,8 @@ EXPORT_SYMBOL(kernel_neon_begin_partial);
252264

253265
void kernel_neon_end(void)
254266
{
267+
if (!system_supports_fpsimd())
268+
return;
255269
if (in_interrupt()) {
256270
struct fpsimd_partial_state *s = this_cpu_ptr(
257271
in_irq() ? &hardirq_fpsimdstate : &softirq_fpsimdstate);

arch/arm64/kvm/handle_exit.c

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,16 @@ static int handle_smc(struct kvm_vcpu *vcpu, struct kvm_run *run)
5757
return 1;
5858
}
5959

60+
/*
61+
* Guest accesses to FP/ASIMD registers are routed to this handler only
62+
* when the system doesn't support FP/ASIMD.
63+
*/
64+
static int handle_no_fpsimd(struct kvm_vcpu *vcpu, struct kvm_run *run)
65+
{
66+
kvm_inject_undefined(vcpu);
67+
return 1;
68+
}
69+
6070
/**
6171
* kvm_handle_wfx - handle a wait-for-interrupts or wait-for-event
6272
* instruction executed by a guest
@@ -144,6 +154,7 @@ static exit_handle_fn arm_exit_handlers[] = {
144154
[ESR_ELx_EC_BREAKPT_LOW]= kvm_handle_guest_debug,
145155
[ESR_ELx_EC_BKPT32] = kvm_handle_guest_debug,
146156
[ESR_ELx_EC_BRK64] = kvm_handle_guest_debug,
157+
[ESR_ELx_EC_FP_ASIMD] = handle_no_fpsimd,
147158
};
148159

149160
static exit_handle_fn kvm_get_exit_handler(struct kvm_vcpu *vcpu)

arch/arm64/kvm/hyp/hyp-entry.S

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -106,9 +106,16 @@ el1_trap:
106106
* x0: ESR_EC
107107
*/
108108

109-
/* Guest accessed VFP/SIMD registers, save host, restore Guest */
109+
/*
110+
* We trap the first access to the FP/SIMD to save the host context
111+
* and restore the guest context lazily.
112+
* If FP/SIMD is not implemented, handle the trap and inject an
113+
* undefined instruction exception to the guest.
114+
*/
115+
alternative_if_not ARM64_HAS_NO_FPSIMD
110116
cmp x0, #ESR_ELx_EC_FP_ASIMD
111117
b.eq __fpsimd_guest_restore
118+
alternative_else_nop_endif
112119

113120
mrs x1, tpidr_el2
114121
mov x0, #ARM_EXCEPTION_TRAP

arch/arm64/kvm/hyp/switch.c

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@
2121
#include <asm/kvm_asm.h>
2222
#include <asm/kvm_emulate.h>
2323
#include <asm/kvm_hyp.h>
24+
#include <asm/fpsimd.h>
2425

2526
static bool __hyp_text __fpsimd_enabled_nvhe(void)
2627
{
@@ -76,9 +77,11 @@ static void __hyp_text __activate_traps(struct kvm_vcpu *vcpu)
7677
* traps are only taken to EL2 if the operation would not otherwise
7778
* trap to EL1. Therefore, always make sure that for 32-bit guests,
7879
* we set FPEXC.EN to prevent traps to EL1, when setting the TFP bit.
80+
* If FP/ASIMD is not implemented, FPEXC is UNDEFINED and any access to
81+
* it will cause an exception.
7982
*/
8083
val = vcpu->arch.hcr_el2;
81-
if (!(val & HCR_RW)) {
84+
if (!(val & HCR_RW) && system_supports_fpsimd()) {
8285
write_sysreg(1 << 30, fpexc32_el2);
8386
isb();
8487
}

0 commit comments

Comments
 (0)