[kvm-unit-tests PATCH v3 3/4] riscv: lib: Add SSE assembly entry handling
Clément Léger
cleger at rivosinc.com
Mon Nov 25 06:13:01 PST 2024
On 25/11/2024 14:50, Andrew Jones wrote:
> On Mon, Nov 25, 2024 at 12:54:47PM +0100, Clément Léger wrote:
>> Add a SSE entry assembly code to handle SSE events. Events should be
>> registered with a struct sse_handler_arg containing a correct stack and
>> handler function.
>>
>> Signed-off-by: Clément Léger <cleger at rivosinc.com>
>> ---
>> riscv/Makefile | 1 +
>> lib/riscv/asm/sse.h | 16 +++++++
>> lib/riscv/sse-entry.S | 100 ++++++++++++++++++++++++++++++++++++++++
>> lib/riscv/asm-offsets.c | 9 ++++
>> 4 files changed, 126 insertions(+)
>> create mode 100644 lib/riscv/asm/sse.h
>> create mode 100644 lib/riscv/sse-entry.S
>>
>> diff --git a/riscv/Makefile b/riscv/Makefile
>> index 5b5e157c..c278ec5c 100644
>> --- a/riscv/Makefile
>> +++ b/riscv/Makefile
>> @@ -41,6 +41,7 @@ cflatobjs += lib/riscv/sbi.o
>> cflatobjs += lib/riscv/setjmp.o
>> cflatobjs += lib/riscv/setup.o
>> cflatobjs += lib/riscv/smp.o
>> +cflatobjs += lib/riscv/sse-entry.o
>> cflatobjs += lib/riscv/stack.o
>> cflatobjs += lib/riscv/timer.o
>> ifeq ($(ARCH),riscv32)
>> diff --git a/lib/riscv/asm/sse.h b/lib/riscv/asm/sse.h
>> new file mode 100644
>> index 00000000..557f6680
>> --- /dev/null
>> +++ b/lib/riscv/asm/sse.h
>> @@ -0,0 +1,16 @@
>> +/* SPDX-License-Identifier: GPL-2.0-only */
>> +#ifndef _ASMRISCV_SSE_H_
>> +#define _ASMRISCV_SSE_H_
>> +
>> +typedef void (*sse_handler_fn)(void *data, struct pt_regs *regs, unsigned int hartid);
>> +
>> +struct sse_handler_arg {
>> + unsigned long reg_tmp;
>> + sse_handler_fn handler;
>> + void *handler_data;
>> + void *stack;
>> +};
>
> It still feels wrong to put a test-specific struct definition in lib. It's
> test-specific, because the SSE register function doesn't define it
> (otherwise we'd put the definition in lib/riscv/asm/sbi.h with the rest of
> the defines that come straight from the spec). Now, if we foresee using
> sse_event_register() outside of SBI SSE testing, then it would make sense
> to come up with a common struct, but it doesn't look like we have plans
> for that now, and sse_event_register() isn't in lib/riscv/sbi.c yet.
>
>> +
>> +extern void sse_entry(void);
>> +
>> +#endif /* _ASMRISCV_SSE_H_ */
>> diff --git a/lib/riscv/sse-entry.S b/lib/riscv/sse-entry.S
>> new file mode 100644
>> index 00000000..f1244e17
>> --- /dev/null
>> +++ b/lib/riscv/sse-entry.S
>> @@ -0,0 +1,100 @@
>> +/* SPDX-License-Identifier: GPL-2.0-only */
>> +/*
>> + * SBI SSE entry code
>> + *
>> + * Copyright (C) 2024, Rivos Inc., Clément Léger <cleger at rivosinc.com>
>> + */
>> +#include <asm/asm.h>
>> +#include <asm/asm-offsets.h>
>> +#include <asm/csr.h>
>> +
>> +.global sse_entry
>> +sse_entry:
>
> sse_entry is also test-specific unless we export sse_event_register().
>
>> + /* Save stack temporarily */
>> + REG_S sp, SSE_REG_TMP(a7)
>> + /* Set entry stack */
>> + REG_L sp, SSE_HANDLER_STACK(a7)
>> +
>> + addi sp, sp, -(PT_SIZE)
>> + REG_S ra, PT_RA(sp)
>> + REG_S s0, PT_S0(sp)
>> + REG_S s1, PT_S1(sp)
>> + REG_S s2, PT_S2(sp)
>> + REG_S s3, PT_S3(sp)
>> + REG_S s4, PT_S4(sp)
>> + REG_S s5, PT_S5(sp)
>> + REG_S s6, PT_S6(sp)
>> + REG_S s7, PT_S7(sp)
>> + REG_S s8, PT_S8(sp)
>> + REG_S s9, PT_S9(sp)
>> + REG_S s10, PT_S10(sp)
>> + REG_S s11, PT_S11(sp)
>> + REG_S tp, PT_TP(sp)
>> + REG_S t0, PT_T0(sp)
>> + REG_S t1, PT_T1(sp)
>> + REG_S t2, PT_T2(sp)
>> + REG_S t3, PT_T3(sp)
>> + REG_S t4, PT_T4(sp)
>> + REG_S t5, PT_T5(sp)
>> + REG_S t6, PT_T6(sp)
>> + REG_S gp, PT_GP(sp)
>> + REG_S a0, PT_A0(sp)
>> + REG_S a1, PT_A1(sp)
>> + REG_S a2, PT_A2(sp)
>> + REG_S a3, PT_A3(sp)
>> + REG_S a4, PT_A4(sp)
>> + REG_S a5, PT_A5(sp)
>> + csrr a1, CSR_SEPC
>> + REG_S a1, PT_EPC(sp)
>> + csrr a2, CSR_SSTATUS
>> + REG_S a2, PT_STATUS(sp)
>> +
>> + REG_L a0, SSE_REG_TMP(a7)
>> + REG_S a0, PT_SP(sp)
>> +
>> + REG_L t0, SSE_HANDLER(a7)
>> + REG_L a0, SSE_HANDLER_DATA(a7)
>> + mv a1, sp
>> + mv a2, a6
>> + jalr t0
>> +
>> +
>> + REG_L a1, PT_EPC(sp)
>> + REG_L a2, PT_STATUS(sp)
>> + csrw CSR_SEPC, a1
>> + csrw CSR_SSTATUS, a2
>> +
>> + REG_L ra, PT_RA(sp)
>> + REG_L s0, PT_S0(sp)
>> + REG_L s1, PT_S1(sp)
>> + REG_L s2, PT_S2(sp)
>> + REG_L s3, PT_S3(sp)
>> + REG_L s4, PT_S4(sp)
>> + REG_L s5, PT_S5(sp)
>> + REG_L s6, PT_S6(sp)
>> + REG_L s7, PT_S7(sp)
>> + REG_L s8, PT_S8(sp)
>> + REG_L s9, PT_S9(sp)
>> + REG_L s10, PT_S10(sp)
>> + REG_L s11, PT_S11(sp)
>> + REG_L tp, PT_TP(sp)
>> + REG_L t0, PT_T0(sp)
>> + REG_L t1, PT_T1(sp)
>> + REG_L t2, PT_T2(sp)
>> + REG_L t3, PT_T3(sp)
>> + REG_L t4, PT_T4(sp)
>> + REG_L t5, PT_T5(sp)
>> + REG_L t6, PT_T6(sp)
>> + REG_L gp, PT_GP(sp)
>> + REG_L a0, PT_A0(sp)
>> + REG_L a1, PT_A1(sp)
>> + REG_L a2, PT_A2(sp)
>> + REG_L a3, PT_A3(sp)
>> + REG_L a4, PT_A4(sp)
>> + REG_L a5, PT_A5(sp)
>> +
>> + REG_L sp, PT_SP(sp)
>> +
>> + li a7, ASM_SBI_EXT_SSE
>> + li a6, ASM_SBI_EXT_SSE_COMPLETE
>> + ecall
>> diff --git a/lib/riscv/asm-offsets.c b/lib/riscv/asm-offsets.c
>> index 6c511c14..b3465eeb 100644
>> --- a/lib/riscv/asm-offsets.c
>> +++ b/lib/riscv/asm-offsets.c
>> @@ -3,7 +3,9 @@
>> #include <elf.h>
>> #include <asm/processor.h>
>> #include <asm/ptrace.h>
>> +#include <asm/sbi.h>
>> #include <asm/smp.h>
>> +#include <asm/sse.h>
>>
>> int main(void)
>> {
>> @@ -63,5 +65,12 @@ int main(void)
>> OFFSET(THREAD_INFO_HARTID, thread_info, hartid);
>> DEFINE(THREAD_INFO_SIZE, sizeof(struct thread_info));
>>
>> + OFFSET(SSE_REG_TMP, sse_handler_arg, reg_tmp);
>> + OFFSET(SSE_HANDLER, sse_handler_arg, handler);
>> + OFFSET(SSE_HANDLER_DATA, sse_handler_arg, handler_data);
>> + OFFSET(SSE_HANDLER_STACK, sse_handler_arg, stack);
>
> I think I prefer just hard coding the offsets in defines and then using
> static asserts to ensure they stay as expected. Below is a diff I applied
> which moves some stuff around. Let me know what you think.
>
> Thanks,
> drew
>
>> + DEFINE(ASM_SBI_EXT_SSE, SBI_EXT_SSE);
>> + DEFINE(ASM_SBI_EXT_SSE_COMPLETE, SBI_EXT_SSE_COMPLETE);
>> +
>> return 0;
>> }
>> --
>> 2.45.2
>>
>
> diff --git a/lib/riscv/asm-offsets.c b/lib/riscv/asm-offsets.c
> index b3465eebbaa2..402eb4d90a8e 100644
> --- a/lib/riscv/asm-offsets.c
> +++ b/lib/riscv/asm-offsets.c
> @@ -5,7 +5,6 @@
> #include <asm/ptrace.h>
> #include <asm/sbi.h>
> #include <asm/smp.h>
> -#include <asm/sse.h>
>
> int main(void)
> {
> @@ -65,10 +64,8 @@ int main(void)
> OFFSET(THREAD_INFO_HARTID, thread_info, hartid);
> DEFINE(THREAD_INFO_SIZE, sizeof(struct thread_info));
>
> - OFFSET(SSE_REG_TMP, sse_handler_arg, reg_tmp);
> - OFFSET(SSE_HANDLER, sse_handler_arg, handler);
> - OFFSET(SSE_HANDLER_DATA, sse_handler_arg, handler_data);
> - OFFSET(SSE_HANDLER_STACK, sse_handler_arg, stack);
> + DEFINE(ASM_SBI_EXT_HSM, SBI_EXT_HSM);
> + DEFINE(ASM_SBI_EXT_HSM_HART_STOP, SBI_EXT_HSM_HART_STOP);
> DEFINE(ASM_SBI_EXT_SSE, SBI_EXT_SSE);
> DEFINE(ASM_SBI_EXT_SSE_COMPLETE, SBI_EXT_SSE_COMPLETE);
>
> diff --git a/lib/riscv/asm/sse.h b/lib/riscv/asm/sse.h
> deleted file mode 100644
> index 557f6680e90c..000000000000
> --- a/lib/riscv/asm/sse.h
> +++ /dev/null
> @@ -1,16 +0,0 @@
> -/* SPDX-License-Identifier: GPL-2.0-only */
> -#ifndef _ASMRISCV_SSE_H_
> -#define _ASMRISCV_SSE_H_
> -
> -typedef void (*sse_handler_fn)(void *data, struct pt_regs *regs, unsigned int hartid);
> -
> -struct sse_handler_arg {
> - unsigned long reg_tmp;
> - sse_handler_fn handler;
> - void *handler_data;
> - void *stack;
> -};
> -
> -extern void sse_entry(void);
> -
> -#endif /* _ASMRISCV_SSE_H_ */
> diff --git a/lib/riscv/sse-entry.S b/lib/riscv/sse-entry.S
> deleted file mode 100644
> index f1244e17fe08..000000000000
> --- a/lib/riscv/sse-entry.S
> +++ /dev/null
> @@ -1,100 +0,0 @@
> -/* SPDX-License-Identifier: GPL-2.0-only */
> -/*
> - * SBI SSE entry code
> - *
> - * Copyright (C) 2024, Rivos Inc., Clément Léger <cleger at rivosinc.com>
> - */
> -#include <asm/asm.h>
> -#include <asm/asm-offsets.h>
> -#include <asm/csr.h>
> -
> -.global sse_entry
> -sse_entry:
> - /* Save stack temporarily */
> - REG_S sp, SSE_REG_TMP(a7)
> - /* Set entry stack */
> - REG_L sp, SSE_HANDLER_STACK(a7)
> -
> - addi sp, sp, -(PT_SIZE)
> - REG_S ra, PT_RA(sp)
> - REG_S s0, PT_S0(sp)
> - REG_S s1, PT_S1(sp)
> - REG_S s2, PT_S2(sp)
> - REG_S s3, PT_S3(sp)
> - REG_S s4, PT_S4(sp)
> - REG_S s5, PT_S5(sp)
> - REG_S s6, PT_S6(sp)
> - REG_S s7, PT_S7(sp)
> - REG_S s8, PT_S8(sp)
> - REG_S s9, PT_S9(sp)
> - REG_S s10, PT_S10(sp)
> - REG_S s11, PT_S11(sp)
> - REG_S tp, PT_TP(sp)
> - REG_S t0, PT_T0(sp)
> - REG_S t1, PT_T1(sp)
> - REG_S t2, PT_T2(sp)
> - REG_S t3, PT_T3(sp)
> - REG_S t4, PT_T4(sp)
> - REG_S t5, PT_T5(sp)
> - REG_S t6, PT_T6(sp)
> - REG_S gp, PT_GP(sp)
> - REG_S a0, PT_A0(sp)
> - REG_S a1, PT_A1(sp)
> - REG_S a2, PT_A2(sp)
> - REG_S a3, PT_A3(sp)
> - REG_S a4, PT_A4(sp)
> - REG_S a5, PT_A5(sp)
> - csrr a1, CSR_SEPC
> - REG_S a1, PT_EPC(sp)
> - csrr a2, CSR_SSTATUS
> - REG_S a2, PT_STATUS(sp)
> -
> - REG_L a0, SSE_REG_TMP(a7)
> - REG_S a0, PT_SP(sp)
> -
> - REG_L t0, SSE_HANDLER(a7)
> - REG_L a0, SSE_HANDLER_DATA(a7)
> - mv a1, sp
> - mv a2, a6
> - jalr t0
> -
> -
> - REG_L a1, PT_EPC(sp)
> - REG_L a2, PT_STATUS(sp)
> - csrw CSR_SEPC, a1
> - csrw CSR_SSTATUS, a2
> -
> - REG_L ra, PT_RA(sp)
> - REG_L s0, PT_S0(sp)
> - REG_L s1, PT_S1(sp)
> - REG_L s2, PT_S2(sp)
> - REG_L s3, PT_S3(sp)
> - REG_L s4, PT_S4(sp)
> - REG_L s5, PT_S5(sp)
> - REG_L s6, PT_S6(sp)
> - REG_L s7, PT_S7(sp)
> - REG_L s8, PT_S8(sp)
> - REG_L s9, PT_S9(sp)
> - REG_L s10, PT_S10(sp)
> - REG_L s11, PT_S11(sp)
> - REG_L tp, PT_TP(sp)
> - REG_L t0, PT_T0(sp)
> - REG_L t1, PT_T1(sp)
> - REG_L t2, PT_T2(sp)
> - REG_L t3, PT_T3(sp)
> - REG_L t4, PT_T4(sp)
> - REG_L t5, PT_T5(sp)
> - REG_L t6, PT_T6(sp)
> - REG_L gp, PT_GP(sp)
> - REG_L a0, PT_A0(sp)
> - REG_L a1, PT_A1(sp)
> - REG_L a2, PT_A2(sp)
> - REG_L a3, PT_A3(sp)
> - REG_L a4, PT_A4(sp)
> - REG_L a5, PT_A5(sp)
> -
> - REG_L sp, PT_SP(sp)
> -
> - li a7, ASM_SBI_EXT_SSE
> - li a6, ASM_SBI_EXT_SSE_COMPLETE
> - ecall
> diff --git a/riscv/Makefile b/riscv/Makefile
> index 81b75ad52411..62a2efc18492 100644
> --- a/riscv/Makefile
> +++ b/riscv/Makefile
> @@ -41,7 +41,6 @@ cflatobjs += lib/riscv/sbi.o
> cflatobjs += lib/riscv/setjmp.o
> cflatobjs += lib/riscv/setup.o
> cflatobjs += lib/riscv/smp.o
> -cflatobjs += lib/riscv/sse-entry.o
> cflatobjs += lib/riscv/stack.o
> cflatobjs += lib/riscv/timer.o
> ifeq ($(ARCH),riscv32)
> diff --git a/riscv/sbi-asm.S b/riscv/sbi-asm.S
> index 923c2ceca5db..5c50606e9940 100644
> --- a/riscv/sbi-asm.S
> +++ b/riscv/sbi-asm.S
> @@ -6,6 +6,7 @@
> */
> #define __ASSEMBLY__
> #include <asm/asm.h>
> +#include <asm/asm-offsets.h>
> #include <asm/csr.h>
>
> #include "sbi-tests.h"
> @@ -58,8 +59,8 @@ sbi_hsm_check:
> 7: lb t0, 0(t1)
> pause
> beqz t0, 7b
> - li a7, 0x48534d /* SBI_EXT_HSM */
> - li a6, 1 /* SBI_EXT_HSM_HART_STOP */
> + li a7, ASM_SBI_EXT_HSM
> + li a6, ASM_SBI_EXT_HSM_HART_STOP
> ecall
> 8: pause
> j 8b
> @@ -129,3 +130,94 @@ sbi_susp_resume:
> call longjmp
> 6: pause /* unreachable */
> j 6b
> +
> +.global sse_entry
> +sse_entry:
> + /* Save stack temporarily */
> + REG_S sp, SBI_SSE_REG_TMP(a7)
> + /* Set entry stack */
> + REG_L sp, SBI_SSE_HANDLER_STACK(a7)
> +
> + addi sp, sp, -(PT_SIZE)
> + REG_S ra, PT_RA(sp)
> + REG_S s0, PT_S0(sp)
> + REG_S s1, PT_S1(sp)
> + REG_S s2, PT_S2(sp)
> + REG_S s3, PT_S3(sp)
> + REG_S s4, PT_S4(sp)
> + REG_S s5, PT_S5(sp)
> + REG_S s6, PT_S6(sp)
> + REG_S s7, PT_S7(sp)
> + REG_S s8, PT_S8(sp)
> + REG_S s9, PT_S9(sp)
> + REG_S s10, PT_S10(sp)
> + REG_S s11, PT_S11(sp)
> + REG_S tp, PT_TP(sp)
> + REG_S t0, PT_T0(sp)
> + REG_S t1, PT_T1(sp)
> + REG_S t2, PT_T2(sp)
> + REG_S t3, PT_T3(sp)
> + REG_S t4, PT_T4(sp)
> + REG_S t5, PT_T5(sp)
> + REG_S t6, PT_T6(sp)
> + REG_S gp, PT_GP(sp)
> + REG_S a0, PT_A0(sp)
> + REG_S a1, PT_A1(sp)
> + REG_S a2, PT_A2(sp)
> + REG_S a3, PT_A3(sp)
> + REG_S a4, PT_A4(sp)
> + REG_S a5, PT_A5(sp)
> + csrr a1, CSR_SEPC
> + REG_S a1, PT_EPC(sp)
> + csrr a2, CSR_SSTATUS
> + REG_S a2, PT_STATUS(sp)
> +
> + REG_L a0, SBI_SSE_REG_TMP(a7)
> + REG_S a0, PT_SP(sp)
> +
> + REG_L t0, SBI_SSE_HANDLER(a7)
> + REG_L a0, SBI_SSE_HANDLER_DATA(a7)
> + mv a1, sp
> + mv a2, a6
> + jalr t0
> +
> +
> + REG_L a1, PT_EPC(sp)
> + REG_L a2, PT_STATUS(sp)
> + csrw CSR_SEPC, a1
> + csrw CSR_SSTATUS, a2
> +
> + REG_L ra, PT_RA(sp)
> + REG_L s0, PT_S0(sp)
> + REG_L s1, PT_S1(sp)
> + REG_L s2, PT_S2(sp)
> + REG_L s3, PT_S3(sp)
> + REG_L s4, PT_S4(sp)
> + REG_L s5, PT_S5(sp)
> + REG_L s6, PT_S6(sp)
> + REG_L s7, PT_S7(sp)
> + REG_L s8, PT_S8(sp)
> + REG_L s9, PT_S9(sp)
> + REG_L s10, PT_S10(sp)
> + REG_L s11, PT_S11(sp)
> + REG_L tp, PT_TP(sp)
> + REG_L t0, PT_T0(sp)
> + REG_L t1, PT_T1(sp)
> + REG_L t2, PT_T2(sp)
> + REG_L t3, PT_T3(sp)
> + REG_L t4, PT_T4(sp)
> + REG_L t5, PT_T5(sp)
> + REG_L t6, PT_T6(sp)
> + REG_L gp, PT_GP(sp)
> + REG_L a0, PT_A0(sp)
> + REG_L a1, PT_A1(sp)
> + REG_L a2, PT_A2(sp)
> + REG_L a3, PT_A3(sp)
> + REG_L a4, PT_A4(sp)
> + REG_L a5, PT_A5(sp)
> +
> + REG_L sp, PT_SP(sp)
> +
> + li a7, ASM_SBI_EXT_SSE
> + li a6, ASM_SBI_EXT_SSE_COMPLETE
> + ecall
> diff --git a/riscv/sbi-sse.c b/riscv/sbi-sse.c
> index a230c600a5a2..85521546838c 100644
> --- a/riscv/sbi-sse.c
> +++ b/riscv/sbi-sse.c
> @@ -16,12 +16,12 @@
> #include <asm/processor.h>
> #include <asm/sbi.h>
> #include <asm/setup.h>
> -#include <asm/sse.h>
>
> #include "sbi-tests.h"
>
> #define SSE_STACK_SIZE PAGE_SIZE
>
> +void sse_entry(void);
> void check_sse(void);
>
> struct sse_event_info {
> diff --git a/riscv/sbi-tests.h b/riscv/sbi-tests.h
> index ce129968fe99..163751ba9ca6 100644
> --- a/riscv/sbi-tests.h
> +++ b/riscv/sbi-tests.h
> @@ -33,4 +33,25 @@
> #define SBI_SUSP_TEST_HARTID (1 << 2)
> #define SBI_SUSP_TEST_MASK 7
>
> +#define SBI_SSE_REG_TMP 0
> +#define SBI_SSE_HANDLER 8
> +#define SBI_SSE_HANDLER_DATA 16
> +#define SBI_SSE_HANDLER_STACK 24
> +
> +#ifndef __ASSEMBLY__
> +
> +typedef void (*sse_handler_fn)(void *data, struct pt_regs *regs, unsigned int hartid);
> +
> +struct sse_handler_arg {
> + unsigned long reg_tmp;
> + sse_handler_fn handler;
> + void *handler_data;
> + void *stack;
> +};
> +_Static_assert(offsetof(struct sse_handler_arg, reg_tmp) == SBI_SSE_REG_TMP);
> +_Static_assert(offsetof(struct sse_handler_arg, handler) == SBI_SSE_HANDLER);
> +_Static_assert(offsetof(struct sse_handler_arg, handler_data) == SBI_SSE_HANDLER_DATA);
> +_Static_assert(offsetof(struct sse_handler_arg, stack) == SBI_SSE_HANDLER_STACK);
> +
I'm not a huge fan but in the end, the result is the same and it suits
you ;) Let's go for it, I'll integrate that in the series (minus the HSM
stuff).
Thanks !
Clément
> +#endif /* !__ASSEMBLY__ */
> #endif /* _RISCV_SBI_TESTS_H_ */
More information about the kvm-riscv
mailing list