[PATCH v4] lib: sbi: Improve csr read and write

Xiang W wxjstz at 126.com
Thu May 26 08:19:27 PDT 2022


在 2022-05-26星期四的 20:35 +0530,Anup Patel写道:
> On Thu, May 26, 2022 at 8:12 PM Xiang W <wxjstz at 126.com> wrote:
> > 
> > Reduce the overhead of csr read and write code by producing a small
> > piece of code to perform csr read and write.
> > 
> > Signed-off-by: Xiang W <wxjstz at 126.com>
> > ---
> > Changes in v4:
> > - add fence.i sync instruction memory
> > 
> > Changes in v3:
> > - Prevent unnecessary optimizations by the compiler
> > 
> > Changes in v2:
> > - Fix thread safety related bugs as suggested by Anup
> > 
> >  lib/sbi/riscv_asm.c | 145 ++++----------------------------------------
> >  1 file changed, 13 insertions(+), 132 deletions(-)
> > 
> > diff --git a/lib/sbi/riscv_asm.c b/lib/sbi/riscv_asm.c
> > index a09cf78..452cb19 100644
> > --- a/lib/sbi/riscv_asm.c
> > +++ b/lib/sbi/riscv_asm.c
> > @@ -9,6 +9,7 @@
> > 
> >  #include <sbi/riscv_asm.h>
> >  #include <sbi/riscv_encoding.h>
> > +#include <sbi/riscv_barrier.h>
> >  #include <sbi/sbi_error.h>
> >  #include <sbi/sbi_platform.h>
> >  #include <sbi/sbi_console.h>
> > @@ -93,142 +94,22 @@ void misa_string(int xlen, char *out, unsigned int out_sz)
> > 
> >  unsigned long csr_read_num(int csr_num)
> >  {
> > -#define switchcase_csr_read(__csr_num, __val)          \
> > -       case __csr_num:                                 \
> > -               __val = csr_read(__csr_num);            \
> > -               break;
> > -#define switchcase_csr_read_2(__csr_num, __val)        \
> > -       switchcase_csr_read(__csr_num + 0, __val)       \
> > -       switchcase_csr_read(__csr_num + 1, __val)
> > -#define switchcase_csr_read_4(__csr_num, __val)        \
> > -       switchcase_csr_read_2(__csr_num + 0, __val)     \
> > -       switchcase_csr_read_2(__csr_num + 2, __val)
> > -#define switchcase_csr_read_8(__csr_num, __val)        \
> > -       switchcase_csr_read_4(__csr_num + 0, __val)     \
> > -       switchcase_csr_read_4(__csr_num + 4, __val)
> > -#define switchcase_csr_read_16(__csr_num, __val)       \
> > -       switchcase_csr_read_8(__csr_num + 0, __val)     \
> > -       switchcase_csr_read_8(__csr_num + 8, __val)
> > -#define switchcase_csr_read_32(__csr_num, __val)       \
> > -       switchcase_csr_read_16(__csr_num + 0, __val)    \
> > -       switchcase_csr_read_16(__csr_num + 16, __val)
> > -#define switchcase_csr_read_64(__csr_num, __val)       \
> > -       switchcase_csr_read_32(__csr_num + 0, __val)    \
> > -       switchcase_csr_read_32(__csr_num + 32, __val)
> > -
> > -       unsigned long ret = 0;
> > -
> > -       switch (csr_num) {
> > -       switchcase_csr_read_16(CSR_PMPCFG0, ret)
> > -       switchcase_csr_read_64(CSR_PMPADDR0, ret)
> > -       switchcase_csr_read(CSR_MCYCLE, ret)
> > -       switchcase_csr_read(CSR_MINSTRET, ret)
> > -       switchcase_csr_read(CSR_MHPMCOUNTER3, ret)
> > -       switchcase_csr_read_4(CSR_MHPMCOUNTER4, ret)
> > -       switchcase_csr_read_8(CSR_MHPMCOUNTER8, ret)
> > -       switchcase_csr_read_16(CSR_MHPMCOUNTER16, ret)
> > -       switchcase_csr_read(CSR_MCOUNTINHIBIT, ret)
> > -       switchcase_csr_read(CSR_MHPMEVENT3, ret)
> > -       switchcase_csr_read_4(CSR_MHPMEVENT4, ret)
> > -       switchcase_csr_read_8(CSR_MHPMEVENT8, ret)
> > -       switchcase_csr_read_16(CSR_MHPMEVENT16, ret)
> > -#if __riscv_xlen == 32
> > -       switchcase_csr_read(CSR_MCYCLEH, ret)
> > -       switchcase_csr_read(CSR_MINSTRETH, ret)
> > -       switchcase_csr_read(CSR_MHPMCOUNTER3H, ret)
> > -       switchcase_csr_read_4(CSR_MHPMCOUNTER4H, ret)
> > -       switchcase_csr_read_8(CSR_MHPMCOUNTER8H, ret)
> > -       switchcase_csr_read_16(CSR_MHPMCOUNTER16H, ret)
> > -       /**
> > -        * The CSR range MHPMEVENT[3-16]H are available only if sscofpmf
> > -        * extension is present. The caller must ensure that.
> > -        */
> > -       switchcase_csr_read(CSR_MHPMEVENT3H, ret)
> > -       switchcase_csr_read_4(CSR_MHPMEVENT4H, ret)
> > -       switchcase_csr_read_8(CSR_MHPMEVENT8H, ret)
> > -       switchcase_csr_read_16(CSR_MHPMEVENT16H, ret)
> > -#endif
> > -
> > -       default:
> > -               sbi_panic("%s: Unknown CSR %#x", __func__, csr_num);
> > -               break;
> > -       };
> > -
> > -       return ret;
> > -
> > -#undef switchcase_csr_read_64
> > -#undef switchcase_csr_read_32
> > -#undef switchcase_csr_read_16
> > -#undef switchcase_csr_read_8
> > -#undef switchcase_csr_read_4
> > -#undef switchcase_csr_read_2
> > -#undef switchcase_csr_read
> > +       volatile uint32_t opcode_buff[2];
> > +       typedef unsigned long (*read_f)(void);
> > +       opcode_buff[0] = (csr_num << 20) | 0x00002573; /* csrr a0, csr */
> > +       opcode_buff[1] = 0x00008067; /* ret */
> > +       RISCV_FENCE_I;
> > +       return ((read_f)opcode_buff)();
> >  }
> > 
> >  void csr_write_num(int csr_num, unsigned long val)
> >  {
> > -#define switchcase_csr_write(__csr_num, __val)         \
> > -       case __csr_num:                                 \
> > -               csr_write(__csr_num, __val);            \
> > -               break;
> > -#define switchcase_csr_write_2(__csr_num, __val)       \
> > -       switchcase_csr_write(__csr_num + 0, __val)      \
> > -       switchcase_csr_write(__csr_num + 1, __val)
> > -#define switchcase_csr_write_4(__csr_num, __val)       \
> > -       switchcase_csr_write_2(__csr_num + 0, __val)    \
> > -       switchcase_csr_write_2(__csr_num + 2, __val)
> > -#define switchcase_csr_write_8(__csr_num, __val)       \
> > -       switchcase_csr_write_4(__csr_num + 0, __val)    \
> > -       switchcase_csr_write_4(__csr_num + 4, __val)
> > -#define switchcase_csr_write_16(__csr_num, __val)      \
> > -       switchcase_csr_write_8(__csr_num + 0, __val)    \
> > -       switchcase_csr_write_8(__csr_num + 8, __val)
> > -#define switchcase_csr_write_32(__csr_num, __val)      \
> > -       switchcase_csr_write_16(__csr_num + 0, __val)   \
> > -       switchcase_csr_write_16(__csr_num + 16, __val)
> > -#define switchcase_csr_write_64(__csr_num, __val)      \
> > -       switchcase_csr_write_32(__csr_num + 0, __val)   \
> > -       switchcase_csr_write_32(__csr_num + 32, __val)
> > -
> > -       switch (csr_num) {
> > -       switchcase_csr_write_16(CSR_PMPCFG0, val)
> > -       switchcase_csr_write_64(CSR_PMPADDR0, val)
> > -       switchcase_csr_write(CSR_MCYCLE, val)
> > -       switchcase_csr_write(CSR_MINSTRET, val)
> > -       switchcase_csr_write(CSR_MHPMCOUNTER3, val)
> > -       switchcase_csr_write_4(CSR_MHPMCOUNTER4, val)
> > -       switchcase_csr_write_8(CSR_MHPMCOUNTER8, val)
> > -       switchcase_csr_write_16(CSR_MHPMCOUNTER16, val)
> > -#if __riscv_xlen == 32
> > -       switchcase_csr_write(CSR_MCYCLEH, val)
> > -       switchcase_csr_write(CSR_MINSTRETH, val)
> > -       switchcase_csr_write(CSR_MHPMCOUNTER3H, val)
> > -       switchcase_csr_write_4(CSR_MHPMCOUNTER4H, val)
> > -       switchcase_csr_write_8(CSR_MHPMCOUNTER8H, val)
> > -       switchcase_csr_write_16(CSR_MHPMCOUNTER16H, val)
> > -       switchcase_csr_write(CSR_MHPMEVENT3H, val)
> > -       switchcase_csr_write_4(CSR_MHPMEVENT4H, val)
> > -       switchcase_csr_write_8(CSR_MHPMEVENT8H, val)
> > -       switchcase_csr_write_16(CSR_MHPMEVENT16H, val)
> > -#endif
> > -       switchcase_csr_write(CSR_MCOUNTINHIBIT, val)
> > -       switchcase_csr_write(CSR_MHPMEVENT3, val)
> > -       switchcase_csr_write_4(CSR_MHPMEVENT4, val)
> > -       switchcase_csr_write_8(CSR_MHPMEVENT8, val)
> > -       switchcase_csr_write_16(CSR_MHPMEVENT16, val)
> > -
> > -       default:
> > -               sbi_panic("%s: Unknown CSR %#x", __func__, csr_num);
> > -               break;
> > -       };
> > -
> > -#undef switchcase_csr_write_64
> > -#undef switchcase_csr_write_32
> > -#undef switchcase_csr_write_16
> > -#undef switchcase_csr_write_8
> > -#undef switchcase_csr_write_4
> > -#undef switchcase_csr_write_2
> > -#undef switchcase_csr_write
> > +       volatile uint32_t opcode_buff[2];
> > +       typedef void (*write_f)(unsigned long val);
> > +       opcode_buff[0] = (csr_num << 20) | 0x00051073; /* csrw csr, a0 */
> > +       opcode_buff[1] = 0x00008067; /* ret */
> > +       RISCV_FENCE_I;
> 
> I agree we need FENCE.I in the path but this is
> like a big hammer in the execution path.
> 
> This is now much slower compared to the existing
> approach because every CSR access using this
> function will execute FENCE.I
I passed the qemu test, and it can be run normally with
or without fence.i. But I'm not sure if the exception
happens on other platform or we have a more lightweight
way.

Regards,
Xiang W
> 
> Regards,
> Anup
> 
> > +       ((write_f)opcode_buff)(val);
> >  }
> > 
> >  static unsigned long ctz(unsigned long x)
> > --
> > 2.30.2
> > 
> > 
> > --
> > opensbi mailing list
> > opensbi at lists.infradead.org
> > http://lists.infradead.org/mailman/listinfo/opensbi





More information about the opensbi mailing list