[PATCH v2 3/8] ARM: add macro to perform far branches (b/bl)
Ard Biesheuvel
ard.biesheuvel at linaro.org
Wed Mar 18 03:07:17 PDT 2015
On 13 March 2015 at 13:07, Ard Biesheuvel <ard.biesheuvel at linaro.org> wrote:
> These macros execute PC-relative branches, but with a larger
> reach than the 24 bits that are available in the b and bl opcodes.
>
> Acked-by: Nicolas Pitre <nico at linaro.org>
> Signed-off-by: Ard Biesheuvel <ard.biesheuvel at linaro.org>
> ---
> arch/arm/include/asm/assembler.h | 83 ++++++++++++++++++++++++++++++++++++++++
> 1 file changed, 83 insertions(+)
>
> diff --git a/arch/arm/include/asm/assembler.h b/arch/arm/include/asm/assembler.h
> index f67fd3afebdf..2e7f55194782 100644
> --- a/arch/arm/include/asm/assembler.h
> +++ b/arch/arm/include/asm/assembler.h
> @@ -88,6 +88,17 @@
> #endif
>
> /*
> + * The program counter is always ahead of the address of the currently
> + * executing instruction by PC_BIAS bytes, whose value differs depending
> + * on the execution mode.
> + */
> +#ifdef CONFIG_THUMB2_KERNEL
> +#define PC_BIAS 4
> +#else
> +#define PC_BIAS 8
> +#endif
> +
> +/*
> * Enable and disable interrupts
> */
> #if __LINUX_ARM_ARCH__ >= 6
> @@ -108,6 +119,78 @@
> .endm
> #endif
>
> + /*
> + * Macros to emit relative conditional branches that may exceed the
> + * range of the 24-bit immediate of the ordinary b/bl instructions.
> + * NOTE: this doesn't work with locally defined symbols, as they
> + * lack the ARM/Thumb annotation (even if they are annotated as
> + * functions)
> + */
> + .macro b_far, target, tmpreg, c=
> +#if defined(CONFIG_CPU_32v7) || defined(CONFIG_CPU_32v7M)
> + movt\c \tmpreg, #:upper16:(\target - (8888f + PC_BIAS))
> + movw\c \tmpreg, #:lower16:(\target - (8888f + PC_BIAS))
> +8888: add\c pc, pc, \tmpreg
> +#else
> + ldr\c \tmpreg, 8889f
> +8888: add\c pc, pc, \tmpreg
> + .ifnb \c
> + b 8890f
> + .endif
> +8889: .long \target - (8888b + PC_BIAS)
> +8890:
> +#endif
> + .endm
Actually, I have found something better:
add\c \tmpreg, pc, #:pc_g0_nc:\target - PC_BIAS
add\c \tmpreg, \tmpreg, #:pc_g1_nc:\target - PC_BIAS + 4
add\c pc, \tmpreg, #:pc_g2:\target - PC_BIAS + 8
This uses a PC-relative group relocation to split the offset into
12-bit chunks and poke them into the add instructions
This way, we don't need the literal at all.
Note that add with pc as destination is ARM-only, so we should
probably retain the v7 movw/movt regardless
> +
> + .macro bl_far, target, c=
> +#if defined(CONFIG_CPU_32v7) || defined(CONFIG_CPU_32v7M)
> + movt\c ip, #:upper16:(\target - (8887f + PC_BIAS))
> + movw\c ip, #:lower16:(\target - (8887f + PC_BIAS))
> +8887: add\c ip, ip, pc
> + blx\c ip
> +#else
> + adr\c lr, 8887f
> + b_far \target, ip, \c
> +8887:
> +#endif
> + .endm
> +
> + /*
> + * Macros to emit absolute conditional branches: these are preferred
> + * over the far variants above because they use fewer instructions
> + * and/or use implicit literals that the assembler can group together
> + * to optimize cache utilization. However, they can only be used to
> + * call functions at their link time address, which rules out early boot
> + * code that executes with the MMU off.
> + * The v7 variant uses a movt/movw pair to prevent potential D-cache
> + * stalls on the literal, so using these macros is preferred over using
> + * 'ldr pc, =XXX' directly (unless no scratch register is available)
> + * NOTE: this doesn't work with locally defined symbols, as they
> + * lack the ARM/Thumb annotation (even if they are annotated as
> + * functions)
> + */
> + .macro b_abs, target, tmpreg, c=
> +#if defined(CONFIG_CPU_32v7) || defined(CONFIG_CPU_32v7M)
> + movt\c \tmpreg, #:upper16:\target
> + movw\c \tmpreg, #:lower16:\target
> + bx\c \tmpreg
> +#else
> + ldr\c pc, =\target
> +#endif
> + .endm
> +
> + .macro bl_abs, target, c=
> +#if defined(CONFIG_CPU_32v7) || defined(CONFIG_CPU_32v7M)
> + movt\c lr, #:upper16:\target
> + movw\c lr, #:lower16:\target
> + blx\c lr
> +#else
> + adr\c lr, BSYM(8886f)
> + ldr\c pc, =\target
> +8886:
> +#endif
> + .endm
> +
> .macro asm_trace_hardirqs_off
> #if defined(CONFIG_TRACE_IRQFLAGS)
> stmdb sp!, {r0-r3, ip, lr}
> --
> 1.8.3.2
>
More information about the linux-arm-kernel
mailing list