lib/aarch32/misc_helpers.S - sandbox/arthur/trustedfirmware-a - TrustedFirmware Git Browser

 /*
  * Copyright (c) 2016-2021, ARM Limited and Contributors. All rights reserved.
  *
  * SPDX-License-Identifier: BSD-3-Clause
  */

 #include <arch.h>
 #include <asm_macros.S>
 #include <assert_macros.S>
 #include <common/bl_common.h>
 #include <lib/xlat_tables/xlat_tables_defs.h>

 	.globl	smc
 	.globl	zeromem
 	.globl	zero_normalmem
 	.globl	memcpy4
 	.globl	disable_mmu_icache_secure
 	.globl	disable_mmu_secure
 	.globl	fixup_gdt_reloc

 #define PAGE_START_MASK		~(PAGE_SIZE_MASK)

 func smc
 	/*
 	 * For AArch32 only r0-r3 will be in the registers;
 	 * rest r4-r6 will be pushed on to the stack. So here, we'll
 	 * have to load them from the stack to registers r4-r6 explicitly.
 	 * Clobbers: r4-r6
 	 */
 	ldm	sp, {r4, r5, r6}
 	smc	#0
 endfunc smc

 /* -----------------------------------------------------------------------
  * void zeromem(void *mem, unsigned int length)
  *
  * Initialise a region in normal memory to 0. This functions complies with the
  * AAPCS and can be called from C code.
  *
  * -----------------------------------------------------------------------
  */
 func zeromem
 	/*
 	 * Readable names for registers
 	 *
 	 * Registers r0, r1 and r2 are also set by zeromem which
 	 * branches into the fallback path directly, so cursor, length and
 	 * stop_address should not be retargeted to other registers.
 	 */
 	cursor       .req r0 /* Start address and then current address */
 	length       .req r1 /* Length in bytes of the region to zero out */
 	/*
 	 * Reusing the r1 register as length is only used at the beginning of
 	 * the function.
 	 */
 	stop_address .req r1  /* Address past the last zeroed byte */
 	zeroreg1     .req r2  /* Source register filled with 0 */
 	zeroreg2     .req r3  /* Source register filled with 0 */
 	tmp	     .req r12 /* Temporary scratch register */

 	mov	zeroreg1, #0

 	/* stop_address is the address past the last to zero */
 	add	stop_address, cursor, length

 	/*
 	 * Length cannot be used anymore as it shares the same register with
 	 * stop_address.
 	 */
 	.unreq	length

 	/*
 	 * If the start address is already aligned to 8 bytes, skip this loop.
 	 */
 	tst	cursor, #(8-1)
 	beq	.Lzeromem_8bytes_aligned

 	/* Calculate the next address aligned to 8 bytes */
 	orr	tmp, cursor, #(8-1)
 	adds	tmp, tmp, #1
 	/* If it overflows, fallback to byte per byte zeroing */
 	beq	.Lzeromem_1byte_aligned
 	/* If the next aligned address is after the stop address, fall back */
 	cmp	tmp, stop_address
 	bhs	.Lzeromem_1byte_aligned

 	/* zero byte per byte */
 1:
 	strb	zeroreg1, [cursor], #1
 	cmp	cursor, tmp
 	bne	1b

 	/* zero 8 bytes at a time */
 .Lzeromem_8bytes_aligned:

 	/* Calculate the last 8 bytes aligned address. */
 	bic	tmp, stop_address, #(8-1)

 	cmp	cursor, tmp
 	bhs	2f

 	mov	zeroreg2, #0
 1:
 	stmia	cursor!, {zeroreg1, zeroreg2}
 	cmp	cursor, tmp
 	blo	1b
 2:

 	/* zero byte per byte */
 .Lzeromem_1byte_aligned:
 	cmp	cursor, stop_address
 	beq	2f
 1:
 	strb	zeroreg1, [cursor], #1
 	cmp	cursor, stop_address
 	bne	1b
 2:
 	bx	lr

 	.unreq	cursor
 	/*
 	 * length is already unreq'ed to reuse the register for another
 	 * variable.
 	 */
 	.unreq	stop_address
 	.unreq	zeroreg1
 	.unreq	zeroreg2
 	.unreq	tmp
 endfunc zeromem

 /*
  * AArch32 does not have special ways of zeroing normal memory as AArch64 does
  * using the DC ZVA instruction, so we just alias zero_normalmem to zeromem.
  */
 .equ	zero_normalmem, zeromem

 /* --------------------------------------------------------------------------
  * void memcpy4(void *dest, const void *src, unsigned int length)
  *
  * Copy length bytes from memory area src to memory area dest.
  * The memory areas should not overlap.
  * Destination and source addresses must be 4-byte aligned.
  * --------------------------------------------------------------------------
  */
 func memcpy4
 #if ENABLE_ASSERTIONS
 	orr	r3, r0, r1
 	tst	r3, #0x3
 	ASM_ASSERT(eq)
 #endif
 /* copy 4 bytes at a time */
 m_loop4:
 	cmp	r2, #4
 	blo	m_loop1
 	ldr	r3, [r1], #4
 	str	r3, [r0], #4
 	subs	r2, r2, #4
 	bne	m_loop4
 	bx	lr

 /* copy byte per byte */
 m_loop1:
 	ldrb	r3, [r1], #1
 	strb	r3, [r0], #1
 	subs	r2, r2, #1
 	bne	m_loop1
 	bx	lr
 endfunc memcpy4

 /* ---------------------------------------------------------------------------
  * Disable the MMU in Secure State
  * ---------------------------------------------------------------------------
  */

 func disable_mmu_secure
 	mov	r1, #(SCTLR_M_BIT | SCTLR_C_BIT)
 do_disable_mmu:
 #if ERRATA_A9_794073
 	stcopr	r0, BPIALL
 	dsb
 #endif
 	ldcopr	r0, SCTLR
 	bic	r0, r0, r1
 	stcopr	r0, SCTLR
 	isb				// ensure MMU is off
 	dsb	sy
 	bx	lr
 endfunc disable_mmu_secure


 func disable_mmu_icache_secure
 	ldr	r1, =(SCTLR_M_BIT | SCTLR_C_BIT | SCTLR_I_BIT)
 	b	do_disable_mmu
 endfunc disable_mmu_icache_secure

 /* ---------------------------------------------------------------------------
  * Helper to fixup Global Descriptor table (GDT) and dynamic relocations
  * (.rel.dyn) at runtime.
  *
  * This function is meant to be used when the firmware is compiled with -fpie
  * and linked with -pie options. We rely on the linker script exporting
  * appropriate markers for start and end of the section. For GOT, we
  * expect __GOT_START__ and __GOT_END__. Similarly for .rela.dyn, we expect
  * __RELA_START__ and __RELA_END__.
  *
  * The function takes the limits of the memory to apply fixups to as
  * arguments (which is usually the limits of the relocable BL image).
  *   r0 -  the start of the fixup region
  *   r1 -  the limit of the fixup region
  * These addresses have to be 4KB page aligned.
  * ---------------------------------------------------------------------------
  */

 /* Relocation codes */
 #define R_ARM_RELATIVE 	23

 func fixup_gdt_reloc
 	mov	r6, r0
 	mov	r7, r1

 #if ENABLE_ASSERTIONS
 	/* Test if the limits are 4K aligned */
 	orr	r0, r0, r1
 	mov	r1, #(PAGE_SIZE_MASK)
 	tst	r0, r1
 	ASM_ASSERT(eq)
 #endif
 	/*
 	 * Calculate the offset based on return address in lr.
 	 * Assume that this function is called within a page at the start of
 	 * fixup region.
 	 */
 	ldr	r1, =PAGE_START_MASK
 	and	r2, lr, r1
 	subs	r0, r2, r6	/* Diff(S) = Current Address - Compiled Address */
 	beq	3f		/* Diff(S) = 0. No relocation needed */

 	ldr	r1, =__GOT_START__
 	add	r1, r1, r0
 	ldr	r2, =__GOT_END__
 	add	r2, r2, r0

 	/*
 	 * GOT is an array of 32_bit addresses which must be fixed up as
 	 * new_addr = old_addr + Diff(S).
 	 * The new_addr is the address currently the binary is executing from
 	 * and old_addr is the address at compile time.
 	 */
 1:	ldr	r3, [r1]

 	/* Skip adding offset if address is < lower limit */
 	cmp	r3, r6
 	blo	2f

 	/* Skip adding offset if address is > upper limit */
 	cmp	r3, r7
 	bhi	2f
 	add	r3, r3, r0
 	str	r3, [r1]

 2:	add	r1, r1, #4
 	cmp	r1, r2
 	blo	1b

 	/* Starting dynamic relocations. Use ldr to get RELA_START and END */
 3:	ldr	r1, =__RELA_START__
 	add	r1, r1, r0
 	ldr	r2, =__RELA_END__
 	add	r2, r2, r0

 	/*
 	 * According to ELF-32 specification, the RELA data structure is as
 	 * follows:
 	 *	typedef struct {
 	 *		Elf32_Addr r_offset;
 	 *		Elf32_Xword r_info;
 	 *	} Elf32_Rela;
 	 *
 	 * r_offset is address of reference
 	 * r_info is symbol index and type of relocation (in this case
 	 * code 23  which corresponds to R_ARM_RELATIVE).
 	 *
 	 * Size of Elf32_Rela structure is 8 bytes.
 	 */

 	/* Skip R_ARM_NONE entry with code 0 */
 1:	ldr	r3, [r1, #4]
 	ands	r3, r3, #0xff
 	beq	2f

 #if ENABLE_ASSERTIONS
 	/* Assert that the relocation type is R_ARM_RELATIVE */
 	cmp	r3, #R_ARM_RELATIVE
 	ASM_ASSERT(eq)
 #endif
 	ldr	r3, [r1]	/* r_offset */
 	add	r3, r0, r3	/* Diff(S) + r_offset */
 	ldr 	r4, [r3]

 	/* Skip adding offset if address is < lower limit */
 	cmp	r4, r6
 	blo	2f

 	/* Skip adding offset if address is > upper limit */
 	cmp	r4, r7
 	bhi	2f

 	add 	r4, r0, r4
 	str	r4, [r3]

 2:	add	r1, r1, #8
 	cmp	r1, r2
 	blo	1b
 	bx	lr
 endfunc fixup_gdt_reloc
	/*
	* Copyright (c) 2016-2021, ARM Limited and Contributors. All rights reserved.
	*
	* SPDX-License-Identifier: BSD-3-Clause
	*/

	#include <arch.h>
	#include <asm_macros.S>
	#include <assert_macros.S>
	#include <common/bl_common.h>
	#include <lib/xlat_tables/xlat_tables_defs.h>

	.globl smc
	.globl zeromem
	.globl zero_normalmem
	.globl memcpy4
	.globl disable_mmu_icache_secure
	.globl disable_mmu_secure
	.globl fixup_gdt_reloc

	#define PAGE_START_MASK ~(PAGE_SIZE_MASK)

	func smc
	/*
	* For AArch32 only r0-r3 will be in the registers;
	* rest r4-r6 will be pushed on to the stack. So here, we'll
	* have to load them from the stack to registers r4-r6 explicitly.
	* Clobbers: r4-r6
	*/
	ldm sp, {r4, r5, r6}
	smc #0
	endfunc smc

	/* -----------------------------------------------------------------------
	* void zeromem(void *mem, unsigned int length)
	*
	* Initialise a region in normal memory to 0. This functions complies with the
	* AAPCS and can be called from C code.
	*
	* -----------------------------------------------------------------------
	*/
	func zeromem
	/*
	* Readable names for registers
	*
	* Registers r0, r1 and r2 are also set by zeromem which
	* branches into the fallback path directly, so cursor, length and
	* stop_address should not be retargeted to other registers.
	*/
	cursor .req r0 /* Start address and then current address */
	length .req r1 /* Length in bytes of the region to zero out */
	/*
	* Reusing the r1 register as length is only used at the beginning of
	* the function.
	*/
	stop_address .req r1 /* Address past the last zeroed byte */
	zeroreg1 .req r2 /* Source register filled with 0 */
	zeroreg2 .req r3 /* Source register filled with 0 */
	tmp .req r12 /* Temporary scratch register */

	mov zeroreg1, #0

	/* stop_address is the address past the last to zero */
	add stop_address, cursor, length

	/*
	* Length cannot be used anymore as it shares the same register with
	* stop_address.
	*/
	.unreq length

	/*
	* If the start address is already aligned to 8 bytes, skip this loop.
	*/
	tst cursor, #(8-1)
	beq .Lzeromem_8bytes_aligned

	/* Calculate the next address aligned to 8 bytes */
	orr tmp, cursor, #(8-1)
	adds tmp, tmp, #1
	/* If it overflows, fallback to byte per byte zeroing */
	beq .Lzeromem_1byte_aligned
	/* If the next aligned address is after the stop address, fall back */
	cmp tmp, stop_address
	bhs .Lzeromem_1byte_aligned

	/* zero byte per byte */
	1:
	strb zeroreg1, [cursor], #1
	cmp cursor, tmp
	bne 1b

	/* zero 8 bytes at a time */
	.Lzeromem_8bytes_aligned:

	/* Calculate the last 8 bytes aligned address. */
	bic tmp, stop_address, #(8-1)

	cmp cursor, tmp
	bhs 2f

	mov zeroreg2, #0
	1:
	stmia cursor!, {zeroreg1, zeroreg2}
	cmp cursor, tmp
	blo 1b
	2:

	/* zero byte per byte */
	.Lzeromem_1byte_aligned:
	cmp cursor, stop_address
	beq 2f
	1:
	strb zeroreg1, [cursor], #1
	cmp cursor, stop_address
	bne 1b
	2:
	bx lr

	.unreq cursor
	/*
	* length is already unreq'ed to reuse the register for another
	* variable.
	*/
	.unreq stop_address
	.unreq zeroreg1
	.unreq zeroreg2
	.unreq tmp
	endfunc zeromem

	/*
	* AArch32 does not have special ways of zeroing normal memory as AArch64 does
	* using the DC ZVA instruction, so we just alias zero_normalmem to zeromem.
	*/
	.equ zero_normalmem, zeromem

	/* --------------------------------------------------------------------------
	* void memcpy4(void dest, const void src, unsigned int length)
	*
	* Copy length bytes from memory area src to memory area dest.
	* The memory areas should not overlap.
	* Destination and source addresses must be 4-byte aligned.
	* --------------------------------------------------------------------------
	*/
	func memcpy4
	#if ENABLE_ASSERTIONS
	orr r3, r0, r1
	tst r3, #0x3
	ASM_ASSERT(eq)
	#endif
	/* copy 4 bytes at a time */
	m_loop4:
	cmp r2, #4
	blo m_loop1
	ldr r3, [r1], #4
	str r3, [r0], #4
	subs r2, r2, #4
	bne m_loop4
	bx lr

	/* copy byte per byte */
	m_loop1:
	ldrb r3, [r1], #1
	strb r3, [r0], #1
	subs r2, r2, #1
	bne m_loop1
	bx lr
	endfunc memcpy4

	/* ---------------------------------------------------------------------------
	* Disable the MMU in Secure State
	* ---------------------------------------------------------------------------
	*/

	func disable_mmu_secure
	mov r1, #(SCTLR_M_BIT \| SCTLR_C_BIT)
	do_disable_mmu:
	#if ERRATA_A9_794073
	stcopr r0, BPIALL
	dsb
	#endif
	ldcopr r0, SCTLR
	bic r0, r0, r1
	stcopr r0, SCTLR
	isb // ensure MMU is off
	dsb sy
	bx lr
	endfunc disable_mmu_secure


	func disable_mmu_icache_secure
	ldr r1, =(SCTLR_M_BIT \| SCTLR_C_BIT \| SCTLR_I_BIT)
	b do_disable_mmu
	endfunc disable_mmu_icache_secure

	/* ---------------------------------------------------------------------------
	* Helper to fixup Global Descriptor table (GDT) and dynamic relocations
	* (.rel.dyn) at runtime.
	*
	* This function is meant to be used when the firmware is compiled with -fpie
	* and linked with -pie options. We rely on the linker script exporting
	* appropriate markers for start and end of the section. For GOT, we
	* expect __GOT_START__ and __GOT_END__. Similarly for .rela.dyn, we expect
	* __RELA_START__ and __RELA_END__.
	*
	* The function takes the limits of the memory to apply fixups to as
	* arguments (which is usually the limits of the relocable BL image).
	* r0 - the start of the fixup region
	* r1 - the limit of the fixup region
	* These addresses have to be 4KB page aligned.
	* ---------------------------------------------------------------------------
	*/

	/* Relocation codes */
	#define R_ARM_RELATIVE 23

	func fixup_gdt_reloc
	mov r6, r0
	mov r7, r1

	#if ENABLE_ASSERTIONS
	/* Test if the limits are 4K aligned */
	orr r0, r0, r1
	mov r1, #(PAGE_SIZE_MASK)
	tst r0, r1
	ASM_ASSERT(eq)
	#endif
	/*
	* Calculate the offset based on return address in lr.
	* Assume that this function is called within a page at the start of
	* fixup region.
	*/
	ldr r1, =PAGE_START_MASK
	and r2, lr, r1
	subs r0, r2, r6 /* Diff(S) = Current Address - Compiled Address */
	beq 3f /* Diff(S) = 0. No relocation needed */

	ldr r1, =__GOT_START__
	add r1, r1, r0
	ldr r2, =__GOT_END__
	add r2, r2, r0

	/*
	* GOT is an array of 32_bit addresses which must be fixed up as
	* new_addr = old_addr + Diff(S).
	* The new_addr is the address currently the binary is executing from
	* and old_addr is the address at compile time.
	*/
	1: ldr r3, [r1]

	/* Skip adding offset if address is < lower limit */
	cmp r3, r6
	blo 2f

	/* Skip adding offset if address is > upper limit */
	cmp r3, r7
	bhi 2f
	add r3, r3, r0
	str r3, [r1]

	2: add r1, r1, #4
	cmp r1, r2
	blo 1b

	/* Starting dynamic relocations. Use ldr to get RELA_START and END */
	3: ldr r1, =__RELA_START__
	add r1, r1, r0
	ldr r2, =__RELA_END__
	add r2, r2, r0

	/*
	* According to ELF-32 specification, the RELA data structure is as
	* follows:
	* typedef struct {
	* Elf32_Addr r_offset;
	* Elf32_Xword r_info;
	* } Elf32_Rela;
	*
	* r_offset is address of reference
	* r_info is symbol index and type of relocation (in this case
	* code 23 which corresponds to R_ARM_RELATIVE).
	*
	* Size of Elf32_Rela structure is 8 bytes.
	*/

	/* Skip R_ARM_NONE entry with code 0 */
	1: ldr r3, [r1, #4]
	ands r3, r3, #0xff
	beq 2f

	#if ENABLE_ASSERTIONS
	/* Assert that the relocation type is R_ARM_RELATIVE */
	cmp r3, #R_ARM_RELATIVE
	ASM_ASSERT(eq)
	#endif
	ldr r3, [r1] /* r_offset */
	add r3, r0, r3 /* Diff(S) + r_offset */
	ldr r4, [r3]

	/* Skip adding offset if address is < lower limit */
	cmp r4, r6
	blo 2f

	/* Skip adding offset if address is > upper limit */
	cmp r4, r7
	bhi 2f

	add r4, r0, r4
	str r4, [r3]

	2: add r1, r1, #8
	cmp r1, r2
	blo 1b
	bx lr
	endfunc fixup_gdt_reloc