|  | /* | 
|  | * Copyright (c) 2016-2021, ARM Limited and Contributors. All rights reserved. | 
|  | * | 
|  | * SPDX-License-Identifier: BSD-3-Clause | 
|  | */ | 
|  |  | 
|  | #include <arch.h> | 
|  | #include <asm_macros.S> | 
|  | #include <assert_macros.S> | 
|  | #include <common/bl_common.h> | 
|  | #include <lib/xlat_tables/xlat_tables_defs.h> | 
|  |  | 
|  | .globl	smc | 
|  | .globl	zeromem | 
|  | .globl	zero_normalmem | 
|  | .globl	memcpy4 | 
|  | .globl	disable_mmu_icache_secure | 
|  | .globl	disable_mmu_secure | 
|  | .globl	fixup_gdt_reloc | 
|  |  | 
|  | #define PAGE_START_MASK		~(PAGE_SIZE_MASK) | 
|  |  | 
|  | func smc | 
|  | /* | 
|  | * For AArch32 only r0-r3 will be in the registers; | 
|  | * rest r4-r6 will be pushed on to the stack. So here, we'll | 
|  | * have to load them from the stack to registers r4-r6 explicitly. | 
|  | * Clobbers: r4-r6 | 
|  | */ | 
|  | ldm	sp, {r4, r5, r6} | 
|  | smc	#0 | 
|  | endfunc smc | 
|  |  | 
|  | /* ----------------------------------------------------------------------- | 
|  | * void zeromem(void *mem, unsigned int length) | 
|  | * | 
|  | * Initialise a region in normal memory to 0. This functions complies with the | 
|  | * AAPCS and can be called from C code. | 
|  | * | 
|  | * ----------------------------------------------------------------------- | 
|  | */ | 
|  | func zeromem | 
|  | /* | 
|  | * Readable names for registers | 
|  | * | 
|  | * Registers r0, r1 and r2 are also set by zeromem which | 
|  | * branches into the fallback path directly, so cursor, length and | 
|  | * stop_address should not be retargeted to other registers. | 
|  | */ | 
|  | cursor       .req r0 /* Start address and then current address */ | 
|  | length       .req r1 /* Length in bytes of the region to zero out */ | 
|  | /* | 
|  | * Reusing the r1 register as length is only used at the beginning of | 
|  | * the function. | 
|  | */ | 
|  | stop_address .req r1  /* Address past the last zeroed byte */ | 
|  | zeroreg1     .req r2  /* Source register filled with 0 */ | 
|  | zeroreg2     .req r3  /* Source register filled with 0 */ | 
|  | tmp	     .req r12 /* Temporary scratch register */ | 
|  |  | 
|  | mov	zeroreg1, #0 | 
|  |  | 
|  | /* stop_address is the address past the last to zero */ | 
|  | add	stop_address, cursor, length | 
|  |  | 
|  | /* | 
|  | * Length cannot be used anymore as it shares the same register with | 
|  | * stop_address. | 
|  | */ | 
|  | .unreq	length | 
|  |  | 
|  | /* | 
|  | * If the start address is already aligned to 8 bytes, skip this loop. | 
|  | */ | 
|  | tst	cursor, #(8-1) | 
|  | beq	.Lzeromem_8bytes_aligned | 
|  |  | 
|  | /* Calculate the next address aligned to 8 bytes */ | 
|  | orr	tmp, cursor, #(8-1) | 
|  | adds	tmp, tmp, #1 | 
|  | /* If it overflows, fallback to byte per byte zeroing */ | 
|  | beq	.Lzeromem_1byte_aligned | 
|  | /* If the next aligned address is after the stop address, fall back */ | 
|  | cmp	tmp, stop_address | 
|  | bhs	.Lzeromem_1byte_aligned | 
|  |  | 
|  | /* zero byte per byte */ | 
|  | 1: | 
|  | strb	zeroreg1, [cursor], #1 | 
|  | cmp	cursor, tmp | 
|  | bne	1b | 
|  |  | 
|  | /* zero 8 bytes at a time */ | 
|  | .Lzeromem_8bytes_aligned: | 
|  |  | 
|  | /* Calculate the last 8 bytes aligned address. */ | 
|  | bic	tmp, stop_address, #(8-1) | 
|  |  | 
|  | cmp	cursor, tmp | 
|  | bhs	2f | 
|  |  | 
|  | mov	zeroreg2, #0 | 
|  | 1: | 
|  | stmia	cursor!, {zeroreg1, zeroreg2} | 
|  | cmp	cursor, tmp | 
|  | blo	1b | 
|  | 2: | 
|  |  | 
|  | /* zero byte per byte */ | 
|  | .Lzeromem_1byte_aligned: | 
|  | cmp	cursor, stop_address | 
|  | beq	2f | 
|  | 1: | 
|  | strb	zeroreg1, [cursor], #1 | 
|  | cmp	cursor, stop_address | 
|  | bne	1b | 
|  | 2: | 
|  | bx	lr | 
|  |  | 
|  | .unreq	cursor | 
|  | /* | 
|  | * length is already unreq'ed to reuse the register for another | 
|  | * variable. | 
|  | */ | 
|  | .unreq	stop_address | 
|  | .unreq	zeroreg1 | 
|  | .unreq	zeroreg2 | 
|  | .unreq	tmp | 
|  | endfunc zeromem | 
|  |  | 
|  | /* | 
|  | * AArch32 does not have special ways of zeroing normal memory as AArch64 does | 
|  | * using the DC ZVA instruction, so we just alias zero_normalmem to zeromem. | 
|  | */ | 
|  | .equ	zero_normalmem, zeromem | 
|  |  | 
|  | /* -------------------------------------------------------------------------- | 
|  | * void memcpy4(void *dest, const void *src, unsigned int length) | 
|  | * | 
|  | * Copy length bytes from memory area src to memory area dest. | 
|  | * The memory areas should not overlap. | 
|  | * Destination and source addresses must be 4-byte aligned. | 
|  | * -------------------------------------------------------------------------- | 
|  | */ | 
|  | func memcpy4 | 
|  | #if ENABLE_ASSERTIONS | 
|  | orr	r3, r0, r1 | 
|  | tst	r3, #0x3 | 
|  | ASM_ASSERT(eq) | 
|  | #endif | 
|  | /* copy 4 bytes at a time */ | 
|  | m_loop4: | 
|  | cmp	r2, #4 | 
|  | blo	m_loop1 | 
|  | ldr	r3, [r1], #4 | 
|  | str	r3, [r0], #4 | 
|  | subs	r2, r2, #4 | 
|  | bne	m_loop4 | 
|  | bx	lr | 
|  |  | 
|  | /* copy byte per byte */ | 
|  | m_loop1: | 
|  | ldrb	r3, [r1], #1 | 
|  | strb	r3, [r0], #1 | 
|  | subs	r2, r2, #1 | 
|  | bne	m_loop1 | 
|  | bx	lr | 
|  | endfunc memcpy4 | 
|  |  | 
|  | /* --------------------------------------------------------------------------- | 
|  | * Disable the MMU in Secure State | 
|  | * --------------------------------------------------------------------------- | 
|  | */ | 
|  |  | 
|  | func disable_mmu_secure | 
|  | mov	r1, #(SCTLR_M_BIT | SCTLR_C_BIT) | 
|  | do_disable_mmu: | 
|  | #if ERRATA_A9_794073 | 
|  | stcopr	r0, BPIALL | 
|  | dsb | 
|  | #endif | 
|  | ldcopr	r0, SCTLR | 
|  | bic	r0, r0, r1 | 
|  | stcopr	r0, SCTLR | 
|  | isb				// ensure MMU is off | 
|  | dsb	sy | 
|  | bx	lr | 
|  | endfunc disable_mmu_secure | 
|  |  | 
|  |  | 
|  | func disable_mmu_icache_secure | 
|  | ldr	r1, =(SCTLR_M_BIT | SCTLR_C_BIT | SCTLR_I_BIT) | 
|  | b	do_disable_mmu | 
|  | endfunc disable_mmu_icache_secure | 
|  |  | 
|  | /* --------------------------------------------------------------------------- | 
|  | * Helper to fixup Global Descriptor table (GDT) and dynamic relocations | 
|  | * (.rel.dyn) at runtime. | 
|  | * | 
|  | * This function is meant to be used when the firmware is compiled with -fpie | 
|  | * and linked with -pie options. We rely on the linker script exporting | 
|  | * appropriate markers for start and end of the section. For GOT, we | 
|  | * expect __GOT_START__ and __GOT_END__. Similarly for .rela.dyn, we expect | 
|  | * __RELA_START__ and __RELA_END__. | 
|  | * | 
|  | * The function takes the limits of the memory to apply fixups to as | 
|  | * arguments (which is usually the limits of the relocable BL image). | 
|  | *   r0 -  the start of the fixup region | 
|  | *   r1 -  the limit of the fixup region | 
|  | * These addresses have to be 4KB page aligned. | 
|  | * --------------------------------------------------------------------------- | 
|  | */ | 
|  |  | 
|  | /* Relocation codes */ | 
|  | #define R_ARM_RELATIVE 	23 | 
|  |  | 
|  | func fixup_gdt_reloc | 
|  | mov	r6, r0 | 
|  | mov	r7, r1 | 
|  |  | 
|  | #if ENABLE_ASSERTIONS | 
|  | /* Test if the limits are 4K aligned */ | 
|  | orr	r0, r0, r1 | 
|  | mov	r1, #(PAGE_SIZE_MASK) | 
|  | tst	r0, r1 | 
|  | ASM_ASSERT(eq) | 
|  | #endif | 
|  | /* | 
|  | * Calculate the offset based on return address in lr. | 
|  | * Assume that this function is called within a page at the start of | 
|  | * fixup region. | 
|  | */ | 
|  | ldr	r1, =PAGE_START_MASK | 
|  | and	r2, lr, r1 | 
|  | subs	r0, r2, r6	/* Diff(S) = Current Address - Compiled Address */ | 
|  | beq	3f		/* Diff(S) = 0. No relocation needed */ | 
|  |  | 
|  | ldr	r1, =__GOT_START__ | 
|  | add	r1, r1, r0 | 
|  | ldr	r2, =__GOT_END__ | 
|  | add	r2, r2, r0 | 
|  |  | 
|  | /* | 
|  | * GOT is an array of 32_bit addresses which must be fixed up as | 
|  | * new_addr = old_addr + Diff(S). | 
|  | * The new_addr is the address currently the binary is executing from | 
|  | * and old_addr is the address at compile time. | 
|  | */ | 
|  | 1:	ldr	r3, [r1] | 
|  |  | 
|  | /* Skip adding offset if address is < lower limit */ | 
|  | cmp	r3, r6 | 
|  | blo	2f | 
|  |  | 
|  | /* Skip adding offset if address is > upper limit */ | 
|  | cmp	r3, r7 | 
|  | bhi	2f | 
|  | add	r3, r3, r0 | 
|  | str	r3, [r1] | 
|  |  | 
|  | 2:	add	r1, r1, #4 | 
|  | cmp	r1, r2 | 
|  | blo	1b | 
|  |  | 
|  | /* Starting dynamic relocations. Use ldr to get RELA_START and END */ | 
|  | 3:	ldr	r1, =__RELA_START__ | 
|  | add	r1, r1, r0 | 
|  | ldr	r2, =__RELA_END__ | 
|  | add	r2, r2, r0 | 
|  |  | 
|  | /* | 
|  | * According to ELF-32 specification, the RELA data structure is as | 
|  | * follows: | 
|  | *	typedef struct { | 
|  | *		Elf32_Addr r_offset; | 
|  | *		Elf32_Xword r_info; | 
|  | *	} Elf32_Rela; | 
|  | * | 
|  | * r_offset is address of reference | 
|  | * r_info is symbol index and type of relocation (in this case | 
|  | * code 23  which corresponds to R_ARM_RELATIVE). | 
|  | * | 
|  | * Size of Elf32_Rela structure is 8 bytes. | 
|  | */ | 
|  |  | 
|  | /* Skip R_ARM_NONE entry with code 0 */ | 
|  | 1:	ldr	r3, [r1, #4] | 
|  | ands	r3, r3, #0xff | 
|  | beq	2f | 
|  |  | 
|  | #if ENABLE_ASSERTIONS | 
|  | /* Assert that the relocation type is R_ARM_RELATIVE */ | 
|  | cmp	r3, #R_ARM_RELATIVE | 
|  | ASM_ASSERT(eq) | 
|  | #endif | 
|  | ldr	r3, [r1]	/* r_offset */ | 
|  | add	r3, r0, r3	/* Diff(S) + r_offset */ | 
|  | ldr 	r4, [r3] | 
|  |  | 
|  | /* Skip adding offset if address is < lower limit */ | 
|  | cmp	r4, r6 | 
|  | blo	2f | 
|  |  | 
|  | /* Skip adding offset if address is > upper limit */ | 
|  | cmp	r4, r7 | 
|  | bhi	2f | 
|  |  | 
|  | add 	r4, r0, r4 | 
|  | str	r4, [r3] | 
|  |  | 
|  | 2:	add	r1, r1, #8 | 
|  | cmp	r1, r2 | 
|  | blo	1b | 
|  | bx	lr | 
|  | endfunc fixup_gdt_reloc |