https://bugzilla.tianocore.org/show_bug.cgi?id=1373 Replace BSD 2-Clause License with BSD+Patent License. This change is based on the following emails: https://lists.01.org/pipermail/edk2-devel/2019-February/036260.html https://lists.01.org/pipermail/edk2-devel/2018-October/030385.html RFCs with detailed process for the license change: V3: https://lists.01.org/pipermail/edk2-devel/2019-March/038116.html V2: https://lists.01.org/pipermail/edk2-devel/2019-March/037669.html V1: https://lists.01.org/pipermail/edk2-devel/2019-March/037500.html Contributed-under: TianoCore Contribution Agreement 1.1 Signed-off-by: Michael D Kinney <michael.d.kinney@intel.com> Reviewed-by: Liming Gao <liming.gao@intel.com>
		
			
				
	
	
		
			171 lines
		
	
	
		
			4.3 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
			
		
		
	
	
			171 lines
		
	
	
		
			4.3 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
#------------------------------------------------------------------------------
 | 
						|
#
 | 
						|
# CopyMem() worker for ARM
 | 
						|
#
 | 
						|
# This file started out as C code that did 64 bit moves if the buffer was
 | 
						|
# 32-bit aligned, else it does a byte copy. It also does a byte copy for
 | 
						|
# any trailing bytes. It was updated to do 32-byte copies using stm/ldm.
 | 
						|
#
 | 
						|
# Copyright (c) 2008 - 2010, Apple Inc. All rights reserved.<BR>
 | 
						|
# Copyright (c) 2016, Linaro Ltd. All rights reserved.<BR>
 | 
						|
# SPDX-License-Identifier: BSD-2-Clause-Patent
 | 
						|
#
 | 
						|
#------------------------------------------------------------------------------
 | 
						|
 | 
						|
    .text
 | 
						|
    .thumb
 | 
						|
    .syntax unified
 | 
						|
 | 
						|
/**
 | 
						|
  Copy Length bytes from Source to Destination. Overlap is OK.
 | 
						|
 | 
						|
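  This implementation copies 32 bytes at a time with ldm/stm while at least
  32 bytes remain and both buffer pointers pass the 16-byte alignment test,
  and copies one byte at a time otherwise. When Destination lies at or after
  Source and within Length bytes of it, the copy runs backward from the end
  of both buffers so that overlapping regions are handled correctly.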
 | 
						|
 | 
						|
  @param  Destination Target of copy
 | 
						|
  @param  Source      Place to copy from
 | 
						|
  @param  Length      Number of bytes to copy
 | 
						|
 | 
						|
  @return Destination
 | 
						|
 | 
						|
 | 
						|
VOID *
 | 
						|
EFIAPI
 | 
						|
InternalMemCopyMem (
 | 
						|
  OUT     VOID                      *DestinationBuffer,
 | 
						|
  IN      CONST VOID                *SourceBuffer,
 | 
						|
  IN      UINTN                     Length
 | 
						|
  )
 | 
						|
**/
 | 
						|
    .type   ASM_PFX(InternalMemCopyMem), %function
ASM_GLOBAL ASM_PFX(InternalMemCopyMem)
ASM_PFX(InternalMemCopyMem):
    // In:  r0 = DestinationBuffer, r1 = SourceBuffer, r2 = Length
    // Out: r0 = DestinationBuffer
    //
    // lr is saved because r14 is reused below as the source cursor; the
    // matching pop at memcopy_end loads the saved lr straight into pc.
    push    {r4-r11, lr}

    // Register roles for the rest of the routine:
    //   r11      = original destination (moved back into r0 at memcopy_end)
    //   r10      = destination cursor
    //   r14      = source cursor
    //   r12      = number of bytes still to copy
    //   r0       = 1 while the 32-byte ldm/stm path may be used, 0 for byte copy
    //   r2-r9    = 32-byte transfer buffer (r2/r3 also serve as scratch)
    mov     r11, r0
    mov     r10, r0
    mov     r12, r2
    mov     r14, r1

    // Nothing to copy. Without this guard, Length == 0 combined with
    // Destination == Source reaches the backward byte loop, which decrements
    // the remaining count before testing it, so the count wraps around from 0.
    cmp     r2, #0
    beq     memcopy_end

    cmp     r11, r1
    // If (dest < source) a forward copy is always safe
    bcc     memcopy_check_optim_default

    // If (length < dest - source) the buffers do not overlap: forward copy
    rsb     r3, r1, r11
    cmp     r12, r3
    bcc     memcopy_check_optim_default
    // Otherwise dest lies within [source, source + length]: copy backward
    b       memcopy_check_optim_overlap

memcopy_check_optim_default:
    // Decide whether the forward copy can use the optimized path:
    // (length >= 32) && destination 16-byte aligned && source 16-byte aligned.
    // The result is left in r0 (1 = optimized path, 0 = byte copy).
    tst     r0, #0xF
    it      ne
    movne.n r0, #0
    bne     memcopy_default
    // r3 = 1 if the source is 16-byte aligned, else 0
    tst     r1, #0xF
    it      ne
    movne.n r3, #0
    it      eq
    moveq.n r3, #1
    cmp     r2, #31
    it      ls
    movls.n r0, #0
    bls     memcopy_default
    and     r0, r3, #1
    b       memcopy_default

memcopy_check_optim_overlap:
    // r10 = dest_end, r14 = source_end (one past the last byte of each buffer)
    add     r10, r11, r12
    add     r14, r12, r1

    // Decide whether the backward copy can use the optimized path:
    // (length >= 32) && dest_end 16-byte aligned && source_end 16-byte aligned.
    // The result is left in r0 (1 = optimized path, 0 = byte copy).
    cmp     r2, #31
    it      ls
    movls.n r0, #0
    it      hi
    movhi.n r0, #1
    tst     r10, #0xF
    it      ne
    movne.n r0, #0
    tst     r14, #0xF
    it      ne
    movne.n r0, #0
    b       memcopy_overlapped

memcopy_overlapped_non_optim:
    // Backward byte copy; requires r12 != 0 on entry.
    // We read 1 byte from the end of the source buffer
    sub     r3, r14, #1
    sub     r12, r12, #1
    ldrb    r3, [r3, #0]
    sub     r2, r10, #1
    // Flags set here are consumed by the bne below; the sub/strb
    // instructions in between do not modify them.
    cmp     r12, #0
    // We write 1 byte at the end of the dest buffer
    sub     r10, r10, #1
    sub     r14, r14, #1
    strb    r3, [r2, #0]
    bne     memcopy_overlapped_non_optim
    b       memcopy_end

// r10 = dest_end, r14 = source_end
memcopy_overlapped:
    // Are we in the optimized case ?
    cmp     r0, #0
    beq     memcopy_overlapped_non_optim

    // Optimized Overlapped - Read 32 bytes
    sub     r14, r14, #32
    sub     r12, r12, #32
    cmp     r12, #31
    ldmia   r14, {r2-r9}

    // If fewer than 32 bytes remain, switch to byte copy for the rest
    it      ls
    movls.n r0, #0

    cmp     r12, #0

    // Optimized Overlapped - Write 32 bytes
    sub     r10, r10, #32
    stmia   r10, {r2-r9}

    // while (length != 0)
    bne     memcopy_overlapped
    b       memcopy_end

memcopy_default_non_optim:
    // Forward byte copy; falls through to the length test in memcopy_default
    ldrb    r3, [r14], #1
    sub     r12, r12, #1
    strb    r3, [r10], #1

memcopy_default:
    cmp     r12, #0
    beq     memcopy_end

// r10 = dest, r14 = source
memcopy_default_loop:
    cmp     r0, #0
    beq     memcopy_default_non_optim

    // Optimized memcopy - Read 32 Bytes
    sub     r12, r12, #32
    cmp     r12, #31
    ldmia   r14!, {r2-r9}

    // If fewer than 32 bytes remain, switch to byte copy for the rest
    it      ls
    movls.n r0, #0

    cmp     r12, #0

    // Optimized memcopy - Write 32 Bytes
    stmia   r10!, {r2-r9}

    // while (length != 0)
    bne     memcopy_default_loop

memcopy_end:
    // Return the original destination pointer
    mov     r0, r11
    pop     {r4-r11, pc}
 |