MdePkg BaseMemoryLibSse2: Add SSE2 implementation of API IsZeroBuffer()
Add the implementation of API IsZeroBuffer() via assembly in BaseMemoryLibSse2. The assembly code uses SSE2 XMM registers and related instructions. Cc: Michael D Kinney <michael.d.kinney@intel.com> Cc: Liming Gao <liming.gao@intel.com> Cc: Jiewen Yao <jiewen.yao@intel.com> Contributed-under: TianoCore Contribution Agreement 1.0 Signed-off-by: Hao Wu <hao.a.wu@intel.com> Reviewed-by: Liming Gao <liming.gao@intel.com>
This commit is contained in:
74
MdePkg/Library/BaseMemoryLibSse2/Ia32/IsZeroBuffer.nasm
Normal file
74
MdePkg/Library/BaseMemoryLibSse2/Ia32/IsZeroBuffer.nasm
Normal file
@@ -0,0 +1,74 @@
|
||||
;------------------------------------------------------------------------------
|
||||
;
|
||||
; Copyright (c) 2016, Intel Corporation. All rights reserved.<BR>
|
||||
; This program and the accompanying materials
|
||||
; are licensed and made available under the terms and conditions of the BSD License
|
||||
; which accompanies this distribution. The full text of the license may be found at
|
||||
; http://opensource.org/licenses/bsd-license.php.
|
||||
;
|
||||
; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
|
||||
; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
|
||||
;
|
||||
; Module Name:
|
||||
;
|
||||
; IsZeroBuffer.nasm
|
||||
;
|
||||
; Abstract:
|
||||
;
|
||||
; IsZeroBuffer function
|
||||
;
|
||||
; Notes:
|
||||
;
|
||||
;------------------------------------------------------------------------------
|
||||
|
||||
SECTION .text
|
||||
|
||||
;------------------------------------------------------------------------------
;  BOOLEAN
;  EFIAPI
;  InternalMemIsZeroBuffer (
;    IN CONST VOID  *Buffer,
;    IN UINTN       Length
;    );
;
;  Returns 1 (TRUE) when every one of the Length bytes starting at Buffer is
;  zero, and 0 (FALSE) as soon as a non-zero byte is found. A Length of 0
;  yields TRUE.
;
;  The buffer is scanned in three phases:
;    1. head   - byte-wise until edi reaches a 16-byte boundary (or Length
;                is exhausted, whichever comes first)
;    2. blocks - 16 bytes at a time with SSE2 (pcmpeqb / pmovmskb)
;    3. tail   - byte-wise over the remaining (Length mod 16) bytes
;
;  In:       stack arguments; after the "push edi" below they are found at
;            [esp + 8] = Buffer and [esp + 12] = Length
;  Out:      eax = 1 (all zero) or 0 (non-zero byte found)
;  Clobbers: eax, ecx, edx, xmm0, flags (edi is saved and restored)
;  Assumes:  the direction flag is clear so that scasb walks upward; it is
;            not set here - NOTE(review): confirm against the calling
;            convention in use.
;------------------------------------------------------------------------------
global ASM_PFX(InternalMemIsZeroBuffer)
ASM_PFX(InternalMemIsZeroBuffer):
    push    edi
    mov     edi, [esp + 8]              ; edi <- Buffer
    mov     edx, [esp + 12]             ; edx <- Length

    ;
    ; Phase 1: bytes in front of the next 16-byte boundary.
    ;
    xor     ecx, ecx                    ; ecx <- 0
    sub     ecx, edi
    and     ecx, 15                     ; ecx + edi aligns on 16-byte boundary
    jz      .Is16BytesZero              ; already aligned, no head to scan
    cmp     ecx, edx
    cmova   ecx, edx                    ; ecx <- min (ecx, Length), unsigned
    sub     edx, ecx                    ; edx <- bytes left after the head
    xor     eax, eax                    ; al <- 0 to compare with, also set ZF
                                        ; so a zero-count scan falls through
    repe    scasb
    jnz     .ReturnFalse                ; ZF=0 means non-zero element found

    ;
    ; Phase 2: whole 16-byte blocks; edi is 16-byte aligned whenever at least
    ; one block remains, so the memory operand of pcmpeqb is aligned.
    ;
.Is16BytesZero:
    mov     ecx, edx
    and     edx, 15                     ; edx <- tail byte count
    shr     ecx, 4                      ; ecx <- number of 16-byte blocks
    jz      .IsBytesZero                ; no full block to check
.CheckBlock:
    pxor    xmm0, xmm0                  ; xmm0 <- 0
    pcmpeqb xmm0, [edi]                 ; 0xFF in each byte lane that is zero
    pmovmskb eax, xmm0                  ; eax <- one bit per byte lane
    cmp     eax, 0xffff                 ; all 16 lanes must have matched
    jnz     .ReturnFalse
    add     edi, 16
    dec     ecx                         ; ecx > 0 here; dec/jnz replaces the
    jnz     .CheckBlock                 ; legacy "loop" instruction

    ;
    ; Phase 3: remaining bytes after the last full block.
    ;
.IsBytesZero:
    mov     ecx, edx
    xor     eax, eax                    ; al <- 0 to compare with, also set ZF
    repe    scasb
    jnz     .ReturnFalse                ; ZF=0 means non-zero element found

    pop     edi
    mov     eax, 1                      ; return TRUE
    ret

.ReturnFalse:
    pop     edi
    xor     eax, eax                    ; return FALSE
    ret
|
||||
|
Reference in New Issue
Block a user