mirror of https://github.com/acidanthera/audk.git
MdePkg BaseMemoryLibSse2: Add SSE2 implementation of API IsZeroBuffer()
Add the implementation of API IsZeroBuffer() via assembly in BaseMemoryLibSse2. The assembly codes use SSE2 XMM registers and related instructions. Cc: Michael D Kinney <michael.d.kinney@intel.com> Cc: Liming Gao <liming.gao@intel.com> Cc: Jiewen Yao <jiewen.yao@intel.com> Contributed-under: TianoCore Contribution Agreement 1.0 Signed-off-by: Hao Wu <hao.a.wu@intel.com> Reviewed-by: Liming Gao <liming.gao@intel.com>
This commit is contained in:
parent
02b5cf7fb1
commit
102b4c7cdd
|
@ -3,7 +3,7 @@
|
||||||
#
|
#
|
||||||
# Base Memory Library that uses SSE2 registers for high performance.
|
# Base Memory Library that uses SSE2 registers for high performance.
|
||||||
#
|
#
|
||||||
# Copyright (c) 2007 - 2014, Intel Corporation. All rights reserved.<BR>
|
# Copyright (c) 2007 - 2016, Intel Corporation. All rights reserved.<BR>
|
||||||
#
|
#
|
||||||
# This program and the accompanying materials
|
# This program and the accompanying materials
|
||||||
# are licensed and made available under the terms and conditions of the BSD License
|
# are licensed and made available under the terms and conditions of the BSD License
|
||||||
|
@ -42,6 +42,7 @@
|
||||||
SetMem16Wrapper.c
|
SetMem16Wrapper.c
|
||||||
SetMemWrapper.c
|
SetMemWrapper.c
|
||||||
CopyMemWrapper.c
|
CopyMemWrapper.c
|
||||||
|
IsZeroBufferWrapper.c
|
||||||
MemLibGuid.c
|
MemLibGuid.c
|
||||||
|
|
||||||
[Sources.Ia32]
|
[Sources.Ia32]
|
||||||
|
@ -89,6 +90,7 @@
|
||||||
Ia32/SetMem.asm
|
Ia32/SetMem.asm
|
||||||
Ia32/CopyMem.nasm
|
Ia32/CopyMem.nasm
|
||||||
Ia32/CopyMem.asm
|
Ia32/CopyMem.asm
|
||||||
|
Ia32/IsZeroBuffer.nasm
|
||||||
|
|
||||||
[Sources.X64]
|
[Sources.X64]
|
||||||
X64/ScanMem64.nasm
|
X64/ScanMem64.nasm
|
||||||
|
@ -135,6 +137,7 @@
|
||||||
X64/SetMem.S
|
X64/SetMem.S
|
||||||
X64/CopyMem.nasm
|
X64/CopyMem.nasm
|
||||||
X64/CopyMem.S
|
X64/CopyMem.S
|
||||||
|
X64/IsZeroBuffer.nasm
|
||||||
|
|
||||||
[Packages]
|
[Packages]
|
||||||
MdePkg/MdePkg.dec
|
MdePkg/MdePkg.dec
|
||||||
|
|
|
@ -0,0 +1,74 @@
|
||||||
|
;------------------------------------------------------------------------------
|
||||||
|
;
|
||||||
|
; Copyright (c) 2016, Intel Corporation. All rights reserved.<BR>
|
||||||
|
; This program and the accompanying materials
|
||||||
|
; are licensed and made available under the terms and conditions of the BSD License
|
||||||
|
; which accompanies this distribution. The full text of the license may be found at
|
||||||
|
; http://opensource.org/licenses/bsd-license.php.
|
||||||
|
;
|
||||||
|
; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
|
||||||
|
; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
|
||||||
|
;
|
||||||
|
; Module Name:
|
||||||
|
;
|
||||||
|
; IsZeroBuffer.nasm
|
||||||
|
;
|
||||||
|
; Abstract:
|
||||||
|
;
|
||||||
|
; IsZeroBuffer function
|
||||||
|
;
|
||||||
|
; Notes:
|
||||||
|
;
|
||||||
|
;------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
SECTION .text
|
||||||
|
|
||||||
|
;------------------------------------------------------------------------------
|
||||||
|
; BOOLEAN
|
||||||
|
; EFIAPI
|
||||||
|
; InternalMemIsZeroBuffer (
|
||||||
|
; IN CONST VOID *Buffer,
|
||||||
|
; IN UINTN Length
|
||||||
|
; );
|
||||||
|
;------------------------------------------------------------------------------
|
||||||
|
global ASM_PFX(InternalMemIsZeroBuffer)
|
||||||
|
ASM_PFX(InternalMemIsZeroBuffer):
|
||||||
|
push edi
|
||||||
|
mov edi, [esp + 8] ; edi <- Buffer
|
||||||
|
mov edx, [esp + 12] ; edx <- Length
|
||||||
|
xor ecx, ecx ; ecx <- 0
|
||||||
|
sub ecx, edi
|
||||||
|
and ecx, 15 ; ecx + edi aligns on 16-byte boundary
|
||||||
|
jz @Is16BytesZero
|
||||||
|
cmp ecx, edx
|
||||||
|
cmova ecx, edx ; bytes before the 16-byte boundary
|
||||||
|
sub edx, ecx
|
||||||
|
xor eax, eax ; eax <- 0, also set ZF
|
||||||
|
repe scasb
|
||||||
|
jnz @ReturnFalse ; ZF=0 means non-zero element found
|
||||||
|
@Is16BytesZero:
|
||||||
|
mov ecx, edx
|
||||||
|
and edx, 15
|
||||||
|
shr ecx, 4
|
||||||
|
jz @IsBytesZero
|
||||||
|
.0:
|
||||||
|
pxor xmm0, xmm0 ; xmm0 <- 0
|
||||||
|
pcmpeqb xmm0, [edi] ; check zero for 16 bytes
|
||||||
|
pmovmskb eax, xmm0 ; eax <- compare results
|
||||||
|
cmp eax, 0xffff
|
||||||
|
jnz @ReturnFalse
|
||||||
|
add edi, 16
|
||||||
|
loop .0
|
||||||
|
@IsBytesZero:
|
||||||
|
mov ecx, edx
|
||||||
|
xor eax, eax ; eax <- 0, also set ZF
|
||||||
|
repe scasb
|
||||||
|
jnz @ReturnFalse ; ZF=0 means non-zero element found
|
||||||
|
pop edi
|
||||||
|
mov eax, 1 ; return TRUE
|
||||||
|
ret
|
||||||
|
@ReturnFalse:
|
||||||
|
pop edi
|
||||||
|
xor eax, eax
|
||||||
|
ret ; return FALSE
|
||||||
|
|
|
@ -0,0 +1,54 @@
|
||||||
|
/** @file
|
||||||
|
Implementation of IsZeroBuffer function.
|
||||||
|
|
||||||
|
The following BaseMemoryLib instances contain the same copy of this file:
|
||||||
|
|
||||||
|
BaseMemoryLib
|
||||||
|
BaseMemoryLibMmx
|
||||||
|
BaseMemoryLibSse2
|
||||||
|
BaseMemoryLibRepStr
|
||||||
|
BaseMemoryLibOptDxe
|
||||||
|
BaseMemoryLibOptPei
|
||||||
|
PeiMemoryLib
|
||||||
|
UefiMemoryLib
|
||||||
|
|
||||||
|
Copyright (c) 2016, Intel Corporation. All rights reserved.<BR>
|
||||||
|
This program and the accompanying materials
|
||||||
|
are licensed and made available under the terms and conditions of the BSD License
|
||||||
|
which accompanies this distribution. The full text of the license may be found at
|
||||||
|
http://opensource.org/licenses/bsd-license.php
|
||||||
|
|
||||||
|
THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
|
||||||
|
|
||||||
|
**/
|
||||||
|
|
||||||
|
#include "MemLibInternals.h"
|
||||||
|
|
||||||
|
/**
|
||||||
|
Checks if the contents of a buffer are all zeros.
|
||||||
|
|
||||||
|
This function checks whether the contents of a buffer are all zeros. If the
|
||||||
|
contents are all zeros, return TRUE. Otherwise, return FALSE.
|
||||||
|
|
||||||
|
If Length > 0 and Buffer is NULL, then ASSERT().
|
||||||
|
If Length is greater than (MAX_ADDRESS - Buffer + 1), then ASSERT().
|
||||||
|
|
||||||
|
@param Buffer The pointer to the buffer to be checked.
|
||||||
|
@param Length The size of the buffer (in bytes) to be checked.
|
||||||
|
|
||||||
|
@retval TRUE Contents of the buffer are all zeros.
|
||||||
|
@retval FALSE Contents of the buffer are not all zeros.
|
||||||
|
|
||||||
|
**/
|
||||||
|
BOOLEAN
|
||||||
|
EFIAPI
|
||||||
|
IsZeroBuffer (
|
||||||
|
IN CONST VOID *Buffer,
|
||||||
|
IN UINTN Length
|
||||||
|
)
|
||||||
|
{
|
||||||
|
ASSERT (!(Buffer == NULL && Length > 0));
|
||||||
|
ASSERT ((Length - 1) <= (MAX_ADDRESS - (UINTN)Buffer));
|
||||||
|
return InternalMemIsZeroBuffer (Buffer, Length);
|
||||||
|
}
|
|
@ -9,7 +9,7 @@
|
||||||
BaseMemoryLibOptDxe
|
BaseMemoryLibOptDxe
|
||||||
BaseMemoryLibOptPei
|
BaseMemoryLibOptPei
|
||||||
|
|
||||||
Copyright (c) 2006 - 2010, Intel Corporation. All rights reserved.<BR>
|
Copyright (c) 2006 - 2016, Intel Corporation. All rights reserved.<BR>
|
||||||
This program and the accompanying materials
|
This program and the accompanying materials
|
||||||
are licensed and made available under the terms and conditions of the BSD License
|
are licensed and made available under the terms and conditions of the BSD License
|
||||||
which accompanies this distribution. The full text of the license may be found at
|
which accompanies this distribution. The full text of the license may be found at
|
||||||
|
@ -231,4 +231,21 @@ InternalMemScanMem64 (
|
||||||
IN UINT64 Value
|
IN UINT64 Value
|
||||||
);
|
);
|
||||||
|
|
||||||
|
/**
|
||||||
|
Checks whether the contents of a buffer are all zeros.
|
||||||
|
|
||||||
|
@param Buffer The pointer to the buffer to be checked.
|
||||||
|
@param Length The size of the buffer (in bytes) to be checked.
|
||||||
|
|
||||||
|
@retval TRUE Contents of the buffer are all zeros.
|
||||||
|
@retval FALSE Contents of the buffer are not all zeros.
|
||||||
|
|
||||||
|
**/
|
||||||
|
BOOLEAN
|
||||||
|
EFIAPI
|
||||||
|
InternalMemIsZeroBuffer (
|
||||||
|
IN CONST VOID *Buffer,
|
||||||
|
IN UINTN Length
|
||||||
|
);
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -0,0 +1,76 @@
|
||||||
|
;------------------------------------------------------------------------------
|
||||||
|
;
|
||||||
|
; Copyright (c) 2016, Intel Corporation. All rights reserved.<BR>
|
||||||
|
; This program and the accompanying materials
|
||||||
|
; are licensed and made available under the terms and conditions of the BSD License
|
||||||
|
; which accompanies this distribution. The full text of the license may be found at
|
||||||
|
; http://opensource.org/licenses/bsd-license.php.
|
||||||
|
;
|
||||||
|
; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
|
||||||
|
; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
|
||||||
|
;
|
||||||
|
; Module Name:
|
||||||
|
;
|
||||||
|
; IsZeroBuffer.nasm
|
||||||
|
;
|
||||||
|
; Abstract:
|
||||||
|
;
|
||||||
|
; IsZeroBuffer function
|
||||||
|
;
|
||||||
|
; Notes:
|
||||||
|
;
|
||||||
|
;------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
DEFAULT REL
|
||||||
|
SECTION .text
|
||||||
|
|
||||||
|
;------------------------------------------------------------------------------
|
||||||
|
; BOOLEAN
|
||||||
|
; EFIAPI
|
||||||
|
; InternalMemIsZeroBuffer (
|
||||||
|
; IN CONST VOID *Buffer,
|
||||||
|
; IN UINTN Length
|
||||||
|
; );
|
||||||
|
;------------------------------------------------------------------------------
|
||||||
|
global ASM_PFX(InternalMemIsZeroBuffer)
|
||||||
|
ASM_PFX(InternalMemIsZeroBuffer):
|
||||||
|
push rdi
|
||||||
|
mov rdi, rcx ; rdi <- Buffer
|
||||||
|
xor rcx, rcx ; rcx <- 0
|
||||||
|
sub rcx, rdi
|
||||||
|
and rcx, 15 ; rcx + rdi aligns on 16-byte boundary
|
||||||
|
jz @Is16BytesZero
|
||||||
|
cmp rcx, rdx ; Length already in rdx
|
||||||
|
cmova rcx, rdx ; bytes before the 16-byte boundary
|
||||||
|
sub rdx, rcx
|
||||||
|
xor rax, rax ; rax <- 0, also set ZF
|
||||||
|
repe scasb
|
||||||
|
jnz @ReturnFalse ; ZF=0 means non-zero element found
|
||||||
|
@Is16BytesZero:
|
||||||
|
mov rcx, rdx
|
||||||
|
and rdx, 15
|
||||||
|
shr rcx, 4
|
||||||
|
jz @IsBytesZero
|
||||||
|
.0:
|
||||||
|
pxor xmm0, xmm0 ; xmm0 <- 0
|
||||||
|
pcmpeqb xmm0, [rdi] ; check zero for 16 bytes
|
||||||
|
pmovmskb eax, xmm0 ; eax <- compare results
|
||||||
|
; nasm doesn't support 64-bit destination
|
||||||
|
; for pmovmskb
|
||||||
|
cmp eax, 0xffff
|
||||||
|
jnz @ReturnFalse
|
||||||
|
add rdi, 16
|
||||||
|
loop .0
|
||||||
|
@IsBytesZero:
|
||||||
|
mov rcx, rdx
|
||||||
|
xor rax, rax ; rax <- 0, also set ZF
|
||||||
|
repe scasb
|
||||||
|
jnz @ReturnFalse ; ZF=0 means non-zero element found
|
||||||
|
pop rdi
|
||||||
|
mov rax, 1 ; return TRUE
|
||||||
|
ret
|
||||||
|
@ReturnFalse:
|
||||||
|
pop rdi
|
||||||
|
xor rax, rax
|
||||||
|
ret ; return FALSE
|
||||||
|
|
Loading…
Reference in New Issue