; Mirror of https://github.com/acidanthera/audk.git (NASM source, 85 lines, 2.7 KiB)
;------------------------------------------------------------------------------
;
; Copyright (c) 2006, Intel Corporation. All rights reserved.<BR>
; This program and the accompanying materials
; are licensed and made available under the terms and conditions of the BSD License
; which accompanies this distribution. The full text of the license may be found at
; http://opensource.org/licenses/bsd-license.php.
;
; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
;
; Module Name:
;
;   CopyMem.nasm
;
; Abstract:
;
;   CopyMem function
;
; Notes:
;
;------------------------------------------------------------------------------
|
|
|
|
SECTION .text
|
|
|
|
;------------------------------------------------------------------------------
|
|
; VOID *
|
|
; InternalMemCopyMem (
|
|
; IN VOID *Destination,
|
|
; IN VOID *Source,
|
|
; IN UINTN Count
|
|
; );
|
|
;------------------------------------------------------------------------------
|
|
global ASM_PFX(InternalMemCopyMem)
|
|
ASM_PFX(InternalMemCopyMem):
|
|
push esi
|
|
push edi
|
|
mov esi, [esp + 16] ; esi <- Source
|
|
mov edi, [esp + 12] ; edi <- Destination
|
|
mov edx, [esp + 20] ; edx <- Count
|
|
lea eax, [esi + edx - 1] ; eax <- End of Source
|
|
cmp esi, edi
|
|
jae .0
|
|
cmp eax, edi ; Overlapped?
|
|
jae @CopyBackward ; Copy backward if overlapped
|
|
.0:
|
|
xor ecx, ecx
|
|
sub ecx, edi
|
|
and ecx, 15 ; ecx + edi aligns on 16-byte boundary
|
|
jz .1
|
|
cmp ecx, edx
|
|
cmova ecx, edx
|
|
sub edx, ecx ; edx <- remaining bytes to copy
|
|
rep movsb
|
|
.1:
|
|
mov ecx, edx
|
|
and edx, 15
|
|
shr ecx, 4 ; ecx <- # of DQwords to copy
|
|
jz @CopyBytes
|
|
add esp, -16
|
|
movdqu [esp], xmm0 ; save xmm0
|
|
.2:
|
|
movdqu xmm0, [esi] ; esi may not be 16-bytes aligned
|
|
movntdq [edi], xmm0 ; edi should be 16-bytes aligned
|
|
add esi, 16
|
|
add edi, 16
|
|
loop .2
|
|
mfence
|
|
movdqu xmm0, [esp] ; restore xmm0
|
|
add esp, 16 ; stack cleanup
|
|
jmp @CopyBytes
|
|
@CopyBackward:
|
|
mov esi, eax ; esi <- Last byte in Source
|
|
lea edi, [edi + edx - 1] ; edi <- Last byte in Destination
|
|
std
|
|
@CopyBytes:
|
|
mov ecx, edx
|
|
rep movsb
|
|
cld
|
|
mov eax, [esp + 12] ; eax <- Destination as return value
|
|
pop edi
|
|
pop esi
|
|
ret
|
|
|