mirror of https://github.com/acidanthera/audk.git
74 lines
2.4 KiB
ArmAsm
74 lines
2.4 KiB
ArmAsm
#
|
|
# ConvertAsm.py: Automatically generated from SetMem.asm
|
|
#
|
|
#------------------------------------------------------------------------------
|
|
#
|
|
# Copyright (c) 2006 - 2008, Intel Corporation
|
|
# All rights reserved. This program and the accompanying materials
|
|
# are licensed and made available under the terms and conditions of the BSD License
|
|
# which accompanies this distribution. The full text of the license may be found at
|
|
# http://opensource.org/licenses/bsd-license.php
|
|
#
|
|
# THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
|
|
#
|
|
# Module Name:
|
|
#
|
|
# SetMem.S
|
|
#
|
|
# Abstract:
|
|
#
|
|
# SetMem function
|
|
#
|
|
# Notes:
|
|
#
|
|
#------------------------------------------------------------------------------
|
|
|
|
|
|
#------------------------------------------------------------------------------
|
|
# VOID *
|
|
# EFIAPI
|
|
# InternalMemSetMem (
|
|
# IN VOID *Buffer,
|
|
# IN UINTN Count,
|
|
# IN UINT8 Value
|
|
# )
|
|
#------------------------------------------------------------------------------
|
|
.intel_syntax noprefix
|
|
ASM_GLOBAL ASM_PFX(InternalMemSetMem)
|
|
ASM_PFX(InternalMemSetMem):
|
|
push rdi
|
|
mov rdi, rcx # rdi <- Buffer
|
|
mov al, r8b # al <- Value
|
|
mov r9, rdi # r9 <- Buffer as return value
|
|
xor rcx, rcx
|
|
sub rcx, rdi
|
|
and rcx, 15 # rcx + rdi aligns on 16-byte boundary
|
|
jz L0
|
|
cmp rcx, rdx
|
|
cmova rcx, rdx
|
|
sub rdx, rcx
|
|
rep stosb
|
|
L0:
|
|
mov rcx, rdx
|
|
and rdx, 15
|
|
shr rcx, 4
|
|
jz L_SetBytes
|
|
mov ah, al # ax <- Value repeats twice
|
|
movdqa [rsp + 0x10], xmm0 # save xmm0
|
|
movd xmm0, eax # xmm0[0..16] <- Value repeats twice
|
|
pshuflw xmm0, xmm0, 0 # xmm0[0..63] <- Value repeats 8 times
|
|
movlhps xmm0, xmm0 # xmm0 <- Value repeats 16 times
|
|
L1:
|
|
movntdq [rdi], xmm0 # rdi should be 16-byte aligned
|
|
add rdi, 16
|
|
loop L1
|
|
mfence
|
|
movdqa xmm0, [rsp + 0x10] # restore xmm0
|
|
L_SetBytes:
|
|
mov ecx, edx # high 32 bits of rcx are always zero
|
|
rep stosb
|
|
mov rax, r9 # rax <- Return value
|
|
pop rdi
|
|
ret
|