;------------------------------------------------------------------------------ ; ; Copyright (c) 2006, Intel Corporation. All rights reserved.
; SPDX-License-Identifier: BSD-2-Clause-Patent ; ; Module Name: ; ; CopyMem.nasm ; ; Abstract: ; ; CopyMem function ; ; Notes: ; ;------------------------------------------------------------------------------ SECTION .text ;------------------------------------------------------------------------------ ; VOID * ; InternalMemCopyMem( ; IN VOID *Destination, ; IN VOID *Source, ; IN UINTN Count ; ); ;------------------------------------------------------------------------------ global ASM_PFX(InternalMemCopyMem) ASM_PFX(InternalMemCopyMem): push esi push edi mov esi, [esp + 16] ; esi <- Source mov edi, [esp + 12] ; edi <- Destination mov edx, [esp + 20] ; edx <- Count lea eax, [esi + edx - 1] ; eax <- End of Source cmp esi, edi jae .0 cmp eax, edi ; Overlapped? jae @CopyBackward ; Copy backward if overlapped .0: xor ecx, ecx sub ecx, edi and ecx, 15 ; ecx + edi aligns on 16-byte boundary jz .1 cmp ecx, edx cmova ecx, edx sub edx, ecx ; edx <- remaining bytes to copy rep movsb .1: mov ecx, edx and edx, 15 shr ecx, 4 ; ecx <- # of DQwords to copy jz @CopyBytes add esp, -16 movdqu [esp], xmm0 ; save xmm0 .2: movdqu xmm0, [esi] ; esi may not be 16-bytes aligned movntdq [edi], xmm0 ; edi should be 16-bytes aligned add esi, 16 add edi, 16 loop .2 mfence movdqu xmm0, [esp] ; restore xmm0 add esp, 16 ; stack cleanup jmp @CopyBytes @CopyBackward: mov esi, eax ; esi <- Last byte in Source lea edi, [edi + edx - 1] ; edi <- Last byte in Destination std @CopyBytes: mov ecx, edx rep movsb cld mov eax, [esp + 12] ; eax <- Destination as return value pop edi pop esi ret