Home | History | Annotate | Download | only in Ia32
      1 ;------------------------------------------------------------------------------
      2 ;
      3 ; Copyright (c) 2006, Intel Corporation. All rights reserved.<BR>
      4 ; This program and the accompanying materials
      5 ; are licensed and made available under the terms and conditions of the BSD License
      6 ; which accompanies this distribution.  The full text of the license may be found at
      7 ; http://opensource.org/licenses/bsd-license.php.
      8 ;
      9 ; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
     10 ; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
     11 ;
     12 ; Module Name:
     13 ;
     14 ;   CopyMem.nasm
     15 ;
     16 ; Abstract:
     17 ;
     18 ;   CopyMem function
     19 ;
     20 ; Notes:
     21 ;
     22 ;------------------------------------------------------------------------------
     23 
     24     SECTION .text
     25 
     26 ;------------------------------------------------------------------------------
     27 ;  VOID *
     28 ;  InternalMemCopyMem (
     29 ;    IN VOID   *Destination,
     30 ;    IN VOID   *Source,
     31 ;    IN UINTN  Count
     32 ;    );
     33 ;------------------------------------------------------------------------------
     34 global ASM_PFX(InternalMemCopyMem)
     35 ASM_PFX(InternalMemCopyMem):
     36     push    esi
     37     push    edi
     38     mov     esi, [esp + 16]             ; esi <- Source
     39     mov     edi, [esp + 12]             ; edi <- Destination
     40     mov     edx, [esp + 20]             ; edx <- Count
     41     lea     eax, [esi + edx - 1]        ; eax <- End of Source
     42     cmp     esi, edi
     43     jae     .0
     44     cmp     eax, edi                    ; Overlapped?
     45     jae     @CopyBackward               ; Copy backward if overlapped
     46 .0:
     47     xor     ecx, ecx
     48     sub     ecx, edi
     49     and     ecx, 15                     ; ecx + edi aligns on 16-byte boundary
     50     jz      .1
     51     cmp     ecx, edx
     52     cmova   ecx, edx
     53     sub     edx, ecx                    ; edx <- remaining bytes to copy
     54     rep     movsb
     55 .1:
     56     mov     ecx, edx
     57     and     edx, 15
     58     shr     ecx, 4                      ; ecx <- # of DQwords to copy
     59     jz      @CopyBytes
     60     add     esp, -16
     61     movdqu  [esp], xmm0                 ; save xmm0
     62 .2:
     63     movdqu  xmm0, [esi]                 ; esi may not be 16-bytes aligned
     64     movntdq [edi], xmm0                 ; edi should be 16-bytes aligned
     65     add     esi, 16
     66     add     edi, 16
     67     loop    .2
     68     mfence
     69     movdqu  xmm0, [esp]                 ; restore xmm0
     70     add     esp, 16                     ; stack cleanup
     71     jmp     @CopyBytes
     72 @CopyBackward:
     73     mov     esi, eax                    ; esi <- Last byte in Source
     74     lea     edi, [edi + edx - 1]        ; edi <- Last byte in Destination
     75     std
     76 @CopyBytes:
     77     mov     ecx, edx
     78     rep     movsb
     79     cld
     80     mov     eax, [esp + 12]             ; eax <- Destination as return value
     81     pop     edi
     82     pop     esi
     83     ret
     84 
     85