summaryrefslogtreecommitdiffstats
path: root/ArmPkg/Library/BaseMemoryLibVstm/Arm/CopyMem.S
blob: 0a6e039af9dc1461ac2af2bf1e9b3b7a508d81ff (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
#------------------------------------------------------------------------------
#
# CopyMem() worker for ARM
#
# This file started out as C code that did 64 bit moves if the buffer was
# 32-bit aligned, else it does a byte copy. It also does a byte copy for
# any trailing bytes. Updated to use VLDM/VSTM to do 128 byte copies.
#
# Copyright (c) 2008 - 2010, Apple Inc. All rights reserved.<BR>
# This program and the accompanying materials
# are licensed and made available under the terms and conditions of the BSD License
# which accompanies this distribution.  The full text of the license may be found at
# http://opensource.org/licenses/bsd-license.php
#
# THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
# WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
#
#------------------------------------------------------------------------------

/**
  Copy Length bytes from SourceBuffer to DestinationBuffer. Overlap is OK.

  The copy direction is chosen from the relative position of the buffers:
    - DestinationBuffer == SourceBuffer: nothing is copied.
    - DestinationBuffer below SourceBuffer, or the buffers do not overlap:
      copy forward (ascending addresses).
    - DestinationBuffer above SourceBuffer and overlapping it: copy backward
      (descending addresses), starting one byte past the end of each buffer.

  Wide copies are only used when both buffers are word (4 byte) aligned and
  Length is at least 128 bytes; otherwise every byte is copied individually.
    - Forward wide copies move 128 bytes per iteration through d0-d7, as two
      64 byte VLDM/VSTM bursts. d8-d15 are deliberately not used because the
      ARM procedure call standard requires a callee to preserve them.
    - Backward wide copies move 8 bytes per iteration with LDRD/STRD. The end
      addresses are only word aligned when Length is a multiple of 4, so any
      unaligned tail bytes are copied one at a time first.

  Register usage inside the routine:
    r0      wide-copy enable flag (1 = wide copies allowed, 0 = bytes only)
    r1      SourceBuffer as passed in (not modified)
    r2, r3  scratch / data for LDRD and STRD
    r4      DestinationBuffer as passed in, returned in r0
    r9      destination cursor
    ip      number of bytes still to copy
    lr      source cursor

  @param  DestinationBuffer Target of copy
  @param  SourceBuffer      Place to copy from
  @param  Length            Number of bytes to copy

  @return DestinationBuffer


VOID *
EFIAPI
InternalMemCopyMem (
  OUT     VOID                      *DestinationBuffer,
  IN      CONST VOID                *SourceBuffer,
  IN      UINTN                     Length
  )
**/
.text
.align 2
GCC_ASM_EXPORT(InternalMemCopyMem)

ASM_PFX(InternalMemCopyMem):
  stmfd  sp!, {r4, r9, lr}
  tst  r0, #3                // is DestinationBuffer word aligned?
  mov  r4, r0                // r4 = DestinationBuffer, kept for the return value
  mov  r9, r0                // r9 = destination cursor
  mov  ip, r2                // ip = bytes left to copy
  mov  lr, r1                // lr = source cursor
  movne  r0, #0              // unaligned destination: byte copies only
  bne  L4
  tst  r1, #3
  movne  r3, #0
  moveq  r3, #1              // r3 = 1 when SourceBuffer is word aligned as well
  cmp  r2, #127
  movls  r0, #0              // 127 bytes or fewer: byte copies only
  andhi  r0, r3, #1          // r0 = 1 enables the wide copy loops
L4:
  cmp  r4, r1
  bcc  L26                   // destination below source: copy forward
  bls  L7                    // destination == source: nothing to do
  rsb  r3, r1, r4            // r3 = destination - source
  cmp  ip, r3
  bcc  L26                   // Length < distance, no overlap: copy forward
  cmp  ip, #0
  beq  L7
  add  r9, r4, ip            // overlapping with destination above source:
  add  lr, ip, r1            // copy backward from one past the end of each buffer
  b  L16
L29:
  // Backward wide copy: 8 bytes per iteration. Only entered with ip >= 8 and
  // both cursors word aligned.
  sub  ip, ip, #8
  cmp  ip, #7
  ldrd  r2, [lr, #-8]!
  movls  r0, #0              // fewer than 8 bytes left: finish with byte copies
  cmp  ip, #0
  strd  r2, [r9, #-8]!
  beq  L7
L16:
  cmp  r0, #0
  beq  L17                   // wide copies disabled: copy a single byte
  // Both start addresses are word aligned here, so both end cursors share the
  // same (Length & 3) misalignment and checking one of them is sufficient.
  // LDRD/STRD must not be issued until the cursors are word aligned.
  tst  r9, #3
  beq  L29
L17:
  // Backward byte copy
  ldrb  r3, [lr, #-1]!
  sub  ip, ip, #1
  strb  r3, [r9, #-1]!
  cmp  ip, #0
  bne  L16
  b   L7
L11:
  // Forward byte copy
  ldrb  r3, [lr], #1
  sub  ip, ip, #1
  strb  r3, [r9], #1
L26:
  cmp  ip, #0
  beq  L7
L30:
  cmp  r0, #0
  beq  L11
  // Forward wide copy: 128 bytes per iteration, moved as two 64 byte bursts
  // through d0-d7 so that the callee-saved registers d8-d15 stay untouched.
  // VLDM/VSTM do not modify the condition flags.
  sub  ip, ip, #128
  vldm  lr!, {d0-d7}
  vstm  r9!, {d0-d7}
  vldm  lr!, {d0-d7}
  vstm  r9!, {d0-d7}
  cmp  ip, #127
  movls  r0, #0              // fewer than 128 bytes left: finish with byte copies
  cmp  ip, #0
  bne  L30
L7:
  dsb
  mov  r0, r4                // return DestinationBuffer
  ldmfd  sp!, {r4, r9, pc}