[memcpy.S]: Fix forward overlap case
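Fix the forward-overlap case so that it copies the correct set of bytes.
The earlier code missed one byte at the start and copied one extra byte
at the end. After advancing both pointers by the length, subtract one
from each before entering the bytewise reverse copy.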
Change-Id: Icbc1b35e597aa45a9437444782294eb222145912
diff --git a/lib/libc/string/arch/arm/memcpy.S b/lib/libc/string/arch/arm/memcpy.S
index 3b7816d..925f46e 100644
--- a/lib/libc/string/arch/arm/memcpy.S
+++ b/lib/libc/string/arch/arm/memcpy.S
@@ -165,6 +165,8 @@
// do a bytewise reverse copy for now
add r1, r1, r2
add r0, r0, r2
+ sub r1, r1, #1
+ sub r0, r0, #1
.L_bytewisereverse:
// simple bytewise reverse copy