summaryrefslogtreecommitdiff
path: root/libc/string/bfin/memcpy.S
blob: ae40cb244f9cc0fa72ae170c41b90b65c6e0372b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
/* memcpy.S
 * Copyright (C) 2003-2007 Analog Devices Inc., All Rights Reserved.
 *
 * This file is subject to the terms and conditions of the GNU Library General
 * Public License. See the file "COPYING.LIB" in the main directory of this
 * archive for more details.
 *
 * Non-LGPL License also available as part of VisualDSP++
 * http://www.analog.com/processors/resources/crosscore/visualDspDevSoftware.html
 */

#include <sysdep.h>

/* void *memcpy(void *dest, const void *src, size_t n);
 * R0 = To Address (dest) (leave unchanged to form result)
 * R1 = From Address (src)
 * R2 = count
 *
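 * Note: Favours word alignment -- the word-at-a-time path is taken only when
 * both addresses are 4-byte aligned and count > 7; otherwise the copy is done
 * one byte at a time.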
 */

.text

.align 2

/* We have to bypass the libc-symbols.h machinery to make sure we get
 * a weak symbol for memcpy (some crummy gcc tests want to redefine it).
 */
/* ___GI_memcpy -- copy R2 bytes from the address in R1 to the address in R0.
 *
 * In:   R0 = dest, R1 = src, R2 = count (bytes)
 * Out:  R0 = dest (this routine never writes R0)
 * Uses: R1, R2, R3, P0, P1, P2, I0, LC0 (via LSETUP), CC;
 *       P3 is pushed on entry and popped before each RTS.
 *
 * Strategy:
 *   - count <= 7: byte loop (or straight to the exit when count == 0).
 *   - count >= 8 and (src | dest) has either of its low two bits set:
 *     byte loop over the whole count.
 *   - otherwise: copy count/4 words with a software-pipelined loop (the load
 *     of word k+1 is paired with the store of word k), then copy the
 *     remaining count & 3 bytes, if any, with the byte loop.
 *
 * The symbol is defined as the hidden ___GI_memcpy; the public name _memcpy
 * is a weak alias set up at the end of this block.
 */
.global ___GI_memcpy
.type ___GI_memcpy, STT_FUNC
___GI_memcpy:
	/* Save P3; it is used as the byte-loop source pointer below. */
	[--SP] = P3;
	P0 = R0;              /* P0 = To address */
	P3 = R1;              /* P3 = From Address */
	P2 = R2;              /* P2 = count */
	/* Unsigned compare: 7 bytes or fewer go straight to the byte path. */
	CC = R2 <= 7(IU);
	IF CC JUMP .Ltoo_small;
	/* I0 = From address, used as the load pointer of the word loop. */
	I0 = R1;
	R3 = R1 | R0;         /* OR addresses together */
	R3 <<= 30;            /* check bottom two bits */
	CC =  AZ;             /* AZ set if zero. */
	IF !CC JUMP .Lbytes;  /* Jump if addrs not aligned. */
	P1 = P2 >> 2;         /* count = n/4 */
	/* One fewer loop iteration: the first load is done before the loop
	 * and the last store after it.  P1 >= 1 here because n >= 8.
	 */
	P1 += -1;
	R3 =  3;
	R2 = R2 & R3;         /* remainder */
	P2 = R2;              /* set remainder */
	/* Prime the pipeline: load the first word. */
	R1 = [I0++];
	/* NOTE(review): __WORKAROUND_AVOID_DAG1 is defined outside this file;
	 * presumably it selects a variant for a hardware erratum -- confirm.
	 * Both variants store the word held in R1 and then load the next one;
	 * the first does so in a single multi-issue instruction, the second
	 * in two separate instructions.
	 */
#if !defined(__WORKAROUND_AVOID_DAG1)
	LSETUP (.Lquad_loop, .Lquad_loop) LC0=P1;
.Lquad_loop:	MNOP || [P0++] = R1 || R1 = [I0++];
#else
	LSETUP (.Lquad_loop_s, .Lquad_loop_e) LC0=P1;
.Lquad_loop_s:	[P0++] = R1;
.Lquad_loop_e:	R1 = [I0++];
#endif
	/* Drain the pipeline: store the last word that was loaded. */
	[P0++] = R1;

	CC = P2 == 0;         /* any remaining bytes? */
	P3 = I0;              /* Amend P3 for remaining copy */
	IF !CC JUMP .Lbytes;
	/* No tail bytes: restore P3 and return (R0 still holds dest). */
	P3 = [SP++];
	RTS;

.Ltoo_small:
	CC = P2 == 0;          /* Check zero count */
	IF CC JUMP .Lfinished; /* very unlikely */

	/* Byte loop: copy P2 bytes from [P3] to [P0].  P2 is non-zero on every
	 * path that reaches this label (full count >= 8, a non-zero remainder,
	 * or a small count that passed the zero check above).
	 */
.Lbytes:
	LSETUP (.Lbyte_loop_s, .Lbyte_loop_e) LC0=P2;
.Lbyte_loop_s:	R1 = B[P3++](Z);
.Lbyte_loop_e:	B[P0++] = R1;

.Lfinished:
	/* Restore P3 and return (R0 still holds dest). */
	P3 = [SP++];

	RTS;
.size ___GI_memcpy,.-___GI_memcpy

/* Keep the internal name hidden and export _memcpy as a weak alias of it. */
.hidden ___GI_memcpy
.weak _memcpy
.set _memcpy,___GI_memcpy