/* SPDX-License-Identifier: GPL-2.0 */
// Copyright (C) 2018 Hangzhou C-SKY Microsystems co.,ltd.

#include <linux/linkage.h>
#include "sysdep.h"

/*
 * void *memmove(void *dest, const void *src, size_t len)
 *
 * In:   r0 = dest, r1 = src, r2 = len
 * Out:  r0 = dest (the value passed in)
 * Uses: r3, r12, r13, r18, r20-r23 (r20-r23 only when not CK860) and the
 *       condition bit.
 *
 * When the unsigned distance (dest - src) is at least len, the routine
 * branches to memcpy.  Otherwise the regions overlap with dest at or above
 * src, and the copy runs backwards from the end of both buffers:
 *   1. single bytes until the end of dest is 4-byte aligned,
 *   2. 16-byte chunks,
 *   3. remaining whole words,
 *   4. remaining bytes.
 *
 * LABLE_ALIGN, PRE_BNEZAD and BNEZAD are macros from sysdep.h (not shown
 * in this file).  They are used here as "align loop head" and as a
 * decrement / branch-if-nonzero pair on the loop counter.
 */
	.weak memmove
ENTRY(__memmove)
ENTRY(memmove)
	/*
	 * r3 = dest - src.  If that is >= len as an unsigned value (dest
	 * below src wraps around to a large distance), tail-branch to memcpy.
	 */
	subu	r3, r0, r1
	cmphs	r3, r2
	bt	memcpy

	/* 0 <= dest - src < len: copy backwards, starting at the end.  */
	mov	r12, r0			/* keep dest for the return value */
	addu	r0, r0, r2		/* r0 = dest + len */
	addu	r1, r1, r2		/* r1 = src + len */

	/* Test if len less than 4 bytes.  */
	cmplti	r2, 4
	bt	.L_copy_by_byte

	/* r13 = low two bits of the dest end address.  */
	andi	r13, r0, 3
	/* Test if dest is not 4 bytes aligned.  */
	bnez	r13, .L_dest_not_aligned
	/* Hardware can handle unaligned access directly.  */
.L_dest_aligned:
	/* r18 = len >> 4: number of 16-byte chunks to copy.  */
	zext	r18, r2, 31, 4
	/* Test if len less than 16 bytes.  */
	bez	r18, .L_len_less_16bytes

	/* len >= 16 bytes */
	LABLE_ALIGN
.L_len_larger_16bytes:
	/* Step both pointers down one chunk, then copy that chunk.  */
	subi	r1, 16
	subi	r0, 16
#if defined(__CK860__)
	/* Load/store one word at a time, highest word first.  */
	ldw	r3, (r1, 12)
	stw	r3, (r0, 12)
	ldw	r3, (r1, 8)
	stw	r3, (r0, 8)
	ldw	r3, (r1, 4)
	stw	r3, (r0, 4)
	ldw	r3, (r1, 0)
	stw	r3, (r0, 0)
	/*
	 * No PRE_BNEZAD on this path.
	 * NOTE(review): presumably BNEZAD decrements r18 itself on CK860;
	 * confirm against sysdep.h.
	 */
#else
	/* Load all four words before storing any of them.  */
	ldw	r20, (r1, 0)
	ldw	r21, (r1, 4)
	ldw	r22, (r1, 8)
	ldw	r23, (r1, 12)
	stw	r20, (r0, 0)
	stw	r21, (r0, 4)
	stw	r22, (r0, 8)
	stw	r23, (r0, 12)
	PRE_BNEZAD (r18)
#endif
	BNEZAD (r18, .L_len_larger_16bytes)

.L_len_less_16bytes:
	/* r18 = bits 3:2 of len: whole words left after the 16-byte chunks.  */
	zext	r18, r2, 3, 2
	bez	r18, .L_copy_by_byte
.L_len_less_16bytes_loop:
	subi	r1, 4
	subi	r0, 4
	ldw	r3, (r1, 0)
	PRE_BNEZAD (r18)
	stw	r3, (r0, 0)
	BNEZAD (r18, .L_len_less_16bytes_loop)

	/* Copy the trailing (len & 3) bytes, if any.  */
.L_copy_by_byte:
	zext	r18, r2, 1, 0
	bez	r18, .L_return
.L_copy_by_byte_loop:
	subi	r1, 1
	subi	r0, 1
	ldb	r3, (r1, 0)
	PRE_BNEZAD (r18)
	stb	r3, (r0, 0)
	BNEZAD (r18, .L_copy_by_byte_loop)

.L_return:
	/* Return the original dest pointer.  */
	mov	r0, r12
	rts

	/*
	 * The end of dest is not 4-byte aligned: copy r13 single bytes so
	 * that it becomes aligned, and take them off the remaining length.
	 */
.L_dest_not_aligned:
	sub	r2, r13
.L_dest_not_aligned_loop:
	subi	r1, 1
	subi	r0, 1
	/* Makes the dest align.  */
	ldb	r3, (r1, 0)
	PRE_BNEZAD (r13)
	stb	r3, (r0, 0)
	BNEZAD (r13, .L_dest_not_aligned_loop)
	/* Fewer than 4 bytes left: finish with the byte loop.  */
	cmplti	r2, 4
	bt	.L_copy_by_byte
	/* dest is aligned now; continue with the word copies.  */
	jbr	.L_dest_aligned
ENDPROC(memmove)
ENDPROC(__memmove)