xref: /OK3568_Linux_fs/kernel/arch/hexagon/lib/memcpy_likely_aligned.S (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun/* SPDX-License-Identifier: GPL-2.0-only */
2*4882a593Smuzhiyun/*
3*4882a593Smuzhiyun * Copyright (c) 2021, The Linux Foundation. All rights reserved.
4*4882a593Smuzhiyun */
5*4882a593Smuzhiyun
6*4882a593Smuzhiyun#include <linux/linkage.h>
7*4882a593Smuzhiyun
/*
 * Fast path for short copies, done entirely with 64-bit (memd) accesses.
 *
 * Registers as used below:
 *   r0 - base address of every store; never written here
 *   r1 - base address of every load; never written here
 *   r2 - byte count; only compared (unsigned) against 32, 40, 48, 56, 64
 * (Presumably memcpy's dst, src, n: all three are handed to memcpy
 * unchanged on the fallback path - verify against the callers.)
 *
 * If r0 or r1 has any of its low three bits set, or if r2 > 64, the
 * routine jumps to memcpy without having stored anything.  Otherwise
 * bytes 0..31 are copied unconditionally, and each further 8-byte chunk
 * (at offsets 32, 40, 48, 56) is copied only if r2 is greater than that
 * offset.  Nothing here checks that r2 >= 32 or that r2 is a multiple of
 * 8; going by the function name, callers are expected to guarantee both.
 *
 * Scratch: r4-r15 and p0-p2 may be overwritten.
 */
8*4882a593SmuzhiyunSYM_FUNC_START(__hexagon_memcpy_likely_aligned_min32bytes_mult8bytes)
        /*
         * p0 is written twice in this packet; the code depends on the two
         * bitsclr results being combined so that p0 is true only when both
         * r1 and r0 have bits 2:0 clear.
         * NOTE(review): confirm the same-packet predicate AND rule in the
         * Hexagon Programmer's Reference Manual.
         * The .new loads use that freshly computed p0 and fetch source
         * bytes 0..15.
         */
9*4882a593Smuzhiyun        {
10*4882a593Smuzhiyun                p0 = bitsclr(r1,#7)
11*4882a593Smuzhiyun                p0 = bitsclr(r0,#7)
12*4882a593Smuzhiyun                if (p0.new) r5:4 = memd(r1)
13*4882a593Smuzhiyun                if (p0.new) r7:6 = memd(r1+#8)
14*4882a593Smuzhiyun        }
        /*
         * Plain p0 (no .new) is still the alignment result from the
         * previous packet: bail out to memcpy if unaligned, otherwise
         * fetch source bytes 16..31.  p0 is then recomputed as r2 > 64
         * for use by the next packet.
         */
15*4882a593Smuzhiyun        {
16*4882a593Smuzhiyun                if (!p0) jump:nt .Lmemcpy_call
17*4882a593Smuzhiyun                if (p0) r9:8 = memd(r1+#16)
18*4882a593Smuzhiyun                if (p0) r11:10 = memd(r1+#24)
19*4882a593Smuzhiyun                p0 = cmp.gtu(r2,#64)
20*4882a593Smuzhiyun        }
        /*
         * r2 > 64: too long for this routine, let memcpy do the whole
         * copy (nothing has been stored yet).  Otherwise store bytes
         * 0..15.  p0 becomes r2 > 32 for the following packets.
         */
21*4882a593Smuzhiyun        {
22*4882a593Smuzhiyun                if (p0) jump:nt .Lmemcpy_call
23*4882a593Smuzhiyun                if (!p0) memd(r0) = r5:4
24*4882a593Smuzhiyun                if (!p0) memd(r0+#8) = r7:6
25*4882a593Smuzhiyun                p0 = cmp.gtu(r2,#32)
26*4882a593Smuzhiyun        }
        /*
         * p1 = r2 > 40, p2 = r2 > 48.  Fetch bytes 32..39 if r2 > 32 and
         * bytes 40..47 if r2 > 40 (p1.new: the p1 computed in this same
         * packet).
         */
27*4882a593Smuzhiyun        {
28*4882a593Smuzhiyun                p1 = cmp.gtu(r2,#40)
29*4882a593Smuzhiyun                p2 = cmp.gtu(r2,#48)
30*4882a593Smuzhiyun                if (p0) r13:12 = memd(r1+#32)
31*4882a593Smuzhiyun                if (p1.new) r15:14 = memd(r1+#40)
32*4882a593Smuzhiyun        }
        /* Bytes 16..31 are stored with no length check. */
33*4882a593Smuzhiyun        {
34*4882a593Smuzhiyun                memd(r0+#16) = r9:8
35*4882a593Smuzhiyun                memd(r0+#24) = r11:10
36*4882a593Smuzhiyun        }
        /*
         * Store the optional chunks at offsets 32 and 40, then return
         * through r31 when r2 <= 48 (hinted as the likely outcome by :t).
         */
37*4882a593Smuzhiyun        {
38*4882a593Smuzhiyun                if (p0) memd(r0+#32) = r13:12
39*4882a593Smuzhiyun                if (p1) memd(r0+#40) = r15:14
40*4882a593Smuzhiyun                if (!p2) jumpr:t r31
41*4882a593Smuzhiyun        }
        /*
         * Only reached when r2 > 48: fetch bytes 48..55 unconditionally
         * and bytes 56..63 only if r2 > 56.  r5:4 and r7:6 are reused;
         * their earlier contents were already stored.
         */
42*4882a593Smuzhiyun        {
43*4882a593Smuzhiyun                p0 = cmp.gtu(r2,#56)
44*4882a593Smuzhiyun                r5:4 = memd(r1+#48)
45*4882a593Smuzhiyun                if (p0.new) r7:6 = memd(r1+#56)
46*4882a593Smuzhiyun        }
        /* Store the last one or two chunks and return through r31. */
47*4882a593Smuzhiyun        {
48*4882a593Smuzhiyun                memd(r0+#48) = r5:4
49*4882a593Smuzhiyun                if (p0) memd(r0+#56) = r7:6
50*4882a593Smuzhiyun                jumpr r31
51*4882a593Smuzhiyun        }
52*4882a593Smuzhiyun
        /*
         * Fallback: plain jump (not a call) to memcpy.  r0, r1, r2 and
         * r31 have not been modified on any path that reaches here.
         */
53*4882a593Smuzhiyun.Lmemcpy_call:
54*4882a593Smuzhiyun        jump memcpy
55*4882a593Smuzhiyun
56*4882a593SmuzhiyunSYM_FUNC_END(__hexagon_memcpy_likely_aligned_min32bytes_mult8bytes)
57