xref: /OK3568_Linux_fs/kernel/arch/hexagon/lib/divsi3.S (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun/* SPDX-License-Identifier: GPL-2.0-only */
2*4882a593Smuzhiyun/*
3*4882a593Smuzhiyun * Copyright (c) 2021, The Linux Foundation. All rights reserved.
4*4882a593Smuzhiyun */
5*4882a593Smuzhiyun
6*4882a593Smuzhiyun#include <linux/linkage.h>
7*4882a593Smuzhiyun
/*
 * __hexagon_divsi3 - signed 32-bit division by shift-and-subtract.
 *
 * In:   r0 = dividend, r1 = divisor (signed words).
 * Out:  r0 = quotient of the two magnitudes, negated when the operand
 *       signs differ.
 * Returns with jumpr r31.
 *
 * Registers written: r0-r7, p0, p1, p3, plus hardware loop 0 state.
 * No loads or stores are issued.
 *
 * Register roles once the main path is entered:
 *   r2      running remainder (starts as |dividend|)
 *   r3      |divisor|
 *   r5:r4   quotient bit : divisor, both shifted to the same position
 *   r7:r6   the same pair one bit position lower
 *   r1:r0   zero : quotient accumulator
 *   p3      set when the result must be negated
 *
 * Instructions inside one { } packet all read the register values from
 * before the packet; only ".new" predicate uses see the value produced
 * in the same packet.
 *
 * NOTE(review): there is no explicit test for a zero divisor in this
 * routine; confirm what callers expect in that case.
 */
8*4882a593SmuzhiyunSYM_FUNC_START(__hexagon_divsi3)
        /*
         * p0 = (dividend >= 0), p1 = (divisor >= 0);
         * r2 = |r0| (dividend), r3 = |r1| (divisor).
         */
9*4882a593Smuzhiyun        {
10*4882a593Smuzhiyun                p0 = cmp.gt(r0,#-1)
11*4882a593Smuzhiyun                p1 = cmp.gt(r1,#-1)
12*4882a593Smuzhiyun                r3:2 = vabsw(r1:0)
13*4882a593Smuzhiyun        }
        /*
         * p3 = operand signs differ, so the quotient is negative.
         * r4 = |dividend| - |divisor|, r6 = leading zeros of |dividend|.
         * p0 = |divisor| > |dividend| (unsigned): the quotient is 0.
         */
14*4882a593Smuzhiyun        {
15*4882a593Smuzhiyun                p3 = xor(p0,p1)
16*4882a593Smuzhiyun                r4 = sub(r2,r3)
17*4882a593Smuzhiyun                r6 = cl0(r2)
18*4882a593Smuzhiyun                p0 = cmp.gtu(r3,r2)
19*4882a593Smuzhiyun        }
        /*
         * r0 = -1 or +1 according to p3: the answer if the magnitude
         * quotient turns out to be exactly 1.
         * r7 = leading zeros of |divisor|.
         * p1 = |divisor| > (|dividend| - |divisor|), i.e. the divisor
         * does not fit a second time.
         */
20*4882a593Smuzhiyun        {
21*4882a593Smuzhiyun                r0 = mux(p3,#-1,#1)
22*4882a593Smuzhiyun                r7 = cl0(r3)
23*4882a593Smuzhiyun                p1 = cmp.gtu(r3,r4)
24*4882a593Smuzhiyun        }
        /*
         * Early exit: r0 becomes 0 when p0 was set, otherwise it keeps
         * the +/-1 chosen above; return if either p0 or p1 held.
         * On the fall-through path r6 = cl0(|divisor|) - cl0(|dividend|),
         * the left shift that lines the divisor up with the dividend.
         */
25*4882a593Smuzhiyun        {
26*4882a593Smuzhiyun                r0 = mux(p0,#0,r0)
27*4882a593Smuzhiyun                p0 = or(p0,p1)
28*4882a593Smuzhiyun                if (p0.new) jumpr:nt r31
29*4882a593Smuzhiyun                r6 = sub(r7,r6)
30*4882a593Smuzhiyun        }
        /*
         * r7 = shift amount; r5:r4 = 1 : |divisor|.
         * r6 = 1 + (shift >> 1), the loop trip count (the loop handles
         * two bit positions per trip).
         * p0 = shift > 4, evaluated on the pre-packet r6 (the shift).
         */
31*4882a593Smuzhiyun        {
32*4882a593Smuzhiyun                r7 = r6
33*4882a593Smuzhiyun                r5:4 = combine(#1,r3)
34*4882a593Smuzhiyun                r6 = add(#1,lsr(r6,#1))
35*4882a593Smuzhiyun                p0 = cmp.gtu(r6,#4)
36*4882a593Smuzhiyun        }
        /*
         * r5 = 1 << shift (quotient bit), r4 = |divisor| << shift.
         * When shift <= 4 the trip count is forced to 3, which is never
         * below the 1 + (shift >> 1) computed above.
         */
37*4882a593Smuzhiyun        {
38*4882a593Smuzhiyun                r5:4 = vaslw(r5:4,r7)
39*4882a593Smuzhiyun                if (!p0) r6 = #3
40*4882a593Smuzhiyun        }
        /*
         * Start hardware loop 0 at label 1 with r6 trips (loop0 reads r6
         * before this packet overwrites it).
         * r7:r6 = r5:r4 >> 1: the bit/divisor pair one position lower.
         * r1:r0 = 0: r0 accumulates the quotient, r1 stays zero for the
         * final negation.
         */
41*4882a593Smuzhiyun        {
42*4882a593Smuzhiyun                loop0(1f,r6)
43*4882a593Smuzhiyun                r7:6 = vlsrw(r5:4,#1)
44*4882a593Smuzhiyun                r1:0 = #0
45*4882a593Smuzhiyun        }
        /*
         * Loop body: two shift-and-subtract steps per trip.
         * In each packet p0 = (shifted divisor > remainder); when that is
         * false the quotient bit is added to r0 and the shifted divisor
         * is subtracted from r2. Both use the pre-packet pair, while the
         * pair itself moves down two bit positions for the next trip.
         * The first packet works on r5:r4, the second on r7:r6.
         */
46*4882a593Smuzhiyun        .falign
47*4882a593Smuzhiyun1:
48*4882a593Smuzhiyun        {
49*4882a593Smuzhiyun                r5:4 = vlsrw(r5:4,#2)
50*4882a593Smuzhiyun                if (!p0.new) r0 = add(r0,r5)
51*4882a593Smuzhiyun                if (!p0.new) r2 = sub(r2,r4)
52*4882a593Smuzhiyun                p0 = cmp.gtu(r4,r2)
53*4882a593Smuzhiyun        }
54*4882a593Smuzhiyun        {
55*4882a593Smuzhiyun                r7:6 = vlsrw(r7:6,#2)
56*4882a593Smuzhiyun                if (!p0.new) r0 = add(r0,r7)
57*4882a593Smuzhiyun                if (!p0.new) r2 = sub(r2,r6)
58*4882a593Smuzhiyun                p0 = cmp.gtu(r6,r2)
59*4882a593Smuzhiyun        }:endloop0
        /*
         * Adds r7 to the quotient once more when the last loop compare
         * left p0 clear.
         * NOTE(review): r7 has already been shifted right by 2 in the
         * final loop packet; confirm what value this add contributes.
         */
60*4882a593Smuzhiyun        {
61*4882a593Smuzhiyun                if (!p0) r0 = add(r0,r7)
62*4882a593Smuzhiyun        }
        /*
         * Apply the sign: r1 is zero here, so r0 = r1 - r0 negates the
         * quotient when p3 is set. Then return.
         */
63*4882a593Smuzhiyun        {
64*4882a593Smuzhiyun                if (p3) r0 = sub(r1,r0)
65*4882a593Smuzhiyun                jumpr r31
66*4882a593Smuzhiyun        }
67*4882a593SmuzhiyunSYM_FUNC_END(__hexagon_divsi3)
68