beta-0.89.2
[luatex.git] / source / libs / gmp / gmp-src / mpn / sparc32 / submul_1.asm
blob73f93770067f296dc21fff400f9d8f193d6b4726
1 dnl SPARC mpn_submul_1 -- Multiply a limb vector with a limb and subtract
2 dnl the result from a second limb vector.
4 dnl Copyright 1992-1994, 2000 Free Software Foundation, Inc.
6 dnl This file is part of the GNU MP Library.
7 dnl
8 dnl The GNU MP Library is free software; you can redistribute it and/or modify
9 dnl it under the terms of either:
10 dnl
11 dnl * the GNU Lesser General Public License as published by the Free
12 dnl Software Foundation; either version 3 of the License, or (at your
13 dnl option) any later version.
14 dnl
15 dnl or
16 dnl
17 dnl * the GNU General Public License as published by the Free Software
18 dnl Foundation; either version 2 of the License, or (at your option) any
19 dnl later version.
20 dnl
21 dnl or both in parallel, as here.
22 dnl
23 dnl The GNU MP Library is distributed in the hope that it will be useful, but
24 dnl WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
25 dnl or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
26 dnl for more details.
27 dnl
28 dnl You should have received copies of the GNU General Public License and the
29 dnl GNU Lesser General Public License along with the GNU MP Library. If not,
30 dnl see https://www.gnu.org/licenses/.
33 include(`../config.m4')
35 C INPUT PARAMETERS
36 C res_ptr o0
37 C s1_ptr o1
38 C size o2
39 C s2_limb o3
41 ASM_START()
42 PROLOGUE(mpn_submul_1)
C mpn_submul_1: for each of the SIZE limbs, multiply the S1 limb by s2_limb,
C subtract the low limb of the product from the RES limb and store the
C difference back into RES.  The high limb of each product, plus the carry
C and borrow generated along the way, is accumulated in o0 and carried into
C the next limb; the final o0 is the return value.
C
C Register roles after the setup below:
C   o0  running carry limb, returned to the caller
C   o1  end of the S1 block
C   o2  negative byte index, stepped by 4 until it reaches zero
C   o3  s2_limb
C   o4  end of the RES block (biased by -4 before the loop is entered)
C   o5  limb most recently loaded from S1 or from RES
C
C NOTE(review): SIZE is never tested against zero; the first S1 load is
C unconditional and the loop exits only when o2 reaches zero.  Presumably
C callers always pass SIZE >= 1 -- confirm against the mpn interface.
43 C Make S1_PTR and RES_PTR point at the end of their blocks
44 C and put (- 4 x SIZE) in index/loop counter.
45 sll %o2,2,%o2  C o2 = 4 x SIZE, the block length in bytes
46 add %o0,%o2,%o4 C RES_PTR in o4 since o0 is retval
47 add %o1,%o2,%o1  C o1 = end of the S1 block
48 sub %g0,%o2,%o2  C o2 = -(4 x SIZE), counts up towards zero
C Choose the multiply loop: 12 mulscc steps when s2_limb fits in 12 bits,
C otherwise the full 32 steps.
50 cmp %o3,0xfff
51 bgu L(large)  C unsigned s2_limb > 0xfff: use the 32-step loop
52 nop  C branch delay slot, nothing useful to do
C Small multiplier loop: s2_limb goes in Y as the multiplier and the S1 limb
C is the mulscc operand.
54 ld [%o1+%o2],%o5  C o5 = first S1 limb
55 mov 0,%o0  C carry limb starts at zero
56 b L(0)  C enter the loop at the multiply, skipping the subtract/store
57 add %o4,-4,%o4  C (delay slot) bias RES by -4: the index is advanced before RES is loaded and stored
58 L(loop0):
59 subcc %o5,%g1,%g1  C g1 = RES limb - low product limb, carry flag = borrow
60 ld [%o1+%o2],%o5  C o5 = next S1 limb (loads leave the condition codes alone)
61 addx %o0,%g0,%o0  C fold the borrow into the carry limb
62 st %g1,[%o4+%o2]  C store the finished RES limb
63 L(0): wr %g0,%o3,%y  C Y = s2_limb
64 sra %o5,31,%g2  C g2 = all ones iff the S1 limb has its top bit set
65 and %o3,%g2,%g2  C g2 = s2_limb or 0: the sign-compensation term used below
66 andcc %g1,0,%g1  C g1 = 0 and condition codes cleared before the first step
67 mulscc %g1,%o5,%g1  C 12 multiply steps, one per multiplier bit taken from Y
68 mulscc %g1,%o5,%g1
69 mulscc %g1,%o5,%g1
70 mulscc %g1,%o5,%g1
71 mulscc %g1,%o5,%g1
72 mulscc %g1,%o5,%g1
73 mulscc %g1,%o5,%g1
74 mulscc %g1,%o5,%g1
75 mulscc %g1,%o5,%g1
76 mulscc %g1,%o5,%g1
77 mulscc %g1,%o5,%g1
78 mulscc %g1,%o5,%g1
79 mulscc %g1,0,%g1  C final step with a zero operand
C Only 12 steps were run, so the product is reassembled from g1 and the
C top 12 bits of Y.
80 sra %g1,20,%g4  C g4 = hi limb of the product
81 sll %g1,12,%g1  C make room for the 12 low bits held in Y
82 rd %y,%g3
83 srl %g3,20,%g3  C g3 = top 12 bits of Y moved down to bits 11..0
84 or %g1,%g3,%g1  C g1 = low limb of the product
86 addcc %g1,%o0,%g1  C low limb += incoming carry limb, sets the carry flag
87 addx %g2,%g4,%o0 C add sign-compensation and cy to hi limb
88 addcc %o2,4,%o2 C loop counter
89 bne L(loop0)  C more limbs to do while the index is nonzero
90 ld [%o4+%o2],%o5  C (delay slot) o5 = RES limb for the product just formed
C Loop exit: finish the last limb and return the carry limb in o0.
92 subcc %o5,%g1,%g1  C g1 = RES limb - low product limb, carry flag = borrow
93 addx %o0,%g0,%o0  C fold the final borrow into the return value
94 retl
95 st %g1,[%o4+%o2]  C (delay slot) store the last RES limb
C Large multiplier loop: operand roles are swapped relative to the loop
C above -- the S1 limb goes in Y and s2_limb is the mulscc operand -- and
C all 32 steps are run.
97 L(large):
98 ld [%o1+%o2],%o5  C o5 = first S1 limb
99 mov 0,%o0  C carry limb starts at zero
100 sra %o3,31,%g4 C g4 = mask of ones iff S2_LIMB < 0
101 b L(1)  C enter the loop at the multiply, skipping the subtract/store
102 add %o4,-4,%o4  C (delay slot) bias RES by -4, as in the small loop
103 L(loop):
104 subcc %o5,%g3,%g3  C g3 = RES limb - low product limb, carry flag = borrow
105 ld [%o1+%o2],%o5  C o5 = next S1 limb (loads leave the condition codes alone)
106 addx %o0,%g0,%o0  C fold the borrow into the carry limb
107 st %g3,[%o4+%o2]  C store the finished RES limb
108 L(1): wr %g0,%o5,%y  C Y = S1 limb
109 and %o5,%g4,%g2  C g2 = S1 limb or 0: sign-compensation term for a negative S2_LIMB
110 andcc %g0,%g0,%g1  C g1 = 0 and condition codes cleared before the first step
111 mulscc %g1,%o3,%g1  C 32 multiply steps, one per bit of the S1 limb held in Y
112 mulscc %g1,%o3,%g1
113 mulscc %g1,%o3,%g1
114 mulscc %g1,%o3,%g1
115 mulscc %g1,%o3,%g1
116 mulscc %g1,%o3,%g1
117 mulscc %g1,%o3,%g1
118 mulscc %g1,%o3,%g1
119 mulscc %g1,%o3,%g1
120 mulscc %g1,%o3,%g1
121 mulscc %g1,%o3,%g1
122 mulscc %g1,%o3,%g1
123 mulscc %g1,%o3,%g1
124 mulscc %g1,%o3,%g1
125 mulscc %g1,%o3,%g1
126 mulscc %g1,%o3,%g1
127 mulscc %g1,%o3,%g1
128 mulscc %g1,%o3,%g1
129 mulscc %g1,%o3,%g1
130 mulscc %g1,%o3,%g1
131 mulscc %g1,%o3,%g1
132 mulscc %g1,%o3,%g1
133 mulscc %g1,%o3,%g1
134 mulscc %g1,%o3,%g1
135 mulscc %g1,%o3,%g1
136 mulscc %g1,%o3,%g1
137 mulscc %g1,%o3,%g1
138 mulscc %g1,%o3,%g1
139 mulscc %g1,%o3,%g1
140 mulscc %g1,%o3,%g1
141 mulscc %g1,%o3,%g1
142 mulscc %g1,%o3,%g1
143 mulscc %g1,%g0,%g1  C final step with a zero operand; g1 is used as the hi limb below
144 rd %y,%g3  C g3 = low limb of the product
145 addcc %g3,%o0,%g3  C low limb += incoming carry limb, sets the carry flag
146 addx %g2,%g1,%o0  C new carry limb = sign-compensation + hi limb + carry
147 addcc %o2,4,%o2  C advance the index; the result is zero after the last limb
148 bne L(loop)  C more limbs to do while the index is nonzero
149 ld [%o4+%o2],%o5  C (delay slot) o5 = RES limb for the product just formed
C Loop exit: finish the last limb and return the carry limb in o0.
151 subcc %o5,%g3,%g3  C g3 = RES limb - low product limb, carry flag = borrow
152 addx %o0,%g0,%o0  C fold the final borrow into the return value
153 retl
154 st %g3,[%o4+%o2]  C (delay slot) store the last RES limb
155 EPILOGUE(mpn_submul_1)