beta-0.89.2
[luatex.git] / source / libs / gmp / gmp-src / mpn / pa64 / lshift.asm
blobc0fc2921c1654a7b9960f92719e4787f64176326
1 dnl HP-PA 2.0 mpn_lshift -- Left shift.
3 dnl Copyright 1997, 2000, 2002, 2003 Free Software Foundation, Inc.
5 dnl This file is part of the GNU MP Library.
6 dnl
7 dnl The GNU MP Library is free software; you can redistribute it and/or modify
8 dnl it under the terms of either:
9 dnl
10 dnl * the GNU Lesser General Public License as published by the Free
11 dnl Software Foundation; either version 3 of the License, or (at your
12 dnl option) any later version.
13 dnl
14 dnl or
15 dnl
16 dnl * the GNU General Public License as published by the Free Software
17 dnl Foundation; either version 2 of the License, or (at your option) any
18 dnl later version.
19 dnl
20 dnl or both in parallel, as here.
21 dnl
22 dnl The GNU MP Library is distributed in the hope that it will be useful, but
23 dnl WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
24 dnl or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
25 dnl for more details.
26 dnl
27 dnl You should have received copies of the GNU General Public License and the
28 dnl GNU Lesser General Public License along with the GNU MP Library. If not,
29 dnl see https://www.gnu.org/licenses/.
32 dnl This runs at 1.5 cycles/limb on PA8000 and 1.0 cycles/limb on PA8500.
34 include(`../config.m4')
36 dnl INPUT PARAMETERS
37 define(`rp',`%r26')
38 define(`up',`%r25')
39 define(`n',`%r24')
40 define(`cnt',`%r23')
42 ifdef(`HAVE_ABI_2_0w',
43 ` .level 2.0w
44 ',` .level 2.0
46 PROLOGUE(mpn_lshift)
47 shladd n, 3, up, up
48 shladd n, 3, rp, rp
49 subi 64, cnt, cnt
50 mtsar cnt
51 ldd -8(up), %r21
52 addib,= -1, n, L(end)
53 shrpd %r0, %r21, %sar, %r29 C compute carry out limb
54 depw,z n, 31, 3, %r28 C r28 = (size & 7)
55 sub %r0, n, %r22
56 depw,z %r22, 28, 3, %r22 C r22 = 8 * (-size & 7)
57 add up, %r22, up C offset up
58 blr %r28, %r0 C branch into jump table
59 add rp, %r22, rp C offset rp
60 b L(0)
61 nop
62 b L(1)
63 copy %r21, %r20
64 b L(2)
65 nop
66 b L(3)
67 copy %r21, %r20
68 b L(4)
69 nop
70 b L(5)
71 copy %r21, %r20
72 b L(6)
73 nop
74 b L(7)
75 copy %r21, %r20
77 LDEF(loop)
78 LDEF(0) ldd -16(up), %r20
79 shrpd %r21, %r20, %sar, %r21
80 std %r21, -8(rp)
81 LDEF(7) ldd -24(up), %r21
82 shrpd %r20, %r21, %sar, %r20
83 std %r20, -16(rp)
84 LDEF(6) ldd -32(up), %r20
85 shrpd %r21, %r20, %sar, %r21
86 std %r21, -24(rp)
87 LDEF(5) ldd -40(up), %r21
88 shrpd %r20, %r21, %sar, %r20
89 std %r20, -32(rp)
90 LDEF(4) ldd -48(up), %r20
91 shrpd %r21, %r20, %sar, %r21
92 std %r21, -40(rp)
93 LDEF(3) ldd -56(up), %r21
94 shrpd %r20, %r21, %sar, %r20
95 std %r20, -48(rp)
96 LDEF(2) ldd -64(up), %r20
97 shrpd %r21, %r20, %sar, %r21
98 std %r21, -56(rp)
99 LDEF(1) ldd -72(up), %r21
100 ldo -64(up), up
101 shrpd %r20, %r21, %sar, %r20
102 std %r20, -64(rp)
103 addib,> -8, n, L(loop)
104 ldo -64(rp), rp
106 LDEF(end)
107 shrpd %r21, %r0, %sar, %r21
108 std %r21, -8(rp)
109 bve (%r2)
110 ifdef(`HAVE_ABI_2_0w',
111 ` copy %r29,%r28
112 ',` extrd,u %r29, 31, 32, %r28
114 EPILOGUE(mpn_lshift)