]>
Commit | Line | Data |
---|---|---|
28f540f4 RM |
1 | ! SPARC __mpn_addmul_1 -- Multiply a limb vector with a limb and add |
2 | ! the result to a second limb vector. | |
f41c8091 | 3 | ! |
04277e02 | 4 | ! Copyright (C) 1992-2019 Free Software Foundation, Inc. |
f41c8091 | 5 | ! |
28f540f4 | 6 | ! This file is part of the GNU MP Library. |
f41c8091 | 7 | ! |
28f540f4 | 8 | ! The GNU MP Library is free software; you can redistribute it and/or modify |
6d84f89a AJ |
9 | ! it under the terms of the GNU Lesser General Public License as published by |
10 | ! the Free Software Foundation; either version 2.1 of the License, or (at your | |
28f540f4 | 11 | ! option) any later version. |
f41c8091 | 12 | ! |
28f540f4 RM |
13 | ! The GNU MP Library is distributed in the hope that it will be useful, but |
14 | ! WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY | |
6d84f89a | 15 | ! or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public |
28f540f4 | 16 | ! License for more details. |
f41c8091 | 17 | ! |
6d84f89a | 18 | ! You should have received a copy of the GNU Lesser General Public License |
59ba27a6 | 19 | ! along with the GNU MP Library; see the file COPYING.LIB. If not, |
5a82c748 | 20 | ! see <https://www.gnu.org/licenses/>. |
28f540f4 RM |
21 | |
22 | ||
23 | ! INPUT PARAMETERS | |
f41c8091 UD |
24 | ! RES_PTR o0 |
25 | ! S1_PTR o1 | |
26 | ! SIZE o2 | |
27 | ! S2_LIMB o3 | |
28f540f4 | 28 | |
f41c8091 | 29 | #include <sysdep.h> |
28f540f4 | 30 | |
f41c8091 | 31 | ENTRY(__mpn_addmul_1) |
28f540f4 RM |
32 | ! Make S1_PTR and RES_PTR point at the end of their blocks |
33 | ! and put (- 4 x SIZE) in index/loop counter. | |
34 | sll %o2,2,%o2 | |
35 | add %o0,%o2,%o4 ! RES_PTR in o4 since o0 is retval | |
36 | add %o1,%o2,%o1 | |
37 | sub %g0,%o2,%o2 | |
38 | ||
39 | cmp %o3,0xfff | |
f41c8091 | 40 | bgu LOC(large) |
28f540f4 RM |
41 | nop |
42 | ||
43 | ld [%o1+%o2],%o5 | |
44 | mov 0,%o0 | |
f41c8091 | 45 | b LOC(0) |
28f540f4 | 46 | add %o4,-4,%o4 |
f41c8091 | 47 | LOC(loop0): |
28f540f4 RM |
48 | addcc %o5,%g1,%g1 |
49 | ld [%o1+%o2],%o5 | |
50 | addx %o0,%g0,%o0 | |
51 | st %g1,[%o4+%o2] | |
f41c8091 | 52 | LOC(0): wr %g0,%o3,%y |
28f540f4 RM |
53 | sra %o5,31,%g2 |
54 | and %o3,%g2,%g2 | |
55 | andcc %g1,0,%g1 | |
56 | mulscc %g1,%o5,%g1 | |
57 | mulscc %g1,%o5,%g1 | |
58 | mulscc %g1,%o5,%g1 | |
59 | mulscc %g1,%o5,%g1 | |
60 | mulscc %g1,%o5,%g1 | |
61 | mulscc %g1,%o5,%g1 | |
62 | mulscc %g1,%o5,%g1 | |
63 | mulscc %g1,%o5,%g1 | |
64 | mulscc %g1,%o5,%g1 | |
65 | mulscc %g1,%o5,%g1 | |
66 | mulscc %g1,%o5,%g1 | |
67 | mulscc %g1,%o5,%g1 | |
68 | mulscc %g1,0,%g1 | |
69 | sra %g1,20,%g4 | |
70 | sll %g1,12,%g1 | |
71 | rd %y,%g3 | |
72 | srl %g3,20,%g3 | |
73 | or %g1,%g3,%g1 | |
74 | ||
75 | addcc %g1,%o0,%g1 | |
76 | addx %g2,%g4,%o0 ! add sign-compensation and cy to hi limb | |
77 | addcc %o2,4,%o2 ! loop counter | |
f41c8091 | 78 | bne LOC(loop0) |
28f540f4 RM |
79 | ld [%o4+%o2],%o5 |
80 | ||
81 | addcc %o5,%g1,%g1 | |
82 | addx %o0,%g0,%o0 | |
83 | retl | |
84 | st %g1,[%o4+%o2] | |
85 | ||
86 | ||
f41c8091 UD |
87 | LOC(large): |
88 | ld [%o1+%o2],%o5 | |
28f540f4 RM |
89 | mov 0,%o0 |
90 | sra %o3,31,%g4 ! g4 = mask of ones iff S2_LIMB < 0 | |
f41c8091 | 91 | b LOC(1) |
28f540f4 | 92 | add %o4,-4,%o4 |
f41c8091 | 93 | LOC(loop): |
28f540f4 RM |
94 | addcc %o5,%g3,%g3 |
95 | ld [%o1+%o2],%o5 | |
96 | addx %o0,%g0,%o0 | |
97 | st %g3,[%o4+%o2] | |
f41c8091 | 98 | LOC(1): wr %g0,%o5,%y |
28f540f4 RM |
99 | and %o5,%g4,%g2 |
100 | andcc %g0,%g0,%g1 | |
101 | mulscc %g1,%o3,%g1 | |
102 | mulscc %g1,%o3,%g1 | |
103 | mulscc %g1,%o3,%g1 | |
104 | mulscc %g1,%o3,%g1 | |
105 | mulscc %g1,%o3,%g1 | |
106 | mulscc %g1,%o3,%g1 | |
107 | mulscc %g1,%o3,%g1 | |
108 | mulscc %g1,%o3,%g1 | |
109 | mulscc %g1,%o3,%g1 | |
110 | mulscc %g1,%o3,%g1 | |
111 | mulscc %g1,%o3,%g1 | |
112 | mulscc %g1,%o3,%g1 | |
113 | mulscc %g1,%o3,%g1 | |
114 | mulscc %g1,%o3,%g1 | |
115 | mulscc %g1,%o3,%g1 | |
116 | mulscc %g1,%o3,%g1 | |
117 | mulscc %g1,%o3,%g1 | |
118 | mulscc %g1,%o3,%g1 | |
119 | mulscc %g1,%o3,%g1 | |
120 | mulscc %g1,%o3,%g1 | |
121 | mulscc %g1,%o3,%g1 | |
122 | mulscc %g1,%o3,%g1 | |
123 | mulscc %g1,%o3,%g1 | |
124 | mulscc %g1,%o3,%g1 | |
125 | mulscc %g1,%o3,%g1 | |
126 | mulscc %g1,%o3,%g1 | |
127 | mulscc %g1,%o3,%g1 | |
128 | mulscc %g1,%o3,%g1 | |
129 | mulscc %g1,%o3,%g1 | |
130 | mulscc %g1,%o3,%g1 | |
131 | mulscc %g1,%o3,%g1 | |
132 | mulscc %g1,%o3,%g1 | |
133 | mulscc %g1,%g0,%g1 | |
134 | rd %y,%g3 | |
135 | addcc %g3,%o0,%g3 | |
136 | addx %g2,%g1,%o0 | |
137 | addcc %o2,4,%o2 | |
f41c8091 | 138 | bne LOC(loop) |
28f540f4 RM |
139 | ld [%o4+%o2],%o5 |
140 | ||
141 | addcc %o5,%g3,%g3 | |
142 | addx %o0,%g0,%o0 | |
143 | retl | |
144 | st %g3,[%o4+%o2] | |
f41c8091 UD |
145 | |
146 | END(__mpn_addmul_1) |