/* mpz_addmul, mpz_submul -- add or subtract multiple.

Copyright 2001, 2004, 2005, 2012 Free Software Foundation, Inc.

This file is part of the GNU MP Library.

The GNU MP Library is free software; you can redistribute it and/or modify
it under the terms of either:

  * the GNU Lesser General Public License as published by the Free
    Software Foundation; either version 3 of the License, or (at your
    option) any later version.

or

  * the GNU General Public License as published by the Free Software
    Foundation; either version 2 of the License, or (at your option) any
    later version.

or both in parallel, as here.

The GNU MP Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received copies of the GNU General Public License and the
GNU Lesser General Public License along with the GNU MP Library.  If not,
see https://www.gnu.org/licenses/.  */
30
31#include "gmp-impl.h"
32
33
/* Non-zero when the magnitude {xp,xsize} is strictly less than {yp,ysize}.
   Both operands are expected to have a non-zero high limb, so a difference
   in limb count decides the comparison by itself; only equal-length
   operands need a limb-by-limb mpn_cmp.  Arguments may be evaluated more
   than once.  */
#define mpn_cmp_twosizes_lt(xp,xsize, yp,ysize)         \
  ((xsize) == (ysize)                                   \
   ? (mpn_cmp (xp, yp, xsize) < 0)                      \
   : ((xsize) < (ysize)))
38
39
/* sub>=0 means an addmul w += x*y, sub<0 means a submul w -= x*y.

   The signs of w, x and y are fully accounted for by each flipping "sub":
   the signed size field of each operand is XORed into "sub", so afterwards
   only the sign of "sub" is meaningful, not its value.

   The sign of w is retained for the result, unless the absolute value
   submul underflows, in which case it flips.  */

/* Forward declaration of the worker under its internal symbol name.  The
   parameter list is wrapped in REGPARM_3_1 and the declaration tagged with
   REGPARM_ATTR; both come from outside this file (presumably a
   register-parameter calling convention -- confirm in gmp-impl.h).  */
static void __gmpz_aorsmul (REGPARM_3_1 (mpz_ptr w, mpz_srcptr x, mpz_srcptr y, mp_size_t sub)) REGPARM_ATTR (1);
/* Every use of mpz_aorsmul(...) in this file, including the header of the
   function definition that follows, expands through this macro so that the
   declaration, definition and calls all get the same REGPARM_3_1 wrapping.  */
#define mpz_aorsmul(w,x,y,sub) __gmpz_aorsmul (REGPARM_3_1 (w, x, y, sub))
49
50REGPARM_ATTR (1) static void
51mpz_aorsmul (mpz_ptr w, mpz_srcptr x, mpz_srcptr y, mp_size_t sub)
52{
53 mp_size_t xsize, ysize, tsize, wsize, wsize_signed;
54 mp_ptr wp, tp;
55 mp_limb_t c, high;
56 TMP_DECL;
57
58 /* w unaffected if x==0 or y==0 */
59 xsize = SIZ(x);
60 ysize = SIZ(y);
61 if (xsize == 0 || ysize == 0)
62 return;
63
64 /* make x the bigger of the two */
65 if (ABS(ysize) > ABS(xsize))
66 {
67 MPZ_SRCPTR_SWAP (x, y);
68 MP_SIZE_T_SWAP (xsize, ysize);
69 }
70
71 sub ^= ysize;
72 ysize = ABS(ysize);
73
74 /* use mpn_addmul_1/mpn_submul_1 if possible */
75 if (ysize == 1)
76 {
77 mpz_aorsmul_1 (w, x, PTR(y)[0], sub);
78 return;
79 }
80
81 sub ^= xsize;
82 xsize = ABS(xsize);
83
84 wsize_signed = SIZ(w);
85 sub ^= wsize_signed;
86 wsize = ABS(wsize_signed);
87
88 tsize = xsize + ysize;
89 wp = MPZ_REALLOC (w, MAX (wsize, tsize) + 1);
90
91 if (wsize_signed == 0)
92 {
93 /* Nothing to add to, just set w=x*y. No w==x or w==y overlap here,
94 since we know x,y!=0 but w==0. */
95 high = mpn_mul (wp, PTR(x),xsize, PTR(y),ysize);
96 tsize -= (high == 0);
97 SIZ(w) = (sub >= 0 ? tsize : -tsize);
98 return;
99 }
100
101 TMP_MARK;
102 tp = TMP_ALLOC_LIMBS (tsize);
103
104 high = mpn_mul (tp, PTR(x),xsize, PTR(y),ysize);
105 tsize -= (high == 0);
106 ASSERT (tp[tsize-1] != 0);
107 if (sub >= 0)
108 {
109 mp_srcptr up = wp;
110 mp_size_t usize = wsize;
111
112 if (usize < tsize)
113 {
114 up = tp;
115 usize = tsize;
116 tp = wp;
117 tsize = wsize;
118
119 wsize = usize;
120 }
121
122 c = mpn_add (wp, up,usize, tp,tsize);
123 wp[wsize] = c;
124 wsize += (c != 0);
125 }
126 else
127 {
128 mp_srcptr up = wp;
129 mp_size_t usize = wsize;
130
131 if (mpn_cmp_twosizes_lt (up,usize, tp,tsize))
132 {
133 up = tp;
134 usize = tsize;
135 tp = wp;
136 tsize = wsize;
137
138 wsize = usize;
139 wsize_signed = -wsize_signed;
140 }
141
142 ASSERT_NOCARRY (mpn_sub (wp, up,usize, tp,tsize));
143 wsize = usize;
144 MPN_NORMALIZE (wp, wsize);
145 }
146
147 SIZ(w) = (wsize_signed >= 0 ? wsize : -wsize);
148
149 TMP_FREE;
150}
151
152
153void
154mpz_addmul (mpz_ptr w, mpz_srcptr u, mpz_srcptr v)
155{
156 mpz_aorsmul (w, u, v, (mp_size_t) 0);
157}
158
159void
160mpz_submul (mpz_ptr w, mpz_srcptr u, mpz_srcptr v)
161{
162 mpz_aorsmul (w, u, v, (mp_size_t) -1);
163}