blob: 87974d7104473de060a1abef1830f4e6dc86ac9c [file] [log] [blame]
Austin Schuhdace2a62020-08-18 10:56:48 -07001/* mpn_popcount, mpn_hamdist -- mpn bit population count/hamming distance.
2
3Copyright 1994, 1996, 2000-2002, 2005, 2011, 2012 Free Software Foundation,
4Inc.
5
6This file is part of the GNU MP Library.
7
8The GNU MP Library is free software; you can redistribute it and/or modify
9it under the terms of either:
10
11 * the GNU Lesser General Public License as published by the Free
12 Software Foundation; either version 3 of the License, or (at your
13 option) any later version.
14
15or
16
17 * the GNU General Public License as published by the Free Software
18 Foundation; either version 2 of the License, or (at your option) any
19 later version.
20
21or both in parallel, as here.
22
23The GNU MP Library is distributed in the hope that it will be useful, but
24WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
25or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
26for more details.
27
28You should have received copies of the GNU General Public License and the
29GNU Lesser General Public License along with the GNU MP Library. If not,
30see https://www.gnu.org/licenses/. */
31
32#include "gmp-impl.h"
33
34#if OPERATION_popcount
35#define FNAME mpn_popcount
36#define POPHAM(u,v) u
37#endif
38
39#if OPERATION_hamdist
40#define FNAME mpn_hamdist
41#define POPHAM(u,v) u ^ v
42#endif
43
44mp_bitcnt_t
45FNAME (mp_srcptr up,
46#if OPERATION_hamdist
47 mp_srcptr vp,
48#endif
49 mp_size_t n) __GMP_NOTHROW
50{
51 mp_bitcnt_t result = 0;
52 mp_limb_t p0, p1, p2, p3, x, p01, p23;
53 mp_size_t i;
54
55 ASSERT (n >= 1); /* Actually, this code handles any n, but some
56 assembly implementations do not. */
57
58 for (i = n >> 2; i != 0; i--)
59 {
60 p0 = POPHAM (up[0], vp[0]);
61 p0 -= (p0 >> 1) & MP_LIMB_T_MAX/3; /* 2 0-2 */
62 p0 = ((p0 >> 2) & MP_LIMB_T_MAX/5) + (p0 & MP_LIMB_T_MAX/5); /* 4 0-4 */
63
64 p1 = POPHAM (up[1], vp[1]);
65 p1 -= (p1 >> 1) & MP_LIMB_T_MAX/3; /* 2 0-2 */
66 p1 = ((p1 >> 2) & MP_LIMB_T_MAX/5) + (p1 & MP_LIMB_T_MAX/5); /* 4 0-4 */
67
68 p01 = p0 + p1; /* 8 0-8 */
69 p01 = ((p01 >> 4) & MP_LIMB_T_MAX/17) + (p01 & MP_LIMB_T_MAX/17); /* 8 0-16 */
70
71 p2 = POPHAM (up[2], vp[2]);
72 p2 -= (p2 >> 1) & MP_LIMB_T_MAX/3; /* 2 0-2 */
73 p2 = ((p2 >> 2) & MP_LIMB_T_MAX/5) + (p2 & MP_LIMB_T_MAX/5); /* 4 0-4 */
74
75 p3 = POPHAM (up[3], vp[3]);
76 p3 -= (p3 >> 1) & MP_LIMB_T_MAX/3; /* 2 0-2 */
77 p3 = ((p3 >> 2) & MP_LIMB_T_MAX/5) + (p3 & MP_LIMB_T_MAX/5); /* 4 0-4 */
78
79 p23 = p2 + p3; /* 8 0-8 */
80 p23 = ((p23 >> 4) & MP_LIMB_T_MAX/17) + (p23 & MP_LIMB_T_MAX/17); /* 8 0-16 */
81
82 x = p01 + p23; /* 8 0-32 */
83 x = (x >> 8) + x; /* 8 0-64 */
84 x = (x >> 16) + x; /* 8 0-128 */
85#if GMP_LIMB_BITS > 32
86 x = ((x >> 32) & 0xff) + (x & 0xff); /* 8 0-256 */
87 result += x;
88#else
89 result += x & 0xff;
90#endif
91 up += 4;
92#if OPERATION_hamdist
93 vp += 4;
94#endif
95 }
96
97 n &= 3;
98 if (n != 0)
99 {
100 x = 0;
101 do
102 {
103 p0 = POPHAM (up[0], vp[0]);
104 p0 -= (p0 >> 1) & MP_LIMB_T_MAX/3; /* 2 0-2 */
105 p0 = ((p0 >> 2) & MP_LIMB_T_MAX/5) + (p0 & MP_LIMB_T_MAX/5); /* 4 0-4 */
106 p0 = ((p0 >> 4) + p0) & MP_LIMB_T_MAX/17; /* 8 0-8 */
107
108 x += p0;
109 up += 1;
110#if OPERATION_hamdist
111 vp += 1;
112#endif
113 }
114 while (--n);
115
116 x = (x >> 8) + x;
117 x = (x >> 16) + x;
118#if GMP_LIMB_BITS > 32
119 x = (x >> 32) + x;
120#endif
121 result += x & 0xff;
122 }
123
124 return result;
125}