master
 1//! popcount - population count
 2//! counts the number of 1 bits
 3//! SWAR-Popcount: count bits of duos, aggregate to nibbles, and bytes inside
 4//!   x-bit register in parallel to sum up all bytes
 5//!   SWAR-Masks and factors can be defined as 2-adic fractions
 6//! TAOCP: Combinational Algorithms, Bitwise Tricks And Techniques,
 7//!   subsubsection "Working with the rightmost bits" and "Sideways addition".
 8
 9const builtin = @import("builtin");
10const std = @import("std");
11const common = @import("common.zig");
12
13pub const panic = common.panic;
14
15comptime {
16    @export(&__popcountsi2, .{ .name = "__popcountsi2", .linkage = common.linkage, .visibility = common.visibility });
17    @export(&__popcountdi2, .{ .name = "__popcountdi2", .linkage = common.linkage, .visibility = common.visibility });
18    @export(&__popcountti2, .{ .name = "__popcountti2", .linkage = common.linkage, .visibility = common.visibility });
19}
20
21pub fn __popcountsi2(a: i32) callconv(.c) i32 {
22    return popcountXi2(i32, a);
23}
24
25pub fn __popcountdi2(a: i64) callconv(.c) i32 {
26    return popcountXi2(i64, a);
27}
28
29pub fn __popcountti2(a: i128) callconv(.c) i32 {
30    return popcountXi2(i128, a);
31}
32
33inline fn popcountXi2(comptime ST: type, a: ST) i32 {
34    const UT = switch (ST) {
35        i32 => u32,
36        i64 => u64,
37        i128 => u128,
38        else => unreachable,
39    };
40    var x: UT = @bitCast(a);
41    x -= (x >> 1) & (~@as(UT, 0) / 3); // 0x55...55, aggregate duos
42    x = ((x >> 2) & (~@as(UT, 0) / 5)) // 0x33...33, aggregate nibbles
43        + (x & (~@as(UT, 0) / 5));
44    x += x >> 4;
45    x &= ~@as(UT, 0) / 17; // 0x0F...0F, aggregate bytes
46    // 8 most significant bits of x + (x<<8) + (x<<16) + ..
47    x *%= ~@as(UT, 0) / 255; // 0x01...01
48    x >>= (@bitSizeOf(ST) - 8);
49    return @intCast(x);
50}
51
52test {
53    _ = @import("popcountsi2_test.zig");
54    _ = @import("popcountdi2_test.zig");
55    _ = @import("popcountti2_test.zig");
56}