blob: 25b5cd515b23a5b729ef75e46fc12394dbc4a6d9 [file] [log] [blame]
/**
* This module contains a collection of bit-level operations.
*
* Copyright: Copyright Don Clugston 2005 - 2013.
* License: $(LINK2 http://www.boost.org/LICENSE_1_0.txt, Boost License 1.0)
* Authors: Don Clugston, Sean Kelly, Walter Bright, Alex Rønne Petersen, Thomas Stuart Bockman
* Source: $(DRUNTIMESRC core/_bitop.d)
*/
module core.bitop;
nothrow:
@safe:
@nogc:
version (D_InlineAsm_X86_64)
version = AsmX86;
else version (D_InlineAsm_X86)
version = AsmX86;
version (X86_64)
version = AnyX86;
else version (X86)
version = AnyX86;
// Use to implement 64-bit bitops on 32-bit arch.
private union Split64
{
ulong u64;
struct
{
version (LittleEndian)
{
uint lo;
uint hi;
}
else
{
uint hi;
uint lo;
}
}
pragma(inline, true)
this(ulong u64) @safe pure nothrow @nogc
{
if (__ctfe)
{
lo = cast(uint) u64;
hi = cast(uint) (u64 >>> 32);
}
else
this.u64 = u64;
}
}
unittest
{
const rt = Split64(1);
assert((rt.lo == 1) && (rt.hi == 0));
enum ct = Split64(1);
assert((ct.lo == rt.lo) && (ct.hi == rt.hi));
}
/**
* Scans the bits in v starting with bit 0, looking
* for the first set bit.
* Returns:
* The bit number of the first bit set.
* The return value is undefined if v is zero.
*/
int bsf(uint v) pure
{
pragma(inline, false); // so intrinsic detection will work
return softBsf!uint(v);
}
/// ditto
int bsf(ulong v) pure
{
static if (size_t.sizeof == ulong.sizeof) // 64 bit code gen
{
pragma(inline, false); // so intrinsic detection will work
return softBsf!ulong(v);
}
else
{
/* intrinsic not available for 32 bit code,
* make do with 32 bit bsf
*/
const sv = Split64(v);
return (sv.lo == 0)?
bsf(sv.hi) + 32 :
bsf(sv.lo);
}
}
///
unittest
{
assert(bsf(0x21) == 0);
assert(bsf(ulong.max << 39) == 39);
}
unittest
{
// Make sure bsf() is available at CTFE
enum test_ctfe = bsf(ulong.max);
assert(test_ctfe == 0);
}
/**
* Scans the bits in v from the most significant bit
* to the least significant bit, looking
* for the first set bit.
* Returns:
* The bit number of the first bit set.
* The return value is undefined if v is zero.
*/
int bsr(uint v) pure
{
pragma(inline, false); // so intrinsic detection will work
return softBsr!uint(v);
}
/// ditto
int bsr(ulong v) pure
{
static if (size_t.sizeof == ulong.sizeof) // 64 bit code gen
{
pragma(inline, false); // so intrinsic detection will work
return softBsr!ulong(v);
}
else
{
/* intrinsic not available for 32 bit code,
* make do with 32 bit bsr
*/
const sv = Split64(v);
return (sv.hi == 0)?
bsr(sv.lo) :
bsr(sv.hi) + 32;
}
}
///
unittest
{
assert(bsr(0x21) == 5);
assert(bsr((ulong.max >> 15) - 1) == 48);
}
unittest
{
// Make sure bsr() is available at CTFE
enum test_ctfe = bsr(ulong.max);
assert(test_ctfe == 63);
}
private alias softBsf(N) = softScan!(N, true);
private alias softBsr(N) = softScan!(N, false);
/* Shared software fallback implementation for bit scan foward and reverse.
If forward is true, bsf is computed (the index of the first set bit).
If forward is false, bsr is computed (the index of the last set bit).
-1 is returned if no bits are set (v == 0).
*/
private int softScan(N, bool forward)(N v) pure
if (is(N == uint) || is(N == ulong))
{
// bsf() and bsr() are officially undefined for v == 0.
if (!v)
return -1;
// This is essentially an unrolled binary search:
enum mask(ulong lo) = forward ? cast(N) lo : cast(N)~lo;
enum inc(int up) = forward ? up : -up;
N x;
int ret;
static if (is(N == ulong))
{
x = v & mask!0x0000_0000_FFFF_FFFFL;
if (x)
{
v = x;
ret = forward ? 0 : 63;
}
else
ret = forward ? 32 : 31;
x = v & mask!0x0000_FFFF_0000_FFFFL;
if (x)
v = x;
else
ret += inc!16;
}
else static if (is(N == uint))
{
x = v & mask!0x0000_FFFF;
if (x)
{
v = x;
ret = forward ? 0 : 31;
}
else
ret = forward ? 16 : 15;
}
else
static assert(false);
x = v & mask!0x00FF_00FF_00FF_00FFL;
if (x)
v = x;
else
ret += inc!8;
x = v & mask!0x0F0F_0F0F_0F0F_0F0FL;
if (x)
v = x;
else
ret += inc!4;
x = v & mask!0x3333_3333_3333_3333L;
if (x)
v = x;
else
ret += inc!2;
x = v & mask!0x5555_5555_5555_5555L;
if (!x)
ret += inc!1;
return ret;
}
unittest
{
assert(softBsf!uint(0u) == -1);
assert(softBsr!uint(0u) == -1);
assert(softBsf!ulong(0uL) == -1);
assert(softBsr!ulong(0uL) == -1);
assert(softBsf!uint(0x0031_A000) == 13);
assert(softBsr!uint(0x0031_A000) == 21);
assert(softBsf!ulong(0x0000_0001_8000_0000L) == 31);
assert(softBsr!ulong(0x0000_0001_8000_0000L) == 32);
foreach (b; 0 .. 64)
{
if (b < 32)
{
assert(softBsf!uint(1u << b) == b);
assert(softBsr!uint(1u << b) == b);
}
assert(softBsf!ulong(1uL << b) == b);
assert(softBsr!ulong(1uL << b) == b);
}
}
/**
* Tests the bit.
* (No longer an intrisic - the compiler recognizes the patterns
* in the body.)
*/
int bt(const scope size_t* p, size_t bitnum) pure @system
{
static if (size_t.sizeof == 8)
return ((p[bitnum >> 6] & (1L << (bitnum & 63)))) != 0;
else static if (size_t.sizeof == 4)
return ((p[bitnum >> 5] & (1 << (bitnum & 31)))) != 0;
else
static assert(0);
}
///
@system pure unittest
{
size_t[2] array;
array[0] = 2;
array[1] = 0x100;
assert(bt(array.ptr, 1));
assert(array[0] == 2);
assert(array[1] == 0x100);
}
/**
* Tests and complements the bit.
*/
int btc(size_t* p, size_t bitnum) pure @system;
/**
* Tests and resets (sets to 0) the bit.
*/
int btr(size_t* p, size_t bitnum) pure @system;
/**
* Tests and sets the bit.
* Params:
* p = a non-NULL pointer to an array of size_ts.
* bitnum = a bit number, starting with bit 0 of p[0],
* and progressing. It addresses bits like the expression:
---
p[index / (size_t.sizeof*8)] & (1 << (index & ((size_t.sizeof*8) - 1)))
---
* Returns:
* A non-zero value if the bit was set, and a zero
* if it was clear.
*/
int bts(size_t* p, size_t bitnum) pure @system;
///
@system pure unittest
{
size_t[2] array;
array[0] = 2;
array[1] = 0x100;
assert(btc(array.ptr, 35) == 0);
if (size_t.sizeof == 8)
{
assert(array[0] == 0x8_0000_0002);
assert(array[1] == 0x100);
}
else
{
assert(array[0] == 2);
assert(array[1] == 0x108);
}
assert(btc(array.ptr, 35));
assert(array[0] == 2);
assert(array[1] == 0x100);
assert(bts(array.ptr, 35) == 0);
if (size_t.sizeof == 8)
{
assert(array[0] == 0x8_0000_0002);
assert(array[1] == 0x100);
}
else
{
assert(array[0] == 2);
assert(array[1] == 0x108);
}
assert(btr(array.ptr, 35));
assert(array[0] == 2);
assert(array[1] == 0x100);
}
/**
* Range over bit set. Each element is the bit number that is set.
*
* This is more efficient than testing each bit in a sparsely populated bit
* set. Note that the first bit in the bit set would be bit 0.
*/
struct BitRange
{
/// Number of bits in each size_t
enum bitsPerWord = size_t.sizeof * 8;
private
{
const(size_t)*bits; // points at next word of bits to check
size_t cur; // needed to allow searching bits using bsf
size_t idx; // index of current set bit
size_t len; // number of bits in the bit set.
}
@nogc nothrow pure:
/**
* Construct a BitRange.
*
* Params:
* bitarr = The array of bits to iterate over
* numBits = The total number of valid bits in the given bit array
*/
this(const(size_t)* bitarr, size_t numBits) @system
{
bits = bitarr;
len = numBits;
if (len)
{
// prime the first bit
cur = *bits++ ^ 1;
popFront();
}
}
/// Range functions
size_t front()
{
assert(!empty);
return idx;
}
/// ditto
bool empty() const
{
return idx >= len;
}
/// ditto
void popFront() @system
{
// clear the current bit
auto curbit = idx % bitsPerWord;
cur ^= size_t(1) << curbit;
if (!cur)
{
// find next size_t with set bit
idx -= curbit;
while (!cur)
{
if ((idx += bitsPerWord) >= len)
// now empty
return;
cur = *bits++;
}
idx += bsf(cur);
}
else
{
idx += bsf(cur) - curbit;
}
}
}
///
@system unittest
{
import core.stdc.stdlib : malloc, free;
import core.stdc.string : memset;
// initialize a bit array
enum nBytes = (100 + BitRange.bitsPerWord - 1) / 8;
size_t *bitArr = cast(size_t *)malloc(nBytes);
scope(exit) free(bitArr);
memset(bitArr, 0, nBytes);
// set some bits
bts(bitArr, 48);
bts(bitArr, 24);
bts(bitArr, 95);
bts(bitArr, 78);
enum sum = 48 + 24 + 95 + 78;
// iterate
size_t testSum;
size_t nBits;
foreach (b; BitRange(bitArr, 100))
{
testSum += b;
++nBits;
}
assert(testSum == sum);
assert(nBits == 4);
}
@system unittest
{
void testIt(size_t numBits, size_t[] bitsToTest...)
{
import core.stdc.stdlib : malloc, free;
import core.stdc.string : memset;
immutable numBytes = (numBits + size_t.sizeof * 8 - 1) / 8;
size_t* bitArr = cast(size_t *)malloc(numBytes);
scope(exit) free(bitArr);
memset(bitArr, 0, numBytes);
foreach (b; bitsToTest)
bts(bitArr, b);
auto br = BitRange(bitArr, numBits);
foreach (b; bitsToTest)
{
assert(!br.empty);
assert(b == br.front);
br.popFront();
}
assert(br.empty);
}
testIt(100, 0, 1, 31, 63, 85);
testIt(100, 6, 45, 89, 92, 99);
}
/**
* Swaps bytes in a 2 byte ushort.
* Params:
* x = value
* Returns:
* `x` with bytes swapped
*/
pragma(inline, false)
ushort byteswap(ushort x) pure
{
/* Calling it bswap(ushort) would break existing code that calls bswap(uint).
*
* This pattern is meant to be recognized by the dmd code generator.
* Don't change it without checking that an XCH instruction is still
* used to implement it.
* Inlining may also throw it off.
*/
return cast(ushort) (((x >> 8) & 0xFF) | ((x << 8) & 0xFF00u));
}
///
unittest
{
assert(byteswap(cast(ushort)0xF234) == 0x34F2);
static ushort xx = 0xF234;
assert(byteswap(xx) == 0x34F2);
}
/**
* Swaps bytes in a 4 byte uint end-to-end, i.e. byte 0 becomes
* byte 3, byte 1 becomes byte 2, byte 2 becomes byte 1, byte 3
* becomes byte 0.
*/
uint bswap(uint v) pure;
///
unittest
{
assert(bswap(0x01020304u) == 0x04030201u);
static uint xx = 0x10203040u;
assert(bswap(xx) == 0x40302010u);
}
/**
* Swaps bytes in an 8 byte ulong end-to-end, i.e. byte 0 becomes
* byte 7, byte 1 becomes byte 6, etc.
* This is meant to be recognized by the compiler as an intrinsic.
*/
ulong bswap(ulong v) pure;
///
unittest
{
assert(bswap(0x01020304_05060708uL) == 0x08070605_04030201uL);
static ulong xx = 0x10203040_50607080uL;
assert(bswap(xx) == 0x80706050_40302010uL);
}
version (DigitalMars) version (AnyX86) @system // not pure
{
/**
* Reads I/O port at port_address.
*/
ubyte inp(uint port_address);
/**
* ditto
*/
ushort inpw(uint port_address);
/**
* ditto
*/
uint inpl(uint port_address);
/**
* Writes and returns value to I/O port at port_address.
*/
ubyte outp(uint port_address, ubyte value);
/**
* ditto
*/
ushort outpw(uint port_address, ushort value);
/**
* ditto
*/
uint outpl(uint port_address, uint value);
}
/**
* Calculates the number of set bits in an integer.
*/
int popcnt(uint x) pure
{
// Select the fastest method depending on the compiler and CPU architecture
version (DigitalMars)
{
static if (is(typeof(_popcnt(uint.max))))
{
import core.cpuid;
if (!__ctfe && hasPopcnt)
return _popcnt(x);
}
}
return softPopcnt!uint(x);
}
unittest
{
assert( popcnt( 0 ) == 0 );
assert( popcnt( 7 ) == 3 );
assert( popcnt( 0xAA )== 4 );
assert( popcnt( 0x8421_1248 ) == 8 );
assert( popcnt( 0xFFFF_FFFF ) == 32 );
assert( popcnt( 0xCCCC_CCCC ) == 16 );
assert( popcnt( 0x7777_7777 ) == 24 );
// Make sure popcnt() is available at CTFE
enum test_ctfe = popcnt(uint.max);
assert(test_ctfe == 32);
}
/// ditto
int popcnt(ulong x) pure
{
// Select the fastest method depending on the compiler and CPU architecture
import core.cpuid;
static if (size_t.sizeof == uint.sizeof)
{
const sx = Split64(x);
version (DigitalMars)
{
static if (is(typeof(_popcnt(uint.max))))
{
if (!__ctfe && hasPopcnt)
return _popcnt(sx.lo) + _popcnt(sx.hi);
}
}
return softPopcnt!uint(sx.lo) + softPopcnt!uint(sx.hi);
}
else static if (size_t.sizeof == ulong.sizeof)
{
version (DigitalMars)
{
static if (is(typeof(_popcnt(ulong.max))))
{
if (!__ctfe && hasPopcnt)
return _popcnt(x);
}
}
return softPopcnt!ulong(x);
}
else
static assert(false);
}
unittest
{
assert(popcnt(0uL) == 0);
assert(popcnt(1uL) == 1);
assert(popcnt((1uL << 32) - 1) == 32);
assert(popcnt(0x48_65_6C_6C_6F_3F_21_00uL) == 28);
assert(popcnt(ulong.max) == 64);
// Make sure popcnt() is available at CTFE
enum test_ctfe = popcnt(ulong.max);
assert(test_ctfe == 64);
}
private int softPopcnt(N)(N x) pure
if (is(N == uint) || is(N == ulong))
{
// Avoid branches, and the potential for cache misses which
// could be incurred with a table lookup.
// We need to mask alternate bits to prevent the
// sum from overflowing.
// add neighbouring bits. Each bit is 0 or 1.
enum mask1 = cast(N) 0x5555_5555_5555_5555L;
x = x - ((x>>1) & mask1);
// now each two bits of x is a number 00,01 or 10.
// now add neighbouring pairs
enum mask2a = cast(N) 0xCCCC_CCCC_CCCC_CCCCL;
enum mask2b = cast(N) 0x3333_3333_3333_3333L;
x = ((x & mask2a)>>2) + (x & mask2b);
// now each nibble holds 0000-0100. Adding them won't
// overflow any more, so we don't need to mask any more
enum mask4 = cast(N) 0x0F0F_0F0F_0F0F_0F0FL;
x = (x + (x >> 4)) & mask4;
enum shiftbits = is(N == uint)? 24 : 56;
enum maskMul = cast(N) 0x0101_0101_0101_0101L;
x = (x * maskMul) >> shiftbits;
return cast(int) x;
}
version (DigitalMars) version (AnyX86)
{
/**
* Calculates the number of set bits in an integer
* using the X86 SSE4 POPCNT instruction.
* POPCNT is not available on all X86 CPUs.
*/
ushort _popcnt( ushort x ) pure;
/// ditto
int _popcnt( uint x ) pure;
version (X86_64)
{
/// ditto
int _popcnt( ulong x ) pure;
}
unittest
{
// Not everyone has SSE4 instructions
import core.cpuid;
if (!hasPopcnt)
return;
static int popcnt_x(ulong u) nothrow @nogc
{
int c;
while (u)
{
c += u & 1;
u >>= 1;
}
return c;
}
for (uint u = 0; u < 0x1_0000; ++u)
{
//writefln("%x %x %x", u, _popcnt(cast(ushort)u), popcnt_x(cast(ushort)u));
assert(_popcnt(cast(ushort)u) == popcnt_x(cast(ushort)u));
assert(_popcnt(cast(uint)u) == popcnt_x(cast(uint)u));
uint ui = u * 0x3_0001;
assert(_popcnt(ui) == popcnt_x(ui));
version (X86_64)
{
assert(_popcnt(cast(ulong)u) == popcnt_x(cast(ulong)u));
ulong ul = u * 0x3_0003_0001;
assert(_popcnt(ul) == popcnt_x(ul));
}
}
}
}
deprecated("volatileLoad has been moved to core.volatile. Use core.volatile.volatileLoad instead.")
{
public import core.volatile : volatileLoad;
}
deprecated("volatileStore has been moved to core.volatile. Use core.volatile.volatileStore instead.")
{
public import core.volatile : volatileStore;
}
/**
* Reverses the order of bits in a 32-bit integer.
*/
pragma(inline, true)
uint bitswap( uint x ) pure
{
if (!__ctfe)
{
static if (is(typeof(asmBitswap32(x))))
return asmBitswap32(x);
}
return softBitswap!uint(x);
}
unittest
{
static void test(alias impl)()
{
assert (impl( 0x8000_0100 ) == 0x0080_0001);
foreach (i; 0 .. 32)
assert (impl(1 << i) == 1 << 32 - i - 1);
}
test!(bitswap)();
test!(softBitswap!uint)();
static if (is(typeof(asmBitswap32(0u))))
test!(asmBitswap32)();
// Make sure bitswap() is available at CTFE
enum test_ctfe = bitswap(1U);
assert(test_ctfe == (1U << 31));
}
/**
* Reverses the order of bits in a 64-bit integer.
*/
pragma(inline, true)
ulong bitswap ( ulong x ) pure
{
if (!__ctfe)
{
static if (is(typeof(asmBitswap64(x))))
return asmBitswap64(x);
}
return softBitswap!ulong(x);
}
unittest
{
static void test(alias impl)()
{
assert (impl( 0b1000000000000000000000010000000000000000100000000000000000000001)
== 0b1000000000000000000000010000000000000000100000000000000000000001);
assert (impl( 0b1110000000000000000000010000000000000000100000000000000000000001)
== 0b1000000000000000000000010000000000000000100000000000000000000111);
foreach (i; 0 .. 64)
assert (impl(1UL << i) == 1UL << 64 - i - 1);
}
test!(bitswap)();
test!(softBitswap!ulong)();
static if (is(typeof(asmBitswap64(0uL))))
test!(asmBitswap64)();
// Make sure bitswap() is available at CTFE
enum test_ctfe = bitswap(1UL);
assert(test_ctfe == (1UL << 63));
}
private N softBitswap(N)(N x) pure
if (is(N == uint) || is(N == ulong))
{
// swap 1-bit pairs:
enum mask1 = cast(N) 0x5555_5555_5555_5555L;
x = ((x >> 1) & mask1) | ((x & mask1) << 1);
// swap 2-bit pairs:
enum mask2 = cast(N) 0x3333_3333_3333_3333L;
x = ((x >> 2) & mask2) | ((x & mask2) << 2);
// swap 4-bit pairs:
enum mask4 = cast(N) 0x0F0F_0F0F_0F0F_0F0FL;
x = ((x >> 4) & mask4) | ((x & mask4) << 4);
// reverse the order of all bytes:
x = bswap(x);
return x;
}
version (AsmX86)
{
private uint asmBitswap32(uint x) @trusted pure
{
asm pure nothrow @nogc { naked; }
version (D_InlineAsm_X86_64)
{
version (Win64)
asm pure nothrow @nogc { mov EAX, ECX; }
else
asm pure nothrow @nogc { mov EAX, EDI; }
}
asm pure nothrow @nogc
{
// Author: Tiago Gasiba.
mov EDX, EAX;
shr EAX, 1;
and EDX, 0x5555_5555;
and EAX, 0x5555_5555;
shl EDX, 1;
or EAX, EDX;
mov EDX, EAX;
shr EAX, 2;
and EDX, 0x3333_3333;
and EAX, 0x3333_3333;
shl EDX, 2;
or EAX, EDX;
mov EDX, EAX;
shr EAX, 4;
and EDX, 0x0f0f_0f0f;
and EAX, 0x0f0f_0f0f;
shl EDX, 4;
or EAX, EDX;
bswap EAX;
ret;
}
}
}
version (D_InlineAsm_X86_64)
{
private ulong asmBitswap64(ulong x) @trusted pure
{
asm pure nothrow @nogc { naked; }
version (Win64)
asm pure nothrow @nogc { mov RAX, RCX; }
else
asm pure nothrow @nogc { mov RAX, RDI; }
asm pure nothrow @nogc
{
// Author: Tiago Gasiba.
mov RDX, RAX;
shr RAX, 1;
mov RCX, 0x5555_5555_5555_5555L;
and RDX, RCX;
and RAX, RCX;
shl RDX, 1;
or RAX, RDX;
mov RDX, RAX;
shr RAX, 2;
mov RCX, 0x3333_3333_3333_3333L;
and RDX, RCX;
and RAX, RCX;
shl RDX, 2;
or RAX, RDX;
mov RDX, RAX;
shr RAX, 4;
mov RCX, 0x0f0f_0f0f_0f0f_0f0fL;
and RDX, RCX;
and RAX, RCX;
shl RDX, 4;
or RAX, RDX;
bswap RAX;
ret;
}
}
}
/**
* Bitwise rotate `value` left (`rol`) or right (`ror`) by
* `count` bit positions.
*/
pure T rol(T)(const T value, const uint count)
if (__traits(isIntegral, T) && __traits(isUnsigned, T))
{
assert(count < 8 * T.sizeof);
return cast(T) ((value << count) | (value >> (T.sizeof * 8 - count)));
}
/// ditto
pure T ror(T)(const T value, const uint count)
if (__traits(isIntegral, T) && __traits(isUnsigned, T))
{
assert(count < 8 * T.sizeof);
return cast(T) ((value >> count) | (value << (T.sizeof * 8 - count)));
}
/// ditto
pure T rol(uint count, T)(const T value)
if (__traits(isIntegral, T) && __traits(isUnsigned, T))
{
static assert(count < 8 * T.sizeof);
return cast(T) ((value << count) | (value >> (T.sizeof * 8 - count)));
}
/// ditto
pure T ror(uint count, T)(const T value)
if (__traits(isIntegral, T) && __traits(isUnsigned, T))
{
static assert(count < 8 * T.sizeof);
return cast(T) ((value >> count) | (value << (T.sizeof * 8 - count)));
}
///
unittest
{
ubyte a = 0b11110000U;
ulong b = ~1UL;
assert(rol(a, 1) == 0b11100001);
assert(ror(a, 1) == 0b01111000);
assert(rol(a, 3) == 0b10000111);
assert(ror(a, 3) == 0b00011110);
assert(rol(a, 0) == a);
assert(ror(a, 0) == a);
assert(rol(b, 63) == ~(1UL << 63));
assert(ror(b, 63) == ~2UL);
assert(rol!3(a) == 0b10000111);
assert(ror!3(a) == 0b00011110);
}