diff options
author | Stephan Diestelhorst <stephan.diestelhorst@arm.com> | 2014-04-24 17:41:26 +0100 |
---|---|---|
committer | Stephan Diestelhorst <stephan.diestelhorst@arm.com> | 2014-04-24 17:41:26 +0100 |
commit | fe98cb6be471e8187658fea950bee0ecd5bf959c (patch) | |
tree | cb9050f97b8961b796982afd5204fbdaed58a406 | |
parent | ba98d598aef0e3823d2ded7084b1a2829ade5b73 (diff) | |
download | gem5-fe98cb6be471e8187658fea950bee0ecd5bf959c.tar.xz |
misc: Add functions for doing popcount and power-of-two checking
Adds two public domain algorithms for determining number of set bits and also
whether a value is a power of two, uses the builtin that is available in GCC
and clang for popcount.
-rw-r--r-- | src/base/bitfield.hh | 33 |
1 files changed, 33 insertions, 0 deletions
diff --git a/src/base/bitfield.hh b/src/base/bitfield.hh index cc3695159..2cf93924b 100644 --- a/src/base/bitfield.hh +++ b/src/base/bitfield.hh @@ -178,4 +178,37 @@ findLsbSet(uint64_t val) { return lsb; } +/** + * Checks if a number is a power of two, or zero. + */ +template <class T> +inline bool +isPow2(T v) { + return (v & (v - 1)) == (T)0; +} + +/** + * Returns the number of set ones in the provided value. + * PD algorithm from + * http://graphics.stanford.edu/~seander/bithacks.html#CountBitsSetParallel + */ +inline int +popCount(uint64_t val) { +#ifndef __has_builtin + #define __has_builtin(foo) 0 +#endif +#if defined(__GNUC__) || (defined(__clang__) && __has_builtin(__builtin_popcountl)) + return __builtin_popcountl(val); +#else + const uint64_t m1 = 0x5555555555555555; // ..010101b + const uint64_t m2 = 0x3333333333333333; // ..110011b + const uint64_t m4 = 0x0f0f0f0f0f0f0f0f; // ..001111b + const uint64_t sum = 0x0101010101010101; + + val -= (val >> 1) & m1; // 2 bits count -> 2 bits + val = (val & m2) + ((val >> 2) & m2); // 4 bits count -> 4 bits + val = (val + (val >> 4)) & m4; // 8 bits count -> 8 bits + return (val * sum) >> 56; // horizontal sum +#endif // defined(__GNUC__) || (defined(__clang__) && __has_builtin(__builtin_popcountl)) +} #endif // __BASE_BITFIELD_HH__ |