123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170 |
- #ifndef AL_BIT_H
- #define AL_BIT_H
- #include <array>
- #ifndef __GNUC__
- #include <cstdint>
- #endif
- #include <cstring>
- #include <limits>
- #include <new>
- #include <type_traits>
- #if !defined(__GNUC__) && (defined(_WIN32) || defined(_WIN64))
- #include <intrin.h>
- #endif
- namespace al {
- template<typename To, typename From>
- std::enable_if_t<sizeof(To) == sizeof(From) && std::is_trivially_copyable_v<From>
- && std::is_trivially_copyable_v<To>,
- To> bit_cast(const From &src) noexcept
- {
- alignas(To) std::array<char,sizeof(To)> dst;
- std::memcpy(dst.data(), &src, sizeof(To));
- return *std::launder(reinterpret_cast<To*>(dst.data()));
- }
- #ifdef __BYTE_ORDER__
- enum class endian {
- little = __ORDER_LITTLE_ENDIAN__,
- big = __ORDER_BIG_ENDIAN__,
- native = __BYTE_ORDER__
- };
- #else
- /* This doesn't support mixed-endian. */
- namespace detail_ {
- constexpr bool IsLittleEndian() noexcept
- {
- static_assert(sizeof(char) < sizeof(int), "char is too big");
- constexpr int test_val{1};
- return static_cast<const char&>(test_val) ? true : false;
- }
- } // namespace detail_
- enum class endian {
- big = 0,
- little = 1,
- native = detail_::IsLittleEndian() ? little : big
- };
- #endif
- /* Define popcount (population count/count 1 bits) and countr_zero (count
- * trailing zero bits, starting from the lsb) methods, for various integer
- * types.
- */
- #ifdef __GNUC__
- namespace detail_ {
- inline int popcount(unsigned long long val) noexcept { return __builtin_popcountll(val); }
- inline int popcount(unsigned long val) noexcept { return __builtin_popcountl(val); }
- inline int popcount(unsigned int val) noexcept { return __builtin_popcount(val); }
- inline int countr_zero(unsigned long long val) noexcept { return __builtin_ctzll(val); }
- inline int countr_zero(unsigned long val) noexcept { return __builtin_ctzl(val); }
- inline int countr_zero(unsigned int val) noexcept { return __builtin_ctz(val); }
- } // namespace detail_
- template<typename T>
- inline std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value,
- int> popcount(T v) noexcept { return detail_::popcount(v); }
- template<typename T>
- inline std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value,
- int> countr_zero(T val) noexcept
- { return val ? detail_::countr_zero(val) : std::numeric_limits<T>::digits; }
- #else
- /* There be black magics here. The popcount method is derived from
- * https://graphics.stanford.edu/~seander/bithacks.html#CountBitsSetParallel
- * while the ctz-utilizing-popcount algorithm is shown here
- * http://www.hackersdelight.org/hdcodetxt/ntz.c.txt
- * as the ntz2 variant. These likely aren't the most efficient methods, but
- * they're good enough if the GCC built-ins aren't available.
- */
- namespace detail_ {
- template<typename T, size_t = std::numeric_limits<T>::digits>
- struct fast_utype { };
- template<typename T>
- struct fast_utype<T,8> { using type = std::uint_fast8_t; };
- template<typename T>
- struct fast_utype<T,16> { using type = std::uint_fast16_t; };
- template<typename T>
- struct fast_utype<T,32> { using type = std::uint_fast32_t; };
- template<typename T>
- struct fast_utype<T,64> { using type = std::uint_fast64_t; };
- template<typename T>
- constexpr T repbits(unsigned char bits) noexcept
- {
- T ret{bits};
- for(size_t i{1};i < sizeof(T);++i)
- ret = (ret<<8) | bits;
- return ret;
- }
- } // namespace detail_
- template<typename T>
- constexpr std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value,
- int> popcount(T val) noexcept
- {
- using fast_type = typename detail_::fast_utype<T>::type;
- constexpr fast_type b01010101{detail_::repbits<fast_type>(0x55)};
- constexpr fast_type b00110011{detail_::repbits<fast_type>(0x33)};
- constexpr fast_type b00001111{detail_::repbits<fast_type>(0x0f)};
- constexpr fast_type b00000001{detail_::repbits<fast_type>(0x01)};
- fast_type v{fast_type{val} - ((fast_type{val} >> 1) & b01010101)};
- v = (v & b00110011) + ((v >> 2) & b00110011);
- v = (v + (v >> 4)) & b00001111;
- return static_cast<int>(((v * b00000001) >> ((sizeof(T)-1)*8)) & 0xff);
- }
- #ifdef _WIN32
- template<typename T>
- inline std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value
- && std::numeric_limits<T>::digits <= 32,
- int> countr_zero(T v)
- {
- unsigned long idx{std::numeric_limits<T>::digits};
- _BitScanForward(&idx, static_cast<uint32_t>(v));
- return static_cast<int>(idx);
- }
- template<typename T>
- inline std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value
- && 32 < std::numeric_limits<T>::digits && std::numeric_limits<T>::digits <= 64,
- int> countr_zero(T v)
- {
- unsigned long idx{std::numeric_limits<T>::digits};
- #ifdef _WIN64
- _BitScanForward64(&idx, v);
- #else
- if(!_BitScanForward(&idx, static_cast<uint32_t>(v)))
- {
- if(_BitScanForward(&idx, static_cast<uint32_t>(v>>32)))
- idx += 32;
- }
- #endif /* _WIN64 */
- return static_cast<int>(idx);
- }
- #else
- template<typename T>
- constexpr std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value,
- int> countr_zero(T value)
- { return popcount(static_cast<T>(~value & (value - 1))); }
- #endif
- #endif
- } // namespace al
- #endif /* AL_BIT_H */
|