mirror of https://github.com/axmolengine/axmol.git
168 lines
5.1 KiB
C++
168 lines
5.1 KiB
C++
#ifndef AL_BIT_H
|
|
#define AL_BIT_H
|
|
|
|
#include <cstdint>
|
|
#include <cstring>
|
|
#include <limits>
|
|
#include <new>
|
|
#include <type_traits>
|
|
#if !defined(__GNUC__) && (defined(_WIN32) || defined(_WIN64))
|
|
#include <intrin.h>
|
|
#endif
|
|
|
|
namespace al {
|
|
|
|
template<typename To, typename From>
|
|
std::enable_if_t<sizeof(To) == sizeof(From) && std::is_trivially_copyable_v<From>
|
|
&& std::is_trivially_copyable_v<To>,
|
|
To> bit_cast(const From &src) noexcept
|
|
{
|
|
std::aligned_storage_t<sizeof(To), alignof(To)> dst;
|
|
std::memcpy(&dst, &src, sizeof(To));
|
|
return *std::launder(reinterpret_cast<To*>(&dst));
|
|
}
|
|
|
|
#ifdef __BYTE_ORDER__
|
|
enum class endian {
|
|
little = __ORDER_LITTLE_ENDIAN__,
|
|
big = __ORDER_BIG_ENDIAN__,
|
|
native = __BYTE_ORDER__
|
|
};
|
|
|
|
#else
|
|
|
|
/* This doesn't support mixed-endian. */
|
|
namespace detail_ {
|
|
constexpr bool IsLittleEndian() noexcept
|
|
{
|
|
static_assert(sizeof(char) < sizeof(int), "char is too big");
|
|
|
|
constexpr int test_val{1};
|
|
return static_cast<const char&>(test_val) ? true : false;
|
|
}
|
|
} // namespace detail_
|
|
|
|
enum class endian {
|
|
big = 0,
|
|
little = 1,
|
|
native = detail_::IsLittleEndian() ? little : big
|
|
};
|
|
#endif
|
|
|
|
|
|
/* Define popcount (population count/count 1 bits) and countr_zero (count
|
|
* trailing zero bits, starting from the lsb) methods, for various integer
|
|
* types.
|
|
*/
|
|
#ifdef __GNUC__
|
|
|
|
namespace detail_ {
|
|
inline int popcount(unsigned long long val) noexcept { return __builtin_popcountll(val); }
|
|
inline int popcount(unsigned long val) noexcept { return __builtin_popcountl(val); }
|
|
inline int popcount(unsigned int val) noexcept { return __builtin_popcount(val); }
|
|
|
|
inline int countr_zero(unsigned long long val) noexcept { return __builtin_ctzll(val); }
|
|
inline int countr_zero(unsigned long val) noexcept { return __builtin_ctzl(val); }
|
|
inline int countr_zero(unsigned int val) noexcept { return __builtin_ctz(val); }
|
|
} // namespace detail_
|
|
|
|
template<typename T>
|
|
inline std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value,
|
|
int> popcount(T v) noexcept { return detail_::popcount(v); }
|
|
|
|
template<typename T>
|
|
inline std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value,
|
|
int> countr_zero(T val) noexcept
|
|
{ return val ? detail_::countr_zero(val) : std::numeric_limits<T>::digits; }
|
|
|
|
#else
|
|
|
|
/* There be black magics here. The popcount method is derived from
|
|
* https://graphics.stanford.edu/~seander/bithacks.html#CountBitsSetParallel
|
|
* while the ctz-utilizing-popcount algorithm is shown here
|
|
* http://www.hackersdelight.org/hdcodetxt/ntz.c.txt
|
|
* as the ntz2 variant. These likely aren't the most efficient methods, but
|
|
* they're good enough if the GCC built-ins aren't available.
|
|
*/
|
|
namespace detail_ {
|
|
template<typename T, size_t = std::numeric_limits<T>::digits>
|
|
struct fast_utype { };
|
|
template<typename T>
|
|
struct fast_utype<T,8> { using type = std::uint_fast8_t; };
|
|
template<typename T>
|
|
struct fast_utype<T,16> { using type = std::uint_fast16_t; };
|
|
template<typename T>
|
|
struct fast_utype<T,32> { using type = std::uint_fast32_t; };
|
|
template<typename T>
|
|
struct fast_utype<T,64> { using type = std::uint_fast64_t; };
|
|
|
|
template<typename T>
|
|
constexpr T repbits(unsigned char bits) noexcept
|
|
{
|
|
T ret{bits};
|
|
for(size_t i{1};i < sizeof(T);++i)
|
|
ret = (ret<<8) | bits;
|
|
return ret;
|
|
}
|
|
} // namespace detail_
|
|
|
|
template<typename T>
|
|
constexpr std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value,
|
|
int> popcount(T val) noexcept
|
|
{
|
|
using fast_type = typename detail_::fast_utype<T>::type;
|
|
constexpr fast_type b01010101{detail_::repbits<fast_type>(0x55)};
|
|
constexpr fast_type b00110011{detail_::repbits<fast_type>(0x33)};
|
|
constexpr fast_type b00001111{detail_::repbits<fast_type>(0x0f)};
|
|
constexpr fast_type b00000001{detail_::repbits<fast_type>(0x01)};
|
|
|
|
fast_type v{fast_type{val} - ((fast_type{val} >> 1) & b01010101)};
|
|
v = (v & b00110011) + ((v >> 2) & b00110011);
|
|
v = (v + (v >> 4)) & b00001111;
|
|
return static_cast<int>(((v * b00000001) >> ((sizeof(T)-1)*8)) & 0xff);
|
|
}
|
|
|
|
#ifdef _WIN32
|
|
|
|
template<typename T>
|
|
inline std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value
|
|
&& std::numeric_limits<T>::digits <= 32,
|
|
int> countr_zero(T v)
|
|
{
|
|
unsigned long idx{std::numeric_limits<T>::digits};
|
|
_BitScanForward(&idx, static_cast<uint32_t>(v));
|
|
return static_cast<int>(idx);
|
|
}
|
|
|
|
template<typename T>
|
|
inline std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value
|
|
&& 32 < std::numeric_limits<T>::digits && std::numeric_limits<T>::digits <= 64,
|
|
int> countr_zero(T v)
|
|
{
|
|
unsigned long idx{std::numeric_limits<T>::digits};
|
|
#ifdef _WIN64
|
|
_BitScanForward64(&idx, v);
|
|
#else
|
|
if(!_BitScanForward(&idx, static_cast<uint32_t>(v)))
|
|
{
|
|
if(_BitScanForward(&idx, static_cast<uint32_t>(v>>32)))
|
|
idx += 32;
|
|
}
|
|
#endif /* _WIN64 */
|
|
return static_cast<int>(idx);
|
|
}
|
|
|
|
#else
|
|
|
|
template<typename T>
|
|
constexpr std::enable_if_t<std::is_integral<T>::value && std::is_unsigned<T>::value,
|
|
int> countr_zero(T value)
|
|
{ return popcount(static_cast<T>(~value & (value - 1))); }
|
|
|
|
#endif
|
|
#endif
|
|
|
|
} // namespace al
|
|
|
|
#endif /* AL_BIT_H */
|