utils.h 1.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172
  1. #pragma once
  2. #if defined(__GNUC__) || defined(__clang__)
  3. static inline uint32_t clz32(unsigned long val)
  4. {
  5. return __builtin_clz(val);
  6. }
  7. static inline uint32_t ctz32(unsigned long val)
  8. {
  9. return __builtin_ctz(val);
  10. }
  11. #elif defined(_MSC_VER) && _MSC_VER >= 1400
  12. static inline uint32_t clz32(unsigned long val)
  13. {
  14. /* __lzcnt() / _lzcnt_u32() do not work correctly on older Intel CPUs,
  15. * so use BSR instead for better compatibility. */
  16. uint32_t zeros = 0;
  17. _BitScanReverse(&zeros, val);
  18. return 31 - zeros;
  19. }
  20. static inline uint32_t ctz32(unsigned long val)
  21. {
  22. return _tzcnt_u32(val);
  23. }
  24. #else
  25. static uint32_t popcnt(uint32_t x)
  26. {
  27. x -= ((x >> 1) & 0x55555555);
  28. x = (((x >> 2) & 0x33333333) + (x & 0x33333333));
  29. x = (((x >> 4) + x) & 0x0f0f0f0f);
  30. x += (x >> 8);
  31. x += (x >> 16);
  32. return x & 0x0000003f;
  33. }
  34. static uint32_t clz32(uint32_t x)
  35. {
  36. x |= (x >> 1);
  37. x |= (x >> 2);
  38. x |= (x >> 4);
  39. x |= (x >> 8);
  40. x |= (x >> 16);
  41. return 32 - popcnt(x);
  42. }
  43. static uint32_t ctz32(uint32_t x)
  44. {
  45. return popcnt((x & -x) - 1);
  46. }
  47. #endif
  48. static inline uint32_t min_u32(uint32_t a, uint32_t b)
  49. {
  50. return (a < b) ? a : b;
  51. }
  52. static inline uint16_t min_u16(uint16_t a, uint16_t b)
  53. {
  54. return (a < b) ? a : b;
  55. }
  56. static inline int32_t min_i32(int32_t a, int32_t b)
  57. {
  58. return (a < b) ? a : b;
  59. }
  60. static inline uint8_t max_u8(uint8_t a, uint8_t b)
  61. {
  62. return (a > b) ? a : b;
  63. }