16 namespace faiss {
namespace gpu {
namespace utils {
18 template <
typename U,
typename V>
19 constexpr __host__ __device__
auto divUp(U a, V b) -> decltype(a + b) {
20 return (a + b - 1) / b;
23 template <
typename U,
typename V>
24 constexpr __host__ __device__
auto roundDown(U a, V b) -> decltype(a + b) {
28 template <
typename U,
typename V>
29 constexpr __host__ __device__
auto roundUp(U a, V b) -> decltype(a + b) {
30 return divUp(a, b) * b;
34 constexpr __host__ __device__ T pow(T n, T power) {
35 return (power > 0 ? n * pow(n, power - 1) : 1);
39 constexpr __host__ __device__ T pow2(T n) {
43 static_assert(pow2(8) == 256,
"pow2");
46 constexpr __host__ __device__
int log2(T n,
int p = 0) {
47 return (n <= 1) ? p : log2(n / 2, p + 1);
50 static_assert(log2(2) == 1,
"log2");
51 static_assert(log2(3) == 1,
"log2");
52 static_assert(log2(4) == 2,
"log2");
55 constexpr __host__ __device__
bool isPowerOf2(T v) {
56 return (v && !(v & (v - 1)));
59 static_assert(isPowerOf2(2048),
"isPowerOf2");
60 static_assert(!isPowerOf2(3333),
"isPowerOf2");
63 constexpr __host__ __device__ T nextHighestPowerOf2(T v) {
64 return (isPowerOf2(v) ? (T) 2 * v : (1 << (log2(v) + 1)));
67 static_assert(nextHighestPowerOf2(1) == 2,
"nextHighestPowerOf2");
68 static_assert(nextHighestPowerOf2(2) == 4,
"nextHighestPowerOf2");
69 static_assert(nextHighestPowerOf2(3) == 4,
"nextHighestPowerOf2");
70 static_assert(nextHighestPowerOf2(4) == 8,
"nextHighestPowerOf2");
72 static_assert(nextHighestPowerOf2(15) == 16,
"nextHighestPowerOf2");
73 static_assert(nextHighestPowerOf2(16) == 32,
"nextHighestPowerOf2");
74 static_assert(nextHighestPowerOf2(17) == 32,
"nextHighestPowerOf2");