10 #include "../../IndexFlat.h"
11 #include "../GpuIndexFlat.h"
12 #include "../StandardGpuResources.h"
13 #include "../utils/DeviceUtils.h"
14 #include "../test/TestUtils.h"
15 #include <gtest/gtest.h>
20 constexpr
float kF16MaxRelErr = 0.07f;
21 constexpr
float kF32MaxRelErr = 6e-3f;
29 numQueriesOverride(-1),
37 int numQueriesOverride;
42 int numVecs = opt.numVecsOverride > 0 ?
43 opt.numVecsOverride : faiss::gpu::randVal(1000, 20000);
44 int dim = faiss::gpu::randVal(50, 800);
45 int numQuery = opt.numQueriesOverride > 0 ?
46 opt.numQueriesOverride : faiss::gpu::randVal(1, 512);
51 int k = opt.useFloat16 ?
52 std::min(faiss::gpu::randVal(1, 50), numVecs) :
53 std::min(faiss::gpu::randVal(1, 1024), numVecs);
54 if (opt.kOverride > 0) {
67 int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
85 std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
86 cpuIndex->
add(numVecs, vecs.data());
87 gpuIndex->
add(numVecs, vecs.data());
89 std::stringstream str;
90 str << (opt.useL2 ?
"L2" :
"IP") <<
" numVecs " << numVecs
92 <<
" useFloat16 " << opt.useFloat16
93 <<
" transposed " << opt.useTransposed
94 <<
" numQuery " << numQuery
99 faiss::gpu::compareIndices(*cpuIndex, *gpuIndex, numQuery, dim, k, str.str(),
100 opt.useFloat16 ? kF16MaxRelErr : kF32MaxRelErr,
104 opt.useFloat16 ? 0.99f : 0.1f,
105 opt.useFloat16 ? 0.65f : 0.015f);
108 TEST(TestGpuIndexFlat, IP_Float32) {
109 for (
int tries = 0; tries < 5; ++tries) {
112 opt.useFloat16 =
false;
113 opt.useTransposed =
false;
117 opt.useTransposed =
true;
122 TEST(TestGpuIndexFlat, L2_Float32) {
123 for (
int tries = 0; tries < 5; ++tries) {
126 opt.useFloat16 =
false;
127 opt.useTransposed =
false;
131 opt.useTransposed =
true;
137 TEST(TestGpuIndexFlat, L2_Float32_K1) {
138 for (
int tries = 0; tries < 5; ++tries) {
141 opt.useFloat16 =
false;
142 opt.useTransposed =
false;
149 TEST(TestGpuIndexFlat, IP_Float16) {
150 for (
int tries = 0; tries < 5; ++tries) {
153 opt.useFloat16 =
true;
154 opt.useTransposed =
false;
158 opt.useTransposed =
true;
163 TEST(TestGpuIndexFlat, L2_Float16) {
164 for (
int tries = 0; tries < 5; ++tries) {
167 opt.useFloat16 =
true;
168 opt.useTransposed =
false;
172 opt.useTransposed =
true;
178 TEST(TestGpuIndexFlat, L2_Float16_K1) {
179 for (
int tries = 0; tries < 5; ++tries) {
182 opt.useFloat16 =
true;
183 opt.useTransposed =
false;
191 TEST(TestGpuIndexFlat, L2_Tiling) {
192 for (
int tries = 0; tries < 2; ++tries) {
195 opt.useFloat16 =
false;
196 opt.useTransposed =
false;
197 opt.numVecsOverride = 1000000;
198 opt.numQueriesOverride = 4;
202 opt.useTransposed =
true;
207 TEST(TestGpuIndexFlat, QueryEmpty) {
223 std::vector<float> queries(numQuery * dim, 1.0f);
225 std::vector<float> dist(numQuery * k, 0);
226 std::vector<faiss::Index::idx_t> ind(numQuery * k);
228 gpuIndex.
search(numQuery, queries.data(), k, dist.data(), ind.data());
230 for (
auto d : dist) {
231 EXPECT_EQ(d, std::numeric_limits<float>::max());
239 TEST(TestGpuIndexFlat, CopyFrom) {
240 int numVecs = faiss::gpu::randVal(100, 200);
241 int dim = faiss::gpu::randVal(1, 1000);
245 std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
246 cpuIndex.
add(numVecs, vecs.data());
252 int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
263 EXPECT_EQ(gpuIndex.
ntotal, numVecs);
265 EXPECT_EQ(cpuIndex.
d, gpuIndex.
d);
266 EXPECT_EQ(cpuIndex.
d, dim);
268 int idx = faiss::gpu::randVal(0, numVecs - 1);
270 std::vector<float> gpuVals(dim);
273 std::vector<float> cpuVals(dim);
276 EXPECT_EQ(gpuVals, cpuVals);
279 TEST(TestGpuIndexFlat, CopyTo) {
283 int numVecs = faiss::gpu::randVal(100, 200);
284 int dim = faiss::gpu::randVal(1, 1000);
286 int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
295 std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
296 gpuIndex.
add(numVecs, vecs.data());
300 gpuIndex.
copyTo(&cpuIndex);
303 EXPECT_EQ(gpuIndex.
ntotal, numVecs);
305 EXPECT_EQ(cpuIndex.
d, gpuIndex.
d);
306 EXPECT_EQ(cpuIndex.
d, dim);
308 int idx = faiss::gpu::randVal(0, numVecs - 1);
310 std::vector<float> gpuVals(dim);
313 std::vector<float> cpuVals(dim);
316 EXPECT_EQ(gpuVals, cpuVals);
319 TEST(TestGpuIndexFlat, UnifiedMemory) {
322 int device = faiss::gpu::randVal(0, faiss::gpu::getNumDevices() - 1);
324 if (!faiss::gpu::getFullUnifiedMemSupport(device)) {
333 size_t numVecs = 50000;
344 config.
memorySpace = faiss::gpu::MemorySpace::Unified;
348 std::vector<float> vecs = faiss::gpu::randVecs(numVecs, dim);
349 cpuIndexL2.add(numVecs, vecs.data());
350 gpuIndexL2.add(numVecs, vecs.data());
354 faiss::gpu::compareIndices(cpuIndexL2, gpuIndexL2,
355 numQuery, dim, k,
"Unified Memory",
361 int main(
int argc,
char** argv) {
362 testing::InitGoogleTest(&argc, argv);
365 faiss::gpu::setTestSeed(100);
367 return RUN_ALL_TESTS();
void copyTo(faiss::IndexFlat *index) const
void reconstruct(idx_t key, float *recons) const override
bool useFloat16
Whether or not data is stored as float16.
int device
GPU device on which the index is resident.
void reconstruct(faiss::Index::idx_t key, float *out) const override
idx_t ntotal
total nb of indexed vectors
void add(idx_t n, const float *x) override
void copyFrom(const faiss::IndexFlat *index)
void add(faiss::Index::idx_t, const float *x) override
Overrides to avoid excessive copies.
void search(faiss::Index::idx_t n, const float *x, faiss::Index::idx_t k, float *distances, faiss::Index::idx_t *labels) const override