faiss/tutorial/cpp/3-IVFPQ.cpp

96 lines
2.1 KiB
C++
Raw Normal View History

/*
 * Copyright (c) Meta Platforms, Inc. and affiliates.
 *
 * This source code is licensed under the MIT license found in the
 * LICENSE file in the root directory of this source tree.
 */
#include <cstdio>
#include <cstdlib>
#include <random>
#include <vector>

#include <faiss/IndexFlat.h>
#include <faiss/IndexIVFPQ.h>

using idx_t = faiss::idx_t;

int main() {
int d = 64; // dimension
int nb = 100000; // database size
int nq = 10000; // nb of queries
2017-02-23 06:26:44 +08:00
std::mt19937 rng;
std::uniform_real_distribution<> distrib;
float* xb = new float[d * nb];
float* xq = new float[d * nq];
2017-02-23 06:26:44 +08:00
for (int i = 0; i < nb; i++) {
for (int j = 0; j < d; j++)
xb[d * i + j] = distrib(rng);
2017-02-23 06:26:44 +08:00
xb[d * i] += i / 1000.;
}
for (int i = 0; i < nq; i++) {
for (int j = 0; j < d; j++)
xq[d * i + j] = distrib(rng);
2017-02-23 06:26:44 +08:00
xq[d * i] += i / 1000.;
}
int nlist = 100;
int k = 4;
int m = 8; // bytes per vector
faiss::IndexFlatL2 quantizer(d); // the other index
2017-02-23 06:26:44 +08:00
faiss::IndexIVFPQ index(&quantizer, d, nlist, m, 8);
2017-02-23 06:26:44 +08:00
index.train(nb, xb);
index.add(nb, xb);
{ // sanity check
idx_t* I = new idx_t[k * 5];
float* D = new float[k * 5];
2017-02-23 06:26:44 +08:00
index.search(5, xb, k, D, I);
printf("I=\n");
for (int i = 0; i < 5; i++) {
for (int j = 0; j < k; j++)
2020-06-28 19:00:44 +08:00
printf("%5zd ", I[i * k + j]);
2017-02-23 06:26:44 +08:00
printf("\n");
}
printf("D=\n");
for (int i = 0; i < 5; i++) {
for (int j = 0; j < k; j++)
2017-02-23 06:26:44 +08:00
printf("%7g ", D[i * k + j]);
printf("\n");
}
delete[] I;
delete[] D;
2017-02-23 06:26:44 +08:00
}
{ // search xq
idx_t* I = new idx_t[k * nq];
float* D = new float[k * nq];
2017-02-23 06:26:44 +08:00
index.nprobe = 10;
index.search(nq, xq, k, D, I);
printf("I=\n");
for (int i = nq - 5; i < nq; i++) {
for (int j = 0; j < k; j++)
2020-06-28 19:00:44 +08:00
printf("%5zd ", I[i * k + j]);
2017-02-23 06:26:44 +08:00
printf("\n");
}
delete[] I;
delete[] D;
2017-02-23 06:26:44 +08:00
}
delete[] xb;
delete[] xq;
2017-02-23 06:26:44 +08:00
return 0;
}