11 #include "../test/TestUtils.h"
12 #include "../../utils.h"
14 #include <gtest/gtest.h>
18 #include <unordered_map>
20 namespace faiss {
namespace gpu {
22 inline float relativeError(
float a,
float b) {
23 return std::abs(a - b) / (0.5f * (std::abs(a) + std::abs(b)));
32 clock_gettime(CLOCK_REALTIME, &t);
34 setTestSeed(t.tv_nsec);
37 void setTestSeed(
long seed) {
38 printf(
"testing with random seed %ld\n", seed);
44 int randVal(
int a,
int b) {
48 return a + (lrand48() % (b + 1 - a));
52 return randSelect<bool>({
true,
false});
55 std::vector<float> randVecs(
size_t num,
size_t dim) {
56 std::vector<float> v(num * dim);
57 static bool first =
true;
59 faiss::float_rand(v.data(), v.size(), s_seed);
67 void compareIndices(
const std::vector<float>& queryVecs,
70 int numQuery,
int dim,
int k,
71 const std::string& configMsg,
72 float maxRelativeError,
76 std::vector<float> refDistance(numQuery * k, 0);
77 std::vector<faiss::Index::idx_t> refIndices(numQuery * k, -1);
78 refIndex.
search(numQuery, queryVecs.data(),
79 k, refDistance.data(), refIndices.data());
81 std::vector<float> testDistance(numQuery * k, 0);
82 std::vector<faiss::Index::idx_t> testIndices(numQuery * k, -1);
83 testIndex.
search(numQuery, queryVecs.data(),
84 k, testDistance.data(), testIndices.data());
86 faiss::gpu::compareLists(refDistance.data(),
93 maxRelativeError, pctMaxDiff1, pctMaxDiffN);
98 int numQuery,
int dim,
int k,
99 const std::string& configMsg,
100 float maxRelativeError,
103 auto queryVecs = faiss::gpu::randVecs(numQuery, dim);
105 compareIndices(queryVecs,
115 template <
typename T>
116 inline T lookup(
const T* p,
int i,
int j,
int ,
int dim2) {
117 return p[i * dim2 + j];
120 void compareLists(
const float* refDist,
122 const float* testDist,
125 const std::string& configMsg,
126 bool printBasicStats,
bool printDiffs,
bool assertOnErr,
127 float maxRelativeError,
131 float maxAbsErr = 0.0f;
132 for (
int i = 0; i < dim1 * dim2; ++i) {
133 maxAbsErr = std::max(maxAbsErr, std::abs(refDist[i] - testDist[i]));
135 int numResults = dim1 * dim2;
138 std::vector<std::unordered_map<faiss::Index::idx_t, int>> refIndexMap;
140 for (
int query = 0; query < dim1; ++query) {
141 std::unordered_map<faiss::Index::idx_t, int> indices;
143 for (
int result = 0; result < dim2; ++result) {
144 indices[lookup(refInd, query, result, dim1, dim2)] = result;
147 refIndexMap.emplace_back(std::move(indices));
152 std::vector<std::vector<int>> indexDiffs;
157 int nonUniqueIndices = 0;
159 double avgDiff = 0.0;
161 float maxRelErr = 0.0f;
163 for (
int query = 0; query < dim1; ++query) {
164 std::vector<int> diffs;
165 std::set<faiss::Index::idx_t> uniqueIndices;
167 auto& indices = refIndexMap[query];
169 for (
int result = 0; result < dim2; ++result) {
170 auto t = lookup(testInd, query, result, dim1, dim2);
174 bool uniqueIndex = uniqueIndices.count(t) == 0;
176 EXPECT_TRUE(uniqueIndex) << configMsg
185 uniqueIndices.insert(t);
188 auto it = indices.find(t);
189 if (it != indices.end()) {
190 int diff = std::abs(result - it->second);
191 diffs.push_back(diff);
195 maxDiff = std::max(diff, maxDiff);
196 }
else if (diff > 1) {
198 maxDiff = std::max(diff, maxDiff);
201 avgDiff += (double) diff;
208 auto refD = lookup(refDist, query, result, dim1, dim2);
209 auto testD = lookup(testDist, query, result, dim1, dim2);
211 float relErr = relativeError(refD, testD);
214 EXPECT_LE(relErr, maxRelativeError) << configMsg
215 <<
" (" << query <<
", " << result
216 <<
") refD: " << refD
217 <<
" testD: " << testD;
220 maxRelErr = std::max(maxRelErr, relErr);
223 indexDiffs.emplace_back(std::move(diffs));
227 EXPECT_LE((
float) (diff1 + diffN + diffInf),
228 (
float) numResults * pctMaxDiff1) << configMsg;
232 EXPECT_LE((
float) diffN, (
float) numResults * pctMaxDiffN) << configMsg;
235 avgDiff /= (double) numResults;
237 if (printBasicStats) {
238 if (!configMsg.empty()) {
240 "----------------------------\n"
245 printf(
"Result error and differences\n"
246 "----------------------------\n"
247 "max abs diff %.7f rel diff %.7f\n"
248 "idx diff avg: %.5g max: %d\n"
249 "idx diff of 1: %d (%.3f%% of queries)\n"
250 "idx diff of >1: %d (%.3f%% of queries)\n"
251 "idx diff not found: %d (%.3f%% of queries)"
252 " [typically a last element inversion]\n"
253 "non-unique indices: %d (a serious error if >0)\n",
254 maxAbsErr, maxRelErr,
256 diff1, 100.0f * (
float) diff1 / (
float) numResults,
257 diffN, 100.0f * (
float) diffN / (
float) numResults,
258 diffInf, 100.0f * (
float) diffInf / (
float) numResults,
263 printf(
"differences:\n");
264 printf(
"==================\n");
265 for (
int query = 0; query < dim1; ++query) {
266 for (
int result = 0; result < dim2; ++result) {
267 long refI = lookup(refInd, query, result, dim1, dim2);
268 long testI = lookup(testInd, query, result, dim1, dim2);
271 float refD = lookup(refDist, query, result, dim1, dim2);
272 float testD = lookup(testDist, query, result, dim1, dim2);
274 float maxDist = std::max(refD, testD);
275 float delta = std::abs(refD - testD);
277 float relErr = delta / maxDist;
280 printf(
"(%d, %d [%d]) (ref %ld tst %ld dist ==)\n",
282 indexDiffs[query][result],
285 printf(
"(%d, %d [%d]) (ref %ld tst %ld abs %.8f "
286 "rel %.8f ref %a tst %a)\n",
288 indexDiffs[query][result],
289 refI, testI, delta, relErr, refD, testD);
long idx_t
all indices are this type
virtual void search(idx_t n, const float *x, idx_t k, float *distances, idx_t *labels) const =0