12 #include "../test/TestUtils.h"
13 #include "../../utils.h"
15 #include <gtest/gtest.h>
19 #include <unordered_map>
21 namespace faiss {
namespace gpu {
23 inline float relativeError(
float a,
float b) {
24 return std::abs(a - b) / (0.5f * (std::abs(a) + std::abs(b)));
33 clock_gettime(CLOCK_REALTIME, &t);
35 setTestSeed(t.tv_nsec);
38 void setTestSeed(
long seed) {
39 printf(
"testing with random seed %ld\n", seed);
45 int randVal(
int a,
int b) {
49 return a + (lrand48() % (b + 1 - a));
53 return randSelect<bool>({
true,
false});
56 std::vector<float> randVecs(
int num,
int dim) {
57 std::vector<float> v(num * dim);
58 static bool first =
true;
60 faiss::float_rand(v.data(), v.size(), s_seed);
70 int numQuery,
int dim,
int k,
71 const std::string& configMsg,
72 float maxRelativeError,
75 auto queries = faiss::gpu::randVecs(numQuery, dim);
78 std::vector<float> refDistance(numQuery * k, 0);
79 std::vector<faiss::Index::idx_t> refIndices(numQuery * k, -1);
80 refIndex.
search(numQuery, queries.data(),
81 k, refDistance.data(), refIndices.data());
83 std::vector<float> testDistance(numQuery * k, 0);
84 std::vector<faiss::Index::idx_t> testIndices(numQuery * k, -1);
85 testIndex.
search(numQuery, queries.data(),
86 k, testDistance.data(), testIndices.data());
88 faiss::gpu::compareLists(refDistance.data(),
95 maxRelativeError, pctMaxDiff1, pctMaxDiffN);
99 inline T lookup(
const T* p,
int i,
int j,
int dim1,
int dim2) {
100 return p[i * dim2 + j];
103 void compareLists(
const float* refDist,
105 const float* testDist,
108 const std::string& configMsg,
109 bool printBasicStats,
bool printDiffs,
bool assertOnErr,
110 float maxRelativeError,
114 float maxAbsErr = 0.0f;
115 for (
int i = 0; i < dim1 * dim2; ++i) {
116 maxAbsErr = std::max(maxAbsErr, std::abs(refDist[i] - testDist[i]));
118 int numResults = dim1 * dim2;
121 std::vector<std::unordered_map<faiss::Index::idx_t, int>> refIndexMap;
123 for (
int query = 0; query < dim1; ++query) {
124 std::unordered_map<faiss::Index::idx_t, int> indices;
126 for (
int result = 0; result < dim2; ++result) {
127 indices[lookup(refInd, query, result, dim1, dim2)] = result;
130 refIndexMap.emplace_back(std::move(indices));
135 std::vector<std::vector<int>> indexDiffs;
140 int nonUniqueIndices = 0;
142 double avgDiff = 0.0;
144 float maxRelErr = 0.0f;
146 for (
int query = 0; query < dim1; ++query) {
147 std::vector<int> diffs;
148 std::set<faiss::Index::idx_t> uniqueIndices;
150 auto& indices = refIndexMap[query];
152 for (
int result = 0; result < dim2; ++result) {
153 auto t = lookup(testInd, query, result, dim1, dim2);
157 bool uniqueIndex = uniqueIndices.count(t) == 0;
159 EXPECT_TRUE(uniqueIndex) << configMsg
168 uniqueIndices.insert(t);
171 auto it = indices.find(t);
172 if (it != indices.end()) {
173 int diff = std::abs(result - it->second);
174 diffs.push_back(diff);
178 maxDiff = std::max(diff, maxDiff);
179 }
else if (diff > 1) {
181 maxDiff = std::max(diff, maxDiff);
184 avgDiff += (double) diff;
191 auto refD = lookup(refDist, query, result, dim1, dim2);
192 auto testD = lookup(testDist, query, result, dim1, dim2);
194 float relErr = relativeError(refD, testD);
197 EXPECT_LE(relErr, maxRelativeError) << configMsg
198 <<
" " << query <<
" " << result;
201 maxRelErr = std::max(maxRelErr, relErr);
204 indexDiffs.emplace_back(std::move(diffs));
208 EXPECT_LE((
float) (diff1 + diffN + diffInf),
209 (
float) numResults * pctMaxDiff1) << configMsg;
213 EXPECT_LE((
float) diffN, (
float) numResults * pctMaxDiffN) << configMsg;
216 avgDiff /= (double) numResults;
218 if (printBasicStats) {
219 if (!configMsg.empty()) {
221 "----------------------------\n"
226 printf(
"Result error and differences\n"
227 "----------------------------\n"
228 "max abs diff %.7f rel diff %.7f\n"
229 "idx diff avg: %.5g max: %d\n"
230 "idx diff of 1: %d (%.3f%% of queries)\n"
231 "idx diff of >1: %d (%.3f%% of queries)\n"
232 "idx diff not found: %d (%.3f%% of queries)"
233 " [typically a last element inversion]\n"
234 "non-unique indices: %d (a serious error if >0)\n",
235 maxAbsErr, maxRelErr,
237 diff1, 100.0f * (
float) diff1 / (
float) numResults,
238 diffN, 100.0f * (
float) diffN / (
float) numResults,
239 diffInf, 100.0f * (
float) diffInf / (
float) numResults,
244 printf(
"differences:\n");
245 printf(
"==================\n");
246 for (
int query = 0; query < dim1; ++query) {
247 for (
int result = 0; result < dim2; ++result) {
248 long refI = lookup(refInd, query, result, dim1, dim2);
249 long testI = lookup(testInd, query, result, dim1, dim2);
252 float refD = lookup(refDist, query, result, dim1, dim2);
253 float testD = lookup(testDist, query, result, dim1, dim2);
255 float maxDist = std::max(refD, testD);
256 float delta = std::abs(refD - testD);
258 float relErr = delta / maxDist;
261 printf(
"(%d, %d [%d]) (ref %ld tst %ld dist ==)\n",
263 indexDiffs[query][result],
266 printf(
"(%d, %d [%d]) (ref %ld tst %ld abs %.8f "
267 "rel %.8f ref %a tst %a)\n",
269 indexDiffs[query][result],
270 refI, testI, delta, relErr, refD, testD);
long idx_t
all indices are this type
virtual void search(idx_t n, const float *x, idx_t k, float *distances, idx_t *labels) const =0