11 #include "../test/TestUtils.h"
12 #include "../../utils.h"
14 #include <gtest/gtest.h>
18 #include <unordered_map>
20 namespace faiss {
namespace gpu {
22 inline float relativeError(
float a,
float b) {
23 return std::abs(a - b) / (0.5f * (std::abs(a) + std::abs(b)));
32 clock_gettime(CLOCK_REALTIME, &t);
34 setTestSeed(t.tv_nsec);
37 void setTestSeed(
long seed) {
38 printf(
"testing with random seed %ld\n", seed);
44 int randVal(
int a,
int b) {
48 return a + (lrand48() % (b + 1 - a));
52 return randSelect<bool>({
true,
false});
55 std::vector<float> randVecs(
size_t num,
size_t dim) {
56 std::vector<float> v(num * dim);
57 static bool first =
true;
59 faiss::float_rand(v.data(), v.size(), s_seed);
69 int numQuery,
int dim,
int k,
70 const std::string& configMsg,
71 float maxRelativeError,
74 auto queries = faiss::gpu::randVecs(numQuery, dim);
77 std::vector<float> refDistance(numQuery * k, 0);
78 std::vector<faiss::Index::idx_t> refIndices(numQuery * k, -1);
79 refIndex.
search(numQuery, queries.data(),
80 k, refDistance.data(), refIndices.data());
82 std::vector<float> testDistance(numQuery * k, 0);
83 std::vector<faiss::Index::idx_t> testIndices(numQuery * k, -1);
84 testIndex.
search(numQuery, queries.data(),
85 k, testDistance.data(), testIndices.data());
87 faiss::gpu::compareLists(refDistance.data(),
94 maxRelativeError, pctMaxDiff1, pctMaxDiffN);
98 inline T lookup(
const T* p,
int i,
int j,
int dim1,
int dim2) {
99 return p[i * dim2 + j];
102 void compareLists(
const float* refDist,
104 const float* testDist,
107 const std::string& configMsg,
108 bool printBasicStats,
bool printDiffs,
bool assertOnErr,
109 float maxRelativeError,
113 float maxAbsErr = 0.0f;
114 for (
int i = 0; i < dim1 * dim2; ++i) {
115 maxAbsErr = std::max(maxAbsErr, std::abs(refDist[i] - testDist[i]));
117 int numResults = dim1 * dim2;
120 std::vector<std::unordered_map<faiss::Index::idx_t, int>> refIndexMap;
122 for (
int query = 0; query < dim1; ++query) {
123 std::unordered_map<faiss::Index::idx_t, int> indices;
125 for (
int result = 0; result < dim2; ++result) {
126 indices[lookup(refInd, query, result, dim1, dim2)] = result;
129 refIndexMap.emplace_back(std::move(indices));
134 std::vector<std::vector<int>> indexDiffs;
139 int nonUniqueIndices = 0;
141 double avgDiff = 0.0;
143 float maxRelErr = 0.0f;
145 for (
int query = 0; query < dim1; ++query) {
146 std::vector<int> diffs;
147 std::set<faiss::Index::idx_t> uniqueIndices;
149 auto& indices = refIndexMap[query];
151 for (
int result = 0; result < dim2; ++result) {
152 auto t = lookup(testInd, query, result, dim1, dim2);
156 bool uniqueIndex = uniqueIndices.count(t) == 0;
158 EXPECT_TRUE(uniqueIndex) << configMsg
167 uniqueIndices.insert(t);
170 auto it = indices.find(t);
171 if (it != indices.end()) {
172 int diff = std::abs(result - it->second);
173 diffs.push_back(diff);
177 maxDiff = std::max(diff, maxDiff);
178 }
else if (diff > 1) {
180 maxDiff = std::max(diff, maxDiff);
183 avgDiff += (double) diff;
190 auto refD = lookup(refDist, query, result, dim1, dim2);
191 auto testD = lookup(testDist, query, result, dim1, dim2);
193 float relErr = relativeError(refD, testD);
196 EXPECT_LE(relErr, maxRelativeError) << configMsg
197 <<
" (" << query <<
", " << result
198 <<
") refD: " << refD
199 <<
" testD: " << testD;
202 maxRelErr = std::max(maxRelErr, relErr);
205 indexDiffs.emplace_back(std::move(diffs));
209 EXPECT_LE((
float) (diff1 + diffN + diffInf),
210 (
float) numResults * pctMaxDiff1) << configMsg;
214 EXPECT_LE((
float) diffN, (
float) numResults * pctMaxDiffN) << configMsg;
217 avgDiff /= (double) numResults;
219 if (printBasicStats) {
220 if (!configMsg.empty()) {
222 "----------------------------\n"
227 printf(
"Result error and differences\n"
228 "----------------------------\n"
229 "max abs diff %.7f rel diff %.7f\n"
230 "idx diff avg: %.5g max: %d\n"
231 "idx diff of 1: %d (%.3f%% of queries)\n"
232 "idx diff of >1: %d (%.3f%% of queries)\n"
233 "idx diff not found: %d (%.3f%% of queries)"
234 " [typically a last element inversion]\n"
235 "non-unique indices: %d (a serious error if >0)\n",
236 maxAbsErr, maxRelErr,
238 diff1, 100.0f * (
float) diff1 / (
float) numResults,
239 diffN, 100.0f * (
float) diffN / (
float) numResults,
240 diffInf, 100.0f * (
float) diffInf / (
float) numResults,
245 printf(
"differences:\n");
246 printf(
"==================\n");
247 for (
int query = 0; query < dim1; ++query) {
248 for (
int result = 0; result < dim2; ++result) {
249 long refI = lookup(refInd, query, result, dim1, dim2);
250 long testI = lookup(testInd, query, result, dim1, dim2);
253 float refD = lookup(refDist, query, result, dim1, dim2);
254 float testD = lookup(testDist, query, result, dim1, dim2);
256 float maxDist = std::max(refD, testD);
257 float delta = std::abs(refD - testD);
259 float relErr = delta / maxDist;
262 printf(
"(%d, %d [%d]) (ref %ld tst %ld dist ==)\n",
264 indexDiffs[query][result],
267 printf(
"(%d, %d [%d]) (ref %ld tst %ld abs %.8f "
268 "rel %.8f ref %a tst %a)\n",
270 indexDiffs[query][result],
271 refI, testI, delta, relErr, refD, testD);
long idx_t
all indices are this type
virtual void search(idx_t n, const float *x, idx_t k, float *distances, idx_t *labels) const =0