faiss/gpu/GpuIndex.h

137 lines
4.1 KiB
C++

/**
* Copyright (c) 2015-present, Facebook, Inc.
* All rights reserved.
*
* This source code is licensed under the BSD+Patents license found in the
* LICENSE file in the root directory of this source tree.
*/
#pragma once
#include "../Index.h"
#include "utils/MemorySpace.h"
namespace faiss { namespace gpu {
class GpuResources;
struct GpuIndexConfig {
inline GpuIndexConfig()
: device(0),
memorySpace(MemorySpace::Device) {
}
/// GPU device on which the index is resident
int device;
/// What memory space to use for primary storage.
/// On Pascal and above (CC 6+) architectures, allows GPUs to use
/// more memory than is available on the GPU.
MemorySpace memorySpace;
};
class GpuIndex : public faiss::Index {
public:
GpuIndex(GpuResources* resources,
int dims,
faiss::MetricType metric,
GpuIndexConfig config);
inline int getDevice() const {
return device_;
}
inline GpuResources* getResources() {
return resources_;
}
/// Set the minimum data size for searches (in MiB) for which we use
/// CPU -> GPU paging
void setMinPagingSize(size_t size);
/// Returns the current minimum data size for paged searches
size_t getMinPagingSize() const;
/// `x` can be resident on the CPU or any GPU; copies are performed
/// as needed
/// Handles paged adds if the add set is too large; calls addInternal_
void add(faiss::Index::idx_t, const float* x) override;
/// `x` and `ids` can be resident on the CPU or any GPU; copies are
/// performed as needed
/// Handles paged adds if the add set is too large; calls addInternal_
void add_with_ids(Index::idx_t n,
const float* x,
const Index::idx_t* ids) override;
/// `x`, `distances` and `labels` can be resident on the CPU or any
/// GPU; copies are performed as needed
void search(Index::idx_t n,
const float* x,
Index::idx_t k,
float* distances,
Index::idx_t* labels) const override;
protected:
/// Does addImpl_ require IDs? If so, and no IDs are provided, we will
/// generate them sequentially based on the order in which the IDs are added
virtual bool addImplRequiresIDs_() const = 0;
/// Overridden to actually perform the add
/// All data is guaranteed to be resident on our device
virtual void addImpl_(int n,
const float* x,
const Index::idx_t* ids) = 0;
/// Overridden to actually perform the search
/// All data is guaranteed to be resident on our device
virtual void searchImpl_(int n,
const float* x,
int k,
float* distances,
Index::idx_t* labels) const = 0;
private:
/// Handles paged adds if the add set is too large, passes to
/// addImpl_ to actually perform the add for the current page
void addPaged_(int n,
const float* x,
const Index::idx_t* ids);
/// Calls addImpl_ for a single page of GPU-resident data
void addPage_(int n,
const float* x,
const Index::idx_t* ids);
/// Calls searchImpl_ for a single page of GPU-resident data
void searchNonPaged_(int n,
const float* x,
int k,
float* outDistancesData,
Index::idx_t* outIndicesData) const;
/// Calls searchImpl_ for a single page of GPU-resident data,
/// handling paging of the data and copies from the CPU
void searchFromCpuPaged_(int n,
const float* x,
int k,
float* outDistancesData,
Index::idx_t* outIndicesData) const;
protected:
/// Manages streams, cuBLAS handles and scratch memory for devices
GpuResources* resources_;
/// The GPU device we are resident on
const int device_;
/// The memory space of our primary storage on the GPU
const MemorySpace memorySpace_;
/// Size above which we page copies from the CPU to GPU
size_t minPagedSize_;
};
} } // namespace