faiss/gpu/GpuIndex.h

149 lines
4.6 KiB
C
Raw Normal View History

2017-02-23 06:26:44 +08:00
/**
* Copyright (c) Facebook, Inc. and its affiliates.
2017-02-23 06:26:44 +08:00
*
* This source code is licensed under the MIT license found in the
2017-02-23 06:26:44 +08:00
* LICENSE file in the root directory of this source tree.
*/
#pragma once
#include <faiss/Index.h>
#include <faiss/gpu/utils/MemorySpace.h>
2017-02-23 06:26:44 +08:00
namespace faiss { namespace gpu {
class GpuResources;
struct GpuIndexConfig {
inline GpuIndexConfig()
: device(0),
memorySpace(MemorySpace::Device) {
}
/// GPU device on which the index is resident
int device;
/// What memory space to use for primary storage.
/// On Pascal and above (CC 6+) architectures, allows GPUs to use
/// more memory than is available on the GPU.
MemorySpace memorySpace;
};
2017-02-23 06:26:44 +08:00
class GpuIndex : public faiss::Index {
public:
GpuIndex(GpuResources* resources,
int dims,
faiss::MetricType metric,
GpuIndexConfig config);
2017-02-23 06:26:44 +08:00
inline int getDevice() const {
2017-02-23 06:26:44 +08:00
return device_;
}
inline GpuResources* getResources() {
2017-02-23 06:26:44 +08:00
return resources_;
}
/// Set the minimum data size for searches (in MiB) for which we use
/// CPU -> GPU paging
void setMinPagingSize(size_t size);
/// Returns the current minimum data size for paged searches
size_t getMinPagingSize() const;
/// `x` can be resident on the CPU or any GPU; copies are performed
/// as needed
/// Handles paged adds if the add set is too large; calls addInternal_
void add(faiss::Index::idx_t, const float* x) override;
/// `x` and `ids` can be resident on the CPU or any GPU; copies are
/// performed as needed
/// Handles paged adds if the add set is too large; calls addInternal_
void add_with_ids(Index::idx_t n,
const float* x,
const Index::idx_t* ids) override;
/// `x`, `distances` and `labels` can be resident on the CPU or any
/// GPU; copies are performed as needed
void search(Index::idx_t n,
const float* x,
Index::idx_t k,
float* distances,
Index::idx_t* labels) const override;
/// Overridden to force GPU indices to provide their own GPU-friendly
/// implementation
void compute_residual(const float* x,
float* residual,
Index::idx_t key) const override;
/// Overridden to force GPU indices to provide their own GPU-friendly
/// implementation
void compute_residual_n(Index::idx_t n,
const float* xs,
float* residuals,
const Index::idx_t* keys) const override;
protected:
/// Does addImpl_ require IDs? If so, and no IDs are provided, we will
/// generate them sequentially based on the order in which the IDs are added
virtual bool addImplRequiresIDs_() const = 0;
/// Overridden to actually perform the add
/// All data is guaranteed to be resident on our device
virtual void addImpl_(int n,
const float* x,
const Index::idx_t* ids) = 0;
/// Overridden to actually perform the search
/// All data is guaranteed to be resident on our device
virtual void searchImpl_(int n,
const float* x,
int k,
float* distances,
Index::idx_t* labels) const = 0;
private:
/// Handles paged adds if the add set is too large, passes to
/// addImpl_ to actually perform the add for the current page
void addPaged_(int n,
const float* x,
const Index::idx_t* ids);
/// Calls addImpl_ for a single page of GPU-resident data
void addPage_(int n,
const float* x,
const Index::idx_t* ids);
/// Calls searchImpl_ for a single page of GPU-resident data
void searchNonPaged_(int n,
const float* x,
int k,
float* outDistancesData,
Index::idx_t* outIndicesData) const;
/// Calls searchImpl_ for a single page of GPU-resident data,
/// handling paging of the data and copies from the CPU
void searchFromCpuPaged_(int n,
const float* x,
int k,
float* outDistancesData,
Index::idx_t* outIndicesData) const;
2017-02-23 06:26:44 +08:00
protected:
/// Manages streams, cuBLAS handles and scratch memory for devices
2017-02-23 06:26:44 +08:00
GpuResources* resources_;
/// The GPU device we are resident on
const int device_;
/// The memory space of our primary storage on the GPU
const MemorySpace memorySpace_;
/// Size above which we page copies from the CPU to GPU
size_t minPagedSize_;
2017-02-23 06:26:44 +08:00
};
} } // namespace