136 lines
4.1 KiB
C++
136 lines
4.1 KiB
C++
/**
|
|
* Copyright (c) Facebook, Inc. and its affiliates.
|
|
*
|
|
* This source code is licensed under the MIT license found in the
|
|
* LICENSE file in the root directory of this source tree.
|
|
*/
|
|
|
|
|
|
#pragma once
|
|
|
|
#include "../Index.h"
|
|
#include "utils/MemorySpace.h"
|
|
|
|
namespace faiss { namespace gpu {
|
|
|
|
class GpuResources;
|
|
|
|
struct GpuIndexConfig {
|
|
inline GpuIndexConfig()
|
|
: device(0),
|
|
memorySpace(MemorySpace::Device) {
|
|
}
|
|
|
|
/// GPU device on which the index is resident
|
|
int device;
|
|
|
|
/// What memory space to use for primary storage.
|
|
/// On Pascal and above (CC 6+) architectures, allows GPUs to use
|
|
/// more memory than is available on the GPU.
|
|
MemorySpace memorySpace;
|
|
};
|
|
|
|
class GpuIndex : public faiss::Index {
|
|
public:
|
|
GpuIndex(GpuResources* resources,
|
|
int dims,
|
|
faiss::MetricType metric,
|
|
GpuIndexConfig config);
|
|
|
|
inline int getDevice() const {
|
|
return device_;
|
|
}
|
|
|
|
inline GpuResources* getResources() {
|
|
return resources_;
|
|
}
|
|
|
|
/// Set the minimum data size for searches (in MiB) for which we use
|
|
/// CPU -> GPU paging
|
|
void setMinPagingSize(size_t size);
|
|
|
|
/// Returns the current minimum data size for paged searches
|
|
size_t getMinPagingSize() const;
|
|
|
|
/// `x` can be resident on the CPU or any GPU; copies are performed
|
|
/// as needed
|
|
/// Handles paged adds if the add set is too large; calls addInternal_
|
|
void add(faiss::Index::idx_t, const float* x) override;
|
|
|
|
/// `x` and `ids` can be resident on the CPU or any GPU; copies are
|
|
/// performed as needed
|
|
/// Handles paged adds if the add set is too large; calls addInternal_
|
|
void add_with_ids(Index::idx_t n,
|
|
const float* x,
|
|
const Index::idx_t* ids) override;
|
|
|
|
/// `x`, `distances` and `labels` can be resident on the CPU or any
|
|
/// GPU; copies are performed as needed
|
|
void search(Index::idx_t n,
|
|
const float* x,
|
|
Index::idx_t k,
|
|
float* distances,
|
|
Index::idx_t* labels) const override;
|
|
|
|
protected:
|
|
/// Does addImpl_ require IDs? If so, and no IDs are provided, we will
|
|
/// generate them sequentially based on the order in which the IDs are added
|
|
virtual bool addImplRequiresIDs_() const = 0;
|
|
|
|
/// Overridden to actually perform the add
|
|
/// All data is guaranteed to be resident on our device
|
|
virtual void addImpl_(int n,
|
|
const float* x,
|
|
const Index::idx_t* ids) = 0;
|
|
|
|
/// Overridden to actually perform the search
|
|
/// All data is guaranteed to be resident on our device
|
|
virtual void searchImpl_(int n,
|
|
const float* x,
|
|
int k,
|
|
float* distances,
|
|
Index::idx_t* labels) const = 0;
|
|
|
|
private:
|
|
/// Handles paged adds if the add set is too large, passes to
|
|
/// addImpl_ to actually perform the add for the current page
|
|
void addPaged_(int n,
|
|
const float* x,
|
|
const Index::idx_t* ids);
|
|
|
|
/// Calls addImpl_ for a single page of GPU-resident data
|
|
void addPage_(int n,
|
|
const float* x,
|
|
const Index::idx_t* ids);
|
|
|
|
/// Calls searchImpl_ for a single page of GPU-resident data
|
|
void searchNonPaged_(int n,
|
|
const float* x,
|
|
int k,
|
|
float* outDistancesData,
|
|
Index::idx_t* outIndicesData) const;
|
|
|
|
/// Calls searchImpl_ for a single page of GPU-resident data,
|
|
/// handling paging of the data and copies from the CPU
|
|
void searchFromCpuPaged_(int n,
|
|
const float* x,
|
|
int k,
|
|
float* outDistancesData,
|
|
Index::idx_t* outIndicesData) const;
|
|
|
|
protected:
|
|
/// Manages streams, cuBLAS handles and scratch memory for devices
|
|
GpuResources* resources_;
|
|
|
|
/// The GPU device we are resident on
|
|
const int device_;
|
|
|
|
/// The memory space of our primary storage on the GPU
|
|
const MemorySpace memorySpace_;
|
|
|
|
/// Size above which we page copies from the CPU to GPU
|
|
size_t minPagedSize_;
|
|
};
|
|
|
|
} } // namespace
|