Faiss
 All Classes Namespaces Functions Variables Typedefs Enumerations Enumerator Friends
GpuIndexIVFFlat.cu
1 /**
2  * Copyright (c) Facebook, Inc. and its affiliates.
3  *
4  * This source code is licensed under the MIT license found in the
5  * LICENSE file in the root directory of this source tree.
6  */
7 
8 
9 #include "GpuIndexIVFFlat.h"
10 #include "../IndexFlat.h"
11 #include "../IndexIVFFlat.h"
12 #include "GpuIndexFlat.h"
13 #include "GpuResources.h"
14 #include "impl/IVFFlat.cuh"
15 #include "utils/CopyUtils.cuh"
16 #include "utils/DeviceUtils.h"
17 #include "utils/Float16.cuh"
18 
19 #include <limits>
20 
21 namespace faiss { namespace gpu {
22 
// Construct a GPU IVF-flat index by copying the coarse quantizer,
// trained state and inverted lists from an existing CPU IndexIVFFlat.
// NOTE(review): the signature line was missing from the extracted text;
// reconstructed from the class declaration (see GpuIndexIVFFlat.h).
GpuIndexIVFFlat::GpuIndexIVFFlat(GpuResources* resources,
                                 const faiss::IndexIVFFlat* index,
                                 GpuIndexIVFFlatConfig config) :
    GpuIndexIVF(resources,
                index->d,
                index->metric_type,
                index->nlist,
                config),
    ivfFlatConfig_(config),
    reserveMemoryVecs_(0),
    index_(nullptr) {
#ifndef FAISS_USE_FLOAT16
  // float16 IVF storage requires a toolkit built with FAISS_USE_FLOAT16
  FAISS_THROW_IF_NOT_MSG(!ivfFlatConfig_.useFloat16IVFStorage,
                         "float16 unsupported; need CUDA SDK >= 7.5");
#endif

  // Pull quantizer + inverted lists across from the CPU index
  copyFrom(index);
}
41 
// Construct an empty, untrained GPU IVF-flat index with the given
// dimensionality, number of inverted lists and metric.
// NOTE(review): the signature line was missing from the extracted text;
// reconstructed from the class declaration (see GpuIndexIVFFlat.h).
GpuIndexIVFFlat::GpuIndexIVFFlat(GpuResources* resources,
                                 int dims,
                                 int nlist,
                                 faiss::MetricType metric,
                                 GpuIndexIVFFlatConfig config) :
    GpuIndexIVF(resources, dims, metric, nlist, config),
    ivfFlatConfig_(config),
    reserveMemoryVecs_(0),
    index_(nullptr) {
  // faiss::Index params
  this->is_trained = false;

#ifndef FAISS_USE_FLOAT16
  // float16 IVF storage requires a toolkit built with FAISS_USE_FLOAT16
  FAISS_THROW_IF_NOT_MSG(!ivfFlatConfig_.useFloat16IVFStorage,
                         "float16 unsupported; need CUDA SDK >= 7.5");
#endif

  // We haven't trained ourselves, so don't construct the IVFFlat
  // index yet
}
63 
GpuIndexIVFFlat::~GpuIndexIVFFlat() {
  // index_ is nullptr until training/copyFrom constructs it;
  // delete on nullptr is a no-op, so no guard is needed.
  delete index_;
}
67 
// Reserve GPU memory in the inverted lists for this many vectors, to
// avoid repeated reallocation during add. Recorded so the reservation
// is also applied if the IVFFlat index is constructed later (in train).
// NOTE(review): the signature line was missing from the extracted text;
// reconstructed from the class declaration (reserveMemory(size_t numVecs)).
void
GpuIndexIVFFlat::reserveMemory(size_t numVecs) {
  reserveMemoryVecs_ = numVecs;
  if (index_) {
    index_->reserveMemory(numVecs);
  }
}
75 
76 void
78  DeviceScope scope(device_);
79 
80  GpuIndexIVF::copyFrom(index);
81 
82  // Clear out our old data
83  delete index_;
84  index_ = nullptr;
85 
86  // The other index might not be trained
87  if (!index->is_trained) {
88  return;
89  }
90 
91  // Otherwise, we can populate ourselves from the other index
92  this->is_trained = true;
93 
94  // Copy our lists as well
95  index_ = new IVFFlat(resources_,
97  index->metric_type == faiss::METRIC_L2,
98  ivfFlatConfig_.useFloat16IVFStorage,
99  ivfFlatConfig_.indicesOptions,
100  memorySpace_);
101  InvertedLists *ivf = index->invlists;
102 
103  for (size_t i = 0; i < ivf->nlist; ++i) {
104  auto numVecs = ivf->list_size(i);
105 
106  // GPU index can only support max int entries per list
107  FAISS_THROW_IF_NOT_FMT(numVecs <=
108  (size_t) std::numeric_limits<int>::max(),
109  "GPU inverted list can only support "
110  "%zu entries; %zu found",
111  (size_t) std::numeric_limits<int>::max(),
112  numVecs);
113 
114  index_->addCodeVectorsFromCpu(
115  i, (const float*)(ivf->get_codes(i)),
116  ivf->get_ids(i), numVecs);
117  }
118 }
119 
120 void
122  DeviceScope scope(device_);
123 
124  // We must have the indices in order to copy to ourselves
125  FAISS_THROW_IF_NOT_MSG(ivfFlatConfig_.indicesOptions != INDICES_IVF,
126  "Cannot copy to CPU as GPU index doesn't retain "
127  "indices (INDICES_IVF)");
128 
129  GpuIndexIVF::copyTo(index);
130  index->code_size = this->d * sizeof(float);
131 
133  nlist_, index->code_size);
134 
135  index->replace_invlists(ivf, true);
136 
137  // Copy the inverted lists
138  if (index_) {
139  for (int i = 0; i < nlist_; ++i) {
140  ivf->add_entries (
141  i, index_->getListIndices(i).size(),
142  index_->getListIndices(i).data(),
143  (const uint8_t*)index_->getListVectors(i).data());
144  }
145  }
146 }
147 
148 size_t
150  if (index_) {
151  DeviceScope scope(device_);
152 
153  return index_->reclaimMemory();
154  }
155 
156  return 0;
157 }
158 
159 void
161  if (index_) {
162  DeviceScope scope(device_);
163 
164  index_->reset();
165  this->ntotal = 0;
166  } else {
167  FAISS_ASSERT(this->ntotal == 0);
168  }
169 }
170 
171 void
173  DeviceScope scope(device_);
174 
175  if (this->is_trained) {
176  FAISS_ASSERT(quantizer_->is_trained);
177  FAISS_ASSERT(quantizer_->ntotal == nlist_);
178  FAISS_ASSERT(index_);
179  return;
180  }
181 
182  FAISS_ASSERT(!index_);
183 
184  trainQuantizer_(n, x);
185 
186  // The quantizer is now trained; construct the IVF index
187  index_ = new IVFFlat(resources_,
189  this->metric_type == faiss::METRIC_L2,
190  ivfFlatConfig_.useFloat16IVFStorage,
191  ivfFlatConfig_.indicesOptions,
192  memorySpace_);
193 
194  if (reserveMemoryVecs_) {
195  index_->reserveMemory(reserveMemoryVecs_);
196  }
197 
198  this->is_trained = true;
199 }
200 
201 void
203  const float* x,
204  const Index::idx_t* xids) {
205  // Device is already set in GpuIndex::add
206  FAISS_ASSERT(index_);
207  FAISS_ASSERT(n > 0);
208 
209  // Data is already resident on the GPU
210  Tensor<float, 2, true> data(const_cast<float*>(x), {n, (int) this->d});
211 
212  static_assert(sizeof(long) == sizeof(Index::idx_t), "size mismatch");
213  Tensor<long, 1, true> labels(const_cast<long*>(xids), {n});
214 
215  // Not all vectors may be able to be added (some may contain NaNs etc)
216  index_->classifyAndAddVectors(data, labels);
217 
218  // but keep the ntotal based on the total number of vectors that we attempted
219  // to add
220  ntotal += n;
221 }
222 
223 void
225  const float* x,
226  int k,
227  float* distances,
228  Index::idx_t* labels) const {
229  // Device is already set in GpuIndex::search
230  FAISS_ASSERT(index_);
231  FAISS_ASSERT(n > 0);
232 
233  // Data is already resident on the GPU
234  Tensor<float, 2, true> queries(const_cast<float*>(x), {n, (int) this->d});
235  Tensor<float, 2, true> outDistances(distances, {n, k});
236 
237  static_assert(sizeof(long) == sizeof(Index::idx_t), "size mismatch");
238  Tensor<long, 2, true> outLabels(const_cast<long*>(labels), {n, k});
239 
240  index_->query(queries, nprobe_, k, outDistances, outLabels);
241 }
242 
243 
244 } } // namespace
GpuIndexIVFFlat(GpuResources *resources, const faiss::IndexIVFFlat *index, GpuIndexIVFFlatConfig config=GpuIndexIVFFlatConfig())
simple (default) implementation as an array of inverted lists
FlatIndex * getGpuData()
For internal access.
Definition: GpuIndexFlat.h:99
void addImpl_(int n, const float *x, const Index::idx_t *ids) override
Called from GpuIndex for add/add_with_ids.
virtual size_t list_size(size_t list_no) const =0
get the size of a list
void copyFrom(const faiss::IndexIVFFlat *index)
void reserveMemory(size_t numVecs)
Reserve GPU memory in our inverted lists for this number of vectors.
Definition: IVFBase.cu:43
void train(Index::idx_t n, const float *x) override
int d
vector dimension
Definition: Index.h:66
long idx_t
all indices are this type
Definition: Index.h:62
int classifyAndAddVectors(Tensor< float, 2, true > &vecs, Tensor< long, 1, true > &indices)
Definition: IVFFlat.cu:127
void copyTo(faiss::IndexIVFFlat *index) const
int nprobe_
Number of inverted list probes per query.
Definition: GpuIndexIVF.h:84
void reserveMemory(size_t numVecs)
Reserve GPU memory in our inverted lists for this number of vectors.
const int device_
The GPU device we are resident on.
Definition: GpuIndex.h:126
GpuResources * resources_
Manages streams, cuBLAS handles and scratch memory for devices.
Definition: GpuIndex.h:123
void copyTo(faiss::IndexIVF *index) const
Copy what we have to the CPU equivalent.
Definition: GpuIndexIVF.cu:153
void replace_invlists(InvertedLists *il, bool own=false)
replace the inverted lists, old one is deallocated if own_invlists
Definition: IndexIVF.cpp:735
int nlist_
Number of inverted lists that we manage.
Definition: GpuIndexIVF.h:81
idx_t ntotal
total nb of indexed vectors
Definition: Index.h:67
Our tensor type.
Definition: Tensor.cuh:28
void addCodeVectorsFromCpu(int listId, const float *vecs, const long *indices, size_t numVecs)
Definition: IVFFlat.cu:52
const MemorySpace memorySpace_
The memory space of our primary storage on the GPU.
Definition: GpuIndex.h:129
GpuIndexFlat * quantizer_
Quantizer for inverted lists.
Definition: GpuIndexIVF.h:87
void query(Tensor< float, 2, true > &queries, int nprobe, int k, Tensor< float, 2, true > &outDistances, Tensor< long, 2, true > &outIndices)
Definition: IVFFlat.cu:285
std::vector< float > getListVectors(int listId) const
Return the vectors of a particular list back to the CPU.
Definition: IVFFlat.cu:351
MetricType metric_type
type of metric this index uses for search
Definition: Index.h:74
void searchImpl_(int n, const float *x, int k, float *distances, Index::idx_t *labels) const override
Called from GpuIndex for search.
InvertedLists * invlists
Access to the actual data.
Definition: IndexIVF.h:92
std::vector< long > getListIndices(int listId) const
Return the list indices of a particular list back to the CPU.
Definition: IVFBase.cu:205
void copyFrom(const faiss::IndexIVF *index)
Copy what we need from the CPU equivalent.
Definition: GpuIndexIVF.cu:79
bool is_trained
set if the Index does not require training, or if training is done already
Definition: Index.h:71
IndicesOptions indicesOptions
Index storage options for the GPU.
Definition: GpuIndexIVF.h:29
size_t reclaimMemory()
Definition: IVFBase.cu:103
void reset() override
removes all elements from the database.
size_t code_size
code size per vector in bytes
Definition: IndexIVF.h:95
MetricType
Some algorithms support both an inner product version and a L2 search version.
Definition: Index.h:44