#include "GpuIndexIVFFlat.h"
#include "../IndexFlat.h"
#include "../IndexIVF.h"
#include "GpuIndexFlat.h"
#include "GpuResources.h"
#include "impl/IVFFlat.cuh"
#include "utils/CopyUtils.cuh"
#include "utils/DeviceUtils.h"
#include "utils/Float16.cuh"
namespace faiss { namespace gpu {
GpuIndexIVFFlat::GpuIndexIVFFlat(GpuResources* resources, int device,
                                 bool useFloat16CoarseQuantizer,
                                 bool useFloat16IVFStorage,
                                 int dims, int nlist,
                                 IndicesOptions indicesOptions,
                                 faiss::MetricType metric) :
    GpuIndexIVF(resources, device, indicesOptions,
                useFloat16CoarseQuantizer, dims, metric, nlist),
    useFloat16IVFStorage_(useFloat16IVFStorage),
    reserveMemoryVecs_(0),
    index_(nullptr) {
#ifndef FAISS_USE_FLOAT16
  // Half-precision IVF storage needs the CUDA half type
  FAISS_ASSERT(!useFloat16IVFStorage_,
               "float16 unsupported; need CUDA SDK >= 7.5");
#endif
}
GpuIndexIVFFlat::GpuIndexIVFFlat(GpuResources* resources, int device,
                                 GpuIndexFlat* quantizer,
                                 bool useFloat16IVFStorage,
                                 int dims, int nlist,
                                 IndicesOptions indicesOptions,
                                 faiss::MetricType metric) :
    GpuIndexIVF(resources, device, indicesOptions, dims,
                metric, nlist, quantizer),
    useFloat16IVFStorage_(useFloat16IVFStorage),
    reserveMemoryVecs_(0),
    index_(nullptr) {
#ifndef FAISS_USE_FLOAT16
  FAISS_ASSERT(!useFloat16IVFStorage_,
               "float16 unsupported; need CUDA SDK >= 7.5");
#endif
  // If the provided quantizer is already trained, build the GPU
  // inverted-list storage now
  if (this->is_trained) {
    index_ = new IVFFlat(resources_, quantizer_->getGpuData(),
                         metric == faiss::METRIC_L2,
                         useFloat16IVFStorage_, indicesOptions_);
  }
}
GpuIndexIVFFlat::~GpuIndexIVFFlat() {
  delete index_;
}
void
GpuIndexIVFFlat::reserveMemory(size_t numVecs) {
  // Remember the request; apply it to the IVF storage once it exists
  reserveMemoryVecs_ = numVecs;
  if (index_) {
    index_->reserveMemory(numVecs);
  }
}
void
GpuIndexIVFFlat::copyFrom(const faiss::IndexIVFFlat* index) {
  // Copy IVF parameters and the coarse quantizer from the CPU index
  GpuIndexIVF::copyFrom(index);

  // Rebuild the GPU inverted-list storage
  delete index_;
  index_ = new IVFFlat(resources_, quantizer_->getGpuData(),
                       index->metric_type == faiss::METRIC_L2,
                       useFloat16IVFStorage_, indicesOptions_);

  // Copy each CPU inverted list to the GPU
  FAISS_ASSERT(index->vecs.size() == index->ids.size());
  for (size_t i = 0; i < index->vecs.size(); ++i) {
    auto& vecs = index->vecs[i];
    auto& ids = index->ids[i];

    // Each list stores flat floats and must hold a whole number of
    // d-dimensional vectors
    FAISS_ASSERT(vecs.size() % this->d == 0);
    auto numVecs = vecs.size() / this->d;
    FAISS_ASSERT(numVecs == ids.size());

    index_->addCodeVectorsFromCpu(i, vecs.data(), ids.data(), numVecs);
  }
}
void
GpuIndexIVFFlat::copyTo(faiss::IndexIVFFlat* index) const {
  GpuIndexIVF::copyTo(index);

  // Copy each GPU inverted list back to the CPU index
  index->vecs.resize(nlist_);
  if (index_) {
    for (int i = 0; i < nlist_; ++i) {
      index->vecs[i] = index_->getListVectors(i);
      index->ids[i] = index_->getListIndices(i);
    }
  }
}
void
GpuIndexIVFFlat::reset() {
  if (index_) {
    index_->reset();
    this->ntotal = 0;
  } else {
    FAISS_ASSERT(this->ntotal == 0);
  }
}
void
GpuIndexIVFFlat::train(Index::idx_t n, const float* x) {
  if (this->is_trained) {
    FAISS_ASSERT(index_);
    return;
  }

  FAISS_ASSERT(!index_);

  // Train the coarse quantizer, then construct the IVF storage
  trainQuantizer_(n, x);
  index_ = new IVFFlat(resources_, quantizer_->getGpuData(),
                       this->metric_type == faiss::METRIC_L2,
                       useFloat16IVFStorage_, indicesOptions_);

  if (reserveMemoryVecs_) {
    index_->reserveMemory(reserveMemoryVecs_);
  }

  this->is_trained = true;
}
void
GpuIndexIVFFlat::add_with_ids(Index::idx_t n,
                              const float* x,
                              const Index::idx_t* xids) {
  FAISS_ASSERT(index_);

  auto stream = resources_->getDefaultStreamCurrentDevice();

  // Make sure the vectors to add are resident on our device
  auto deviceVecs = toDevice<float, 2>(resources_,
                                       device_,
                                       const_cast<float*>(x),
                                       stream,
                                       {(int) n, index_->getDim()});

  static_assert(sizeof(long) == sizeof(Index::idx_t), "size mismatch");
  auto deviceIds = toDevice<long, 1>(resources_,
                                     device_,
                                     const_cast<long*>(xids),
                                     stream,
                                     {(int) n});

  // Not every vector may be added (e.g., NaN inputs are skipped)
  this->ntotal += index_->classifyAndAddVectors(deviceVecs, deviceIds);
}
void
GpuIndexIVFFlat::search(faiss::Index::idx_t n, const float* x,
                        faiss::Index::idx_t k, float* distances,
                        faiss::Index::idx_t* labels) const {
  FAISS_ASSERT(index_);

  auto stream = resources_->getDefaultStream(device_);

  // Move the queries and output buffers to our device if needed
  auto devX = toDevice<float, 2>(
      resources_, device_, const_cast<float*>(x), stream, {(int) n, this->d});
  auto devDistances = toDevice<float, 2>(
      resources_, device_, distances, stream, {(int) n, (int) k});
  auto devLabels = toDevice<faiss::Index::idx_t, 2>(
      resources_, device_, labels, stream, {(int) n, (int) k});

  index_->query(devX, nprobe_, k, devDistances, devLabels);

  // Copy the results back to the host if the outputs were host pointers
  fromDevice<float, 2>(devDistances, distances, stream);
  fromDevice<faiss::Index::idx_t, 2>(devLabels, labels, stream);
}
void
GpuIndexIVFFlat::set_typename() {
  this->index_typename = "GpuIndexIVFFlat";
}

} } // namespace faiss::gpu
Members referenced in this file:

int getDim() const
    Return the number of dimensions we are indexing.
FlatIndex* getGpuData()
    For internal access.
void copyFrom(const faiss::IndexIVFFlat* index)
void reserveMemory(size_t numVecs)
    Reserve GPU memory in our inverted lists for this number of vectors.
void train(Index::idx_t n, const float* x) override
int device_
    The GPU device we are resident on.
std::vector<std::vector<long>> ids
    Inverted lists for indexes.
int classifyAndAddVectors(Tensor<float, 2, true>& vecs, Tensor<long, 1, true>& indices)
void copyTo(faiss::IndexIVFFlat* index) const
int nprobe_
    Number of inverted list probes per query.
const IndicesOptions indicesOptions_
    How should indices be stored on the GPU?
GpuResources* resources_
    Manages streams, cuBLAS handles and scratch memory for devices.
void copyTo(faiss::IndexIVF* index) const
    Copy what we have to the CPU equivalent.
long idx_t
    All indices are this type.
int nlist_
    Number of inverted lists that we manage.
idx_t ntotal
    Total number of indexed vectors.
void add_with_ids(Index::idx_t n, const float* x, const Index::idx_t* xids) override
void addCodeVectorsFromCpu(int listId, const float* vecs, const long* indices, size_t numVecs)
GpuIndexFlat* quantizer_
    Quantizer for inverted lists.
void query(Tensor<float, 2, true>& queries, int nprobe, int k, Tensor<float, 2, true>& outDistances, Tensor<long, 2, true>& outIndices)
std::vector<float> getListVectors(int listId) const
    Return the vectors of a particular list back to the CPU.
MetricType metric_type
    Type of metric this index uses for search.
GpuIndexIVFFlat(GpuResources* resources, int device, bool useFloat16CoarseQuantizer, bool useFloat16IVFStorage, int dims, int nlist, IndicesOptions indicesOptions, faiss::MetricType metric)
std::vector<long> getListIndices(int listId) const
    Return the list indices of a particular list back to the CPU.
void copyFrom(const faiss::IndexIVF* index)
    Copy what we need from the CPU equivalent.
bool is_trained
    Set if the Index does not require training, or if training is done already.
void reset() override
    Removes all elements from the database.
void search(faiss::Index::idx_t n, const float* x, faiss::Index::idx_t k, float* distances, faiss::Index::idx_t* labels) const override
MetricType
    Some algorithms support both an inner product version and an L2 search version.
std::vector<std::vector<float>> vecs
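For orientation, a brief end-to-end usage sketch of the class documented above: construct, train, add with explicit ids, and search. This is a hedged example, not taken from the source: it assumes StandardGpuResources as the GpuResources implementation, and the dimensions, list count, indices option (INDICES_64_BIT), and random data are purely illustrative.

#include <random>
#include <vector>

#include "StandardGpuResources.h"
#include "GpuIndexIVFFlat.h"

int main() {
  int dims = 64;        // vector dimensionality
  int nlist = 256;      // number of inverted lists (coarse centroids)
  int numVecs = 10000;  // database size

  faiss::gpu::StandardGpuResources resources;

  // Constructor documented above: float32 coarse quantizer and IVF
  // storage, 64-bit user indices, L2 metric, GPU 0
  faiss::gpu::GpuIndexIVFFlat index(&resources,
                                    0,      // device
                                    false,  // useFloat16CoarseQuantizer
                                    false,  // useFloat16IVFStorage
                                    dims,
                                    nlist,
                                    faiss::gpu::INDICES_64_BIT,
                                    faiss::METRIC_L2);

  // Random database vectors, also reused as training data
  std::mt19937 rng(123);
  std::uniform_real_distribution<float> dist(0.0f, 1.0f);
  std::vector<float> vecs(size_t(numVecs) * dims);
  for (auto& v : vecs) {
    v = dist(rng);
  }

  // Sequential user ids for the database vectors
  std::vector<faiss::Index::idx_t> ids(numVecs);
  for (int i = 0; i < numVecs; ++i) {
    ids[i] = i;
  }

  index.train(numVecs, vecs.data());                    // trains the coarse quantizer
  index.add_with_ids(numVecs, vecs.data(), ids.data()); // assigns vectors to inverted lists

  // Search for the 4 nearest neighbors of the first 5 database vectors
  int numQueries = 5;
  int k = 4;
  std::vector<float> distances(size_t(numQueries) * k);
  std::vector<faiss::Index::idx_t> labels(size_t(numQueries) * k);
  index.search(numQueries, vecs.data(), k, distances.data(), labels.data());

  return 0;
}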