docs/html/GpuIndexFlat_8h_source.html

 /**

  * Copyright (c) Facebook, Inc. and its affiliates.

  *

  * This source code is licensed under the MIT license found in the

  * LICENSE file in the root directory of this source tree.

  */


 #pragma once


 #include "GpuIndex.h"


 /// Forward declarations of the CPU flat index types. This header only
 /// refers to them through pointer parameters, so their full definitions
 /// are not needed here.
 namespace faiss {


 struct IndexFlat;

 struct IndexFlatL2;

 struct IndexFlatIP;


 }


 namespace faiss { namespace gpu {


 /// Forward declaration of the GPU-side storage type; this header only
 /// uses it through pointers (GpuIndexFlat::data_ and getGpuData()).
 struct FlatIndex;


 /// Options for the GPU flat index, layered on top of GpuIndexConfig.
 /// All three flags are off unless the caller turns them on.
 struct GpuIndexFlatConfig : public GpuIndexConfig {
   /// Default construction leaves every flag at its in-class default (false)
   inline GpuIndexFlatConfig() {}

   /// When set, vector data is stored as float16
   bool useFloat16 = false;

   /// Only meaningful together with useFloat16. When set, all math is
   /// carried out in float16 through cublasHgemm (requires CC 5.3+);
   /// when clear, cublasSgemmEx is used instead.
   bool useFloat16Accumulator = false;

   /// When set, data is kept (transparently) in a transposed layout so the
   /// NN GEMM call can be used, which is ~10% faster. Searching the flat
   /// index gets faster, but add() calls become substantially slower since
   /// all data has to be transposed, and storage grows because both the
   /// transposed and the non-transposed layouts are kept.
   bool storeTransposed = false;
 };


 /// Wrapper around the GPU implementation that looks like

 /// faiss::IndexFlat; copies over centroid data from a given

 /// faiss::IndexFlat
 ///
 /// Derives from GpuIndex and keeps its vectors in a FlatIndex reached
 /// through the raw pointer data_. Only declarations live in this header.
 /// NOTE(review): no copy constructor is declared while the class holds a
 /// raw FlatIndex*; if GpuIndex is copyable, a copy would share data_ —
 /// confirm against the base class and the .cu implementation.

 class GpuIndexFlat : public GpuIndex {

  public:

   /// Construct from a pre-existing faiss::IndexFlat instance, copying

   /// data over to the given GPU
   ///
   /// @param resources GPU resources object handed to the index
   /// @param index     CPU index whose data is copied over
   /// @param config    flat-index options; a default-constructed
   ///                  GpuIndexFlatConfig is used when omitted

   GpuIndexFlat(GpuResources* resources,

                const faiss::IndexFlat* index,

                GpuIndexFlatConfig config = GpuIndexFlatConfig());


   /// Construct an empty instance that can be added to
   ///
   /// @param resources GPU resources object handed to the index
   /// @param dims      presumably the vector dimensionality — TODO confirm
   /// @param metric    metric type the index is created with
   /// @param config    flat-index options; a default-constructed
   ///                  GpuIndexFlatConfig is used when omitted

   GpuIndexFlat(GpuResources* resources,

                int dims,

                faiss::MetricType metric,

                GpuIndexFlatConfig config = GpuIndexFlatConfig());


   /// Overrides the base class destructor.
   /// NOTE(review): presumably releases data_ — confirm in the .cu file
   ~GpuIndexFlat() override;


   /// Initialize ourselves from the given CPU index; will overwrite

   /// all data in ourselves

   void copyFrom(const faiss::IndexFlat* index);


   /// Copy ourselves to the given CPU index; will overwrite all data

   /// in the index instance

   void copyTo(faiss::IndexFlat* index) const;


   /// Returns the number of vectors we contain

   size_t getNumVecs() const;


   /// Clears all vectors from this index

   void reset() override;


   /// This index is not trained, so this does nothing

   void train(Index::idx_t n, const float* x) override;


   /// Overrides to avoid excessive copies
   /// NOTE(review): the first parameter is unnamed here; presumably it is
   /// the number of vectors pointed to by x — confirm against Index::add

   void add(faiss::Index::idx_t, const float* x) override;


   /// Reconstruction methods; prefer the batch reconstruct as it will

   /// be more efficient
   ///
   /// @param key index of the vector to reconstruct
   /// @param out caller-provided output buffer

   void reconstruct(faiss::Index::idx_t key, float* out) const override;


   /// Batch reconstruction method
   ///
   /// @param i0  presumably the first index of the range — TODO confirm
   /// @param num presumably the number of vectors in the range — TODO confirm
   /// @param out caller-provided output buffer

   void reconstruct_n(

       faiss::Index::idx_t i0,

       faiss::Index::idx_t num,

       float* out) const override;


   /// For internal access
   /// Hands out the raw data_ pointer as-is; only callable on a non-const
   /// instance.

   inline FlatIndex* getGpuData() { return data_; }


  protected:

   /// Flat index does not require IDs as there is no storage available for them

   bool addImplRequiresIDs_() const override;


   /// Called from GpuIndex for add

   void addImpl_(int n,

                 const float* x,

                 const Index::idx_t* ids) override;


   /// Called from GpuIndex for search

   void searchImpl_(int n,

                    const float* x,

                    int k,

                    float* distances,

                    faiss::Index::idx_t* labels) const override;


  private:

   /// Checks user settings for consistency

   void verifySettings_() const;


  // Second protected section: the data members below are visible to the
  // derived GpuIndexFlatL2 / GpuIndexFlatIP classes.
  protected:

   /// Our config object
   /// Declared const, so it cannot be modified after construction.

   const GpuIndexFlatConfig config_;


   /// Holds our GPU data containing the list of vectors; is managed via raw

   /// pointer so as to allow non-CUDA compilers to see this header

   FlatIndex* data_;

 };


 /// Wrapper around the GPU implementation that looks like

 /// faiss::IndexFlatL2; copies over centroid data from a given

 /// faiss::IndexFlat
 ///
 /// Thin subclass of GpuIndexFlat; it adds no data members of its own.

 class GpuIndexFlatL2 : public GpuIndexFlat {

  public:

   /// Construct from a pre-existing faiss::IndexFlatL2 instance, copying

   /// data over to the given GPU
   ///
   /// @param resources GPU resources object handed to the index
   /// @param index     CPU L2 index whose data is copied over (taken as a
   ///                  non-const pointer, unlike the GpuIndexFlat constructor)
   /// @param config    flat-index options; a default-constructed
   ///                  GpuIndexFlatConfig is used when omitted

   GpuIndexFlatL2(GpuResources* resources,

                  faiss::IndexFlatL2* index,

                  GpuIndexFlatConfig config = GpuIndexFlatConfig());


   /// Construct an empty instance that can be added to
   /// No metric parameter is taken here, unlike the GpuIndexFlat
   /// constructor; presumably the metric is fixed to L2 — confirm in the
   /// .cu implementation.

   GpuIndexFlatL2(GpuResources* resources,

                  int dims,

                  GpuIndexFlatConfig config = GpuIndexFlatConfig());


   /// Initialize ourselves from the given CPU index; will overwrite

   /// all data in ourselves
   /// This declaration hides GpuIndexFlat::copyFrom(const faiss::IndexFlat*)
   /// for calls made through GpuIndexFlatL2, and takes a non-const pointer.

   void copyFrom(faiss::IndexFlatL2* index);


   /// Copy ourselves to the given CPU index; will overwrite all data

   /// in the index instance
   /// This declaration hides GpuIndexFlat::copyTo(faiss::IndexFlat*) const.
   /// NOTE(review): unlike the base version it is not const-qualified, so it
   /// cannot be called on a const GpuIndexFlatL2.

   void copyTo(faiss::IndexFlatL2* index);

 };


 /// Wrapper around the GPU implementation that looks like

 /// faiss::IndexFlatIP; copies over centroid data from a given

 /// faiss::IndexFlat
 ///
 /// Thin subclass of GpuIndexFlat; it adds no data members of its own.

 class GpuIndexFlatIP : public GpuIndexFlat {

  public:

   /// Construct from a pre-existing faiss::IndexFlatIP instance, copying

   /// data over to the given GPU
   ///
   /// @param resources GPU resources object handed to the index
   /// @param index     CPU inner-product index whose data is copied over
   ///                  (taken as a non-const pointer, unlike the
   ///                  GpuIndexFlat constructor)
   /// @param config    flat-index options; a default-constructed
   ///                  GpuIndexFlatConfig is used when omitted

   GpuIndexFlatIP(GpuResources* resources,

                  faiss::IndexFlatIP* index,

                  GpuIndexFlatConfig config = GpuIndexFlatConfig());


   /// Construct an empty instance that can be added to
   /// No metric parameter is taken here, unlike the GpuIndexFlat
   /// constructor; presumably the metric is fixed to inner product —
   /// confirm in the .cu implementation.

   GpuIndexFlatIP(GpuResources* resources,

                  int dims,

                  GpuIndexFlatConfig config = GpuIndexFlatConfig());


   /// Initialize ourselves from the given CPU index; will overwrite

   /// all data in ourselves
   /// This declaration hides GpuIndexFlat::copyFrom(const faiss::IndexFlat*)
   /// for calls made through GpuIndexFlatIP, and takes a non-const pointer.

   void copyFrom(faiss::IndexFlatIP* index);


   /// Copy ourselves to the given CPU index; will overwrite all data

   /// in the index instance
   /// This declaration hides GpuIndexFlat::copyTo(faiss::IndexFlat*) const.
   /// NOTE(review): unlike the base version it is not const-qualified, so it
   /// cannot be called on a const GpuIndexFlatIP.

   void copyTo(faiss::IndexFlatIP* index);

 };


 } } // namespace gpu, namespace faiss

faiss::IndexFlat
Definition: IndexFlat.h:21

faiss::gpu::GpuIndexFlatConfig::useFloat16Accumulator
bool useFloat16Accumulator
Definition: GpuIndexFlat.h:38

faiss::gpu::GpuIndexFlatConfig::storeTransposed
bool storeTransposed
Definition: GpuIndexFlat.h:46

faiss::gpu::GpuIndexFlatL2::copyFrom
void copyFrom(faiss::IndexFlatL2 *index)
Definition: GpuIndexFlat.cu:297

faiss::gpu::GpuIndexFlat::copyTo
void copyTo(faiss::IndexFlat *index) const
Definition: GpuIndexFlat.cu:100

faiss::gpu::GpuIndexFlat::reconstruct_n
void reconstruct_n(faiss::Index::idx_t i0, faiss::Index::idx_t num, float *out) const override
Batch reconstruction method.
Definition: GpuIndexFlat.cu:243

faiss::gpu::FlatIndex
Holder of GPU resources for a particular flat index.
Definition: FlatIndex.cuh:21

faiss::gpu::GpuIndexFlat::getGpuData
FlatIndex * getGpuData()
For internal access.
Definition: GpuIndexFlat.h:99

faiss::gpu::GpuIndexFlatL2::copyTo
void copyTo(faiss::IndexFlatL2 *index)
Definition: GpuIndexFlat.cu:302

faiss::IndexFlatL2
Definition: IndexFlat.h:77

faiss::gpu::GpuIndexFlat::getNumVecs
size_t getNumVecs() const
Returns the number of vectors we contain.
Definition: GpuIndexFlat.cu:124

faiss::gpu::GpuIndexFlat::searchImpl_
void searchImpl_(int n, const float *x, int k, float *distances, faiss::Index::idx_t *labels) const override
Called from GpuIndex for search.
Definition: GpuIndexFlat.cu:199

faiss::gpu::GpuResources
Definition: GpuResources.h:21

faiss::gpu::GpuIndexFlat::GpuIndexFlat
GpuIndexFlat(GpuResources *resources, const faiss::IndexFlat *index, GpuIndexFlatConfig config=GpuIndexFlatConfig())
Definition: GpuIndexFlat.cu:25

faiss::IndexFlatIP
Definition: IndexFlat.h:71

faiss::gpu::GpuIndexFlatConfig::useFloat16
bool useFloat16
Whether or not data is stored as float16.
Definition: GpuIndexFlat.h:33

faiss::gpu::GpuIndex
Definition: GpuIndex.h:33

faiss::gpu::GpuIndexFlatL2::GpuIndexFlatL2
GpuIndexFlatL2(GpuResources *resources, faiss::IndexFlatL2 *index, GpuIndexFlatConfig config=GpuIndexFlatConfig())
Definition: GpuIndexFlat.cu:284

faiss::Index::idx_t
long idx_t
all indices are this type
Definition: Index.h:62

faiss::gpu::GpuIndexFlatConfig
Definition: GpuIndexFlat.h:25

faiss::gpu::GpuIndexFlat::reconstruct
void reconstruct(faiss::Index::idx_t key, float *out) const override
Definition: GpuIndexFlat.cu:226

faiss::gpu::GpuIndexFlatIP::copyTo
void copyTo(faiss::IndexFlatIP *index)
Definition: GpuIndexFlat.cu:328

faiss::gpu::GpuIndexFlatIP::GpuIndexFlatIP
GpuIndexFlatIP(GpuResources *resources, faiss::IndexFlatIP *index, GpuIndexFlatConfig config=GpuIndexFlatConfig())
Definition: GpuIndexFlat.cu:310

faiss::gpu::GpuIndexFlat::addImpl_
void addImpl_(int n, const float *x, const Index::idx_t *ids) override
Called from GpuIndex for add.
Definition: GpuIndexFlat.cu:178

faiss::gpu::GpuIndexFlatIP
Definition: GpuIndexFlat.h:158

faiss::gpu::GpuIndexFlat::copyFrom
void copyFrom(const faiss::IndexFlat *index)
Definition: GpuIndexFlat.cu:67

faiss::gpu::GpuIndexFlat::addImplRequiresIDs_
bool addImplRequiresIDs_() const override
Flat index does not require IDs as there is no storage available for them.
Definition: GpuIndexFlat.cu:173

faiss::gpu::GpuIndexFlat::config_
const GpuIndexFlatConfig config_
Our config object.
Definition: GpuIndexFlat.h:123

faiss::gpu::GpuIndexFlatL2
Definition: GpuIndexFlat.h:133

faiss::gpu::GpuIndexConfig
Definition: GpuIndex.h:18

faiss::gpu::GpuIndexFlat::add
void add(faiss::Index::idx_t, const float *x) override
Overrides to avoid excessive copies.
Definition: GpuIndexFlat.cu:143

faiss::gpu::GpuIndexFlat
Definition: GpuIndexFlat.h:52

faiss::gpu::GpuIndexFlat::reset
void reset() override
Clears all vectors from this index.
Definition: GpuIndexFlat.cu:129

faiss::gpu::GpuIndexFlatIP::copyFrom
void copyFrom(faiss::IndexFlatIP *index)
Definition: GpuIndexFlat.cu:323

faiss::gpu::GpuIndexFlat::train
void train(Index::idx_t n, const float *x) override
This index is not trained, so this does nothing.
Definition: GpuIndexFlat.cu:138

faiss::MetricType
MetricType
Some algorithms support both an inner product version and a L2 search version.
Definition: Index.h:44

faiss::gpu::GpuIndexFlat::data_
FlatIndex * data_
Definition: GpuIndexFlat.h:127