docs/html/FlatIndex_8cuh_source.html

 /**

  * Copyright (c) 2015-present, Facebook, Inc.

  * All rights reserved.

  *

  * This source code is licensed under the BSD+Patents license found in the

  * LICENSE file in the root directory of this source tree.

  */


 // Copyright 2004-present Facebook. All Rights Reserved.


 #pragma once


 #include "../utils/DeviceTensor.cuh"

 #include "../utils/DeviceVector.cuh"

 #include "../utils/Float16.cuh"

 #include "../utils/MemorySpace.h"


 namespace faiss { namespace gpu {


 class GpuResources;


 /// Holder of GPU resources for a particular flat index

 class FlatIndex {

  public:

   FlatIndex(GpuResources* res,

             int dim,

             bool l2Distance,

             bool useFloat16,

             bool useFloat16Accumulator,

             bool storeTransposed,

             MemorySpace space);


   bool getUseFloat16() const;


   /// Returns the number of vectors we contain

   int getSize() const;


   int getDim() const;


   /// Reserve storage that can contain at least this many vectors

   void reserve(size_t numVecs, cudaStream_t stream);


   /// Returns a reference to our vectors currently in use

   Tensor<float, 2, true>& getVectorsFloat32Ref();


 #ifdef FAISS_USE_FLOAT16

   /// Returns a reference to our vectors currently in use (useFloat16 mode)

   Tensor<half, 2, true>& getVectorsFloat16Ref();

 #endif


   /// Performs a copy of the vectors on the given device, converting

   /// as needed from float16

   DeviceTensor<float, 2, true> getVectorsFloat32Copy(cudaStream_t stream);


   /// Returns only a subset of the vectors

   DeviceTensor<float, 2, true> getVectorsFloat32Copy(int from,

                                                      int num,

                                                      cudaStream_t stream);


   void query(Tensor<float, 2, true>& vecs,

              int k,

              Tensor<float, 2, true>& outDistances,

              Tensor<int, 2, true>& outIndices,

              bool exactDistance,

              int tileSize = -1);


 #ifdef FAISS_USE_FLOAT16

   void query(Tensor<half, 2, true>& vecs,

              int k,

              Tensor<half, 2, true>& outDistances,

              Tensor<int, 2, true>& outIndices,

              bool exactDistance,

              int tileSize = -1);

 #endif


   /// Add vectors to ourselves; the pointer passed can be on the host

   /// or the device

   void add(const float* data, int numVecs, cudaStream_t stream);


   /// Free all storage

   void reset();


  private:

   /// Collection of GPU resources that we use

   GpuResources* resources_;


   /// Dimensionality of our vectors

   const int dim_;


   /// Float16 data format

   const bool useFloat16_;


   /// For supporting hardware, whether or not we use Hgemm

   const bool useFloat16Accumulator_;


   /// Store vectors in transposed layout for speed; makes addition to

   /// the index slower

   const bool storeTransposed_;


   /// L2 or inner product distance?

   bool l2Distance_;


   /// Memory space for our allocations

   MemorySpace space_;


   /// How many vectors we have

   int num_;


   /// The underlying expandable storage

   DeviceVector<char> rawData_;


   /// Vectors currently in rawData_

   DeviceTensor<float, 2, true> vectors_;

   DeviceTensor<float, 2, true> vectorsTransposed_;


 #ifdef FAISS_USE_FLOAT16

   /// Vectors currently in rawData_, float16 form

   DeviceTensor<half, 2, true> vectorsHalf_;

   DeviceTensor<half, 2, true> vectorsHalfTransposed_;

 #endif


   /// Precomputed L2 norms

   DeviceTensor<float, 1, true> norms_;


 #ifdef FAISS_USE_FLOAT16

   /// Precomputed L2 norms, float16 form

   DeviceTensor<half, 1, true> normsHalf_;

 #endif

 };


 } } // namespace

faiss::gpu::FlatIndex::getVectorsFloat32Copy
DeviceTensor< float, 2, true > getVectorsFloat32Copy(cudaStream_t stream)
Definition: FlatIndex.cu:91

faiss::gpu::FlatIndex::getSize
int getSize() const
Returns the number of vectors we contain.
Definition: FlatIndex.cu:47

faiss::gpu::FlatIndex
Holder of GPU resources for a particular flat index.
Definition: FlatIndex.cuh:23

faiss::gpu::GpuResources
Definition: GpuResources.h:23

faiss::gpu::DeviceVector< char >

faiss::gpu::FlatIndex::reserve
void reserve(size_t numVecs, cudaStream_t stream)
Reserve storage that can contain at least this many vectors.
Definition: FlatIndex.cu:68

faiss::gpu::FlatIndex::add
void add(const float *data, int numVecs, cudaStream_t stream)
Definition: FlatIndex.cu:201

faiss::gpu::Tensor
Our tensor type.
Definition: Tensor.cuh:30

faiss::gpu::FlatIndex::getVectorsFloat32Ref
Tensor< float, 2, true > & getVectorsFloat32Ref()
Returns a reference to our vectors currently in use.
Definition: FlatIndex.cu:79

faiss::gpu::FlatIndex::reset
void reset()
Free all storage.
Definition: FlatIndex.cu:273

faiss::gpu::DeviceTensor< float, 2, true >