docs/html/FlatIndex_8cu_source.html

 /**

  * Copyright (c) 2015-present, Facebook, Inc.

  * All rights reserved.

  *

  * This source code is licensed under the CC-by-NC license found in the

  * LICENSE file in the root directory of this source tree.

  */


 // Copyright 2004-present Facebook. All Rights Reserved.


 #include "FlatIndex.cuh"

 #include "Distance.cuh"

 #include "L2Norm.cuh"

 #include "../utils/CopyUtils.cuh"

 #include "../utils/DeviceUtils.h"


 namespace faiss { namespace gpu {


 FlatIndex::FlatIndex(GpuResources* res,

                      int dim,

                      bool l2Distance,

                      bool useFloat16) :

     resources_(res),

     dim_(dim),

     useFloat16_(useFloat16),

     l2Distance_(l2Distance),

     num_(0) {

 #ifndef FAISS_USE_FLOAT16

   FAISS_ASSERT(!useFloat16_);

 #endif

 }


 bool

 FlatIndex::getUseFloat16() const {

   return useFloat16_;

 }


 /// Returns the number of vectors we contain

 int FlatIndex::getSize() const {

 #ifdef FAISS_USE_FLOAT16

   if (useFloat16_) {

     return vectorsHalf_.getSize(0);

   }

 #endif


   return vectors_.getSize(0);

 }


 int FlatIndex::getDim() const {

 #ifdef FAISS_USE_FLOAT16

   if (useFloat16_) {

     return vectorsHalf_.getSize(1);

   }

 #endif


   return vectors_.getSize(1);

 }


 Tensor<float, 2, true>&

 FlatIndex::getVectorsFloat32Ref() {

   return vectors_;

 }


 #ifdef FAISS_USE_FLOAT16

 Tensor<half, 2, true>&

 FlatIndex::getVectorsFloat16Ref() {

   return vectorsHalf_;

 }

 #endif


 DeviceTensor<float, 2, true>

 FlatIndex::getVectorsFloat32Copy(cudaStream_t stream) {

   return getVectorsFloat32Copy(0, num_, stream);

 }


 DeviceTensor<float, 2, true>

 FlatIndex::getVectorsFloat32Copy(int from, int num, cudaStream_t stream) {

   DeviceTensor<float, 2, true> vecFloat32({num, dim_});


   if (useFloat16_) {

 #ifdef FAISS_USE_FLOAT16

     runConvertToFloat32(vecFloat32.data(),

                         vectorsHalf_[from].data(),

                         num * dim_, stream);

 #endif

   } else {

     vectors_.copyTo(vecFloat32, stream);

   }


   return vecFloat32;

 }


 void

 FlatIndex::query(Tensor<float, 2, true>& vecs,

                  int k,

                  Tensor<float, 2, true>& outDistances,

                  Tensor<int, 2, true>& outIndices,

                  bool exactDistance,

                  int tileSize) {

   auto stream = resources_->getDefaultStreamCurrentDevice();

   auto& mem = resources_->getMemoryManagerCurrentDevice();


   if (useFloat16_) {

     // We need to convert to float16

 #ifdef FAISS_USE_FLOAT16

     auto vecsHalf = toHalf<2>(resources_, stream, vecs);


     DeviceTensor<half, 2, true> outDistancesHalf(

       mem, {outDistances.getSize(0), outDistances.getSize(1)}, stream);


     query(vecsHalf, k, outDistancesHalf, outIndices, exactDistance, tileSize);


     if (exactDistance) {

       // Convert outDistances back

       fromHalf<2>(stream, outDistancesHalf, outDistances);

     }

 #endif

   } else {

     if (l2Distance_) {

       runL2Distance(resources_,

                     vectors_,

                     &norms_,

                     vecs,

                     k,

                     outDistances,

                     outIndices,

                     // FIXME

                     !exactDistance,

                     tileSize);

     } else {

       runIPDistance(resources_,

                     vectors_,

                     vecs,

                     k,

                     outDistances,

                     outIndices,

                     tileSize);

     }

   }

 }


 #ifdef FAISS_USE_FLOAT16

 void

 FlatIndex::query(Tensor<half, 2, true>& vecs,

                  int k,

                  Tensor<half, 2, true>& outDistances,

                  Tensor<int, 2, true>& outIndices,

                  bool exactDistance,

                  int tileSize) {

   FAISS_ASSERT(useFloat16_);


   if (l2Distance_) {

     runL2Distance(resources_,

                   vectorsHalf_,

                   &normsHalf_,

                   vecs,

                   k,

                   outDistances,

                   outIndices,

                   // FIXME

                   !exactDistance,

                   tileSize);

   } else {

     runIPDistance(resources_,

                   vectorsHalf_,

                   vecs,

                   k,

                   outDistances,

                   outIndices,

                   tileSize);

   }

 }

 #endif


 void

 FlatIndex::add(const float* data, int numVecs, cudaStream_t stream) {

   if (numVecs == 0) {

     return;

   }


   if (useFloat16_) {

 #ifdef FAISS_USE_FLOAT16

     // Make sure that `data` is on our device; we'll run the

     // conversion on our device

     auto devData = toDevice<float, 2>(resources_,

                                       getCurrentDevice(),

                                       (float*) data,

                                       stream,

                                       {numVecs, dim_});


     auto devDataHalf = toHalf<2>(resources_, stream, devData);


     rawData_.append((char*) devDataHalf.data(),

                     devDataHalf.getSizeInBytes(),

                     stream);

 #endif

   } else {

     rawData_.append((char*) data,

                     (size_t) dim_ * numVecs * sizeof(float),

                     stream);

   }


   num_ += numVecs;


   if (useFloat16_) {

 #ifdef FAISS_USE_FLOAT16

     DeviceTensor<half, 2, true> vectorsHalf(

       (half*) rawData_.data(), {(int) num_, dim_});

     vectorsHalf_ = std::move(vectorsHalf);

 #endif

   } else {

     DeviceTensor<float, 2, true> vectors(

     (float*) rawData_.data(), {(int) num_, dim_});

     vectors_ = std::move(vectors);

   }


   if (l2Distance_) {

     // Precompute L2 norms of our database

     if (useFloat16_) {

 #ifdef FAISS_USE_FLOAT16

       DeviceTensor<half, 1, true> normsHalf({(int) num_});

       runL2Norm(vectorsHalf_, normsHalf, true, stream);

       normsHalf_ = std::move(normsHalf);

 #endif

     } else {

       DeviceTensor<float, 1, true> norms({(int) num_});

       runL2Norm(vectors_, norms, true, stream);

       norms_ = std::move(norms);

     }

   }

 }


 void

 FlatIndex::reset() {

   rawData_.clear();

   vectors_ = std::move(DeviceTensor<float, 2, true>());

   norms_ = std::move(DeviceTensor<float, 1, true>());

   num_ = 0;

 }


 } }

faiss::gpu::FlatIndex::getVectorsFloat32Copy
DeviceTensor< float, 2, true > getVectorsFloat32Copy(cudaStream_t stream)
Definition: FlatIndex.cu:73

faiss::gpu::FlatIndex::getSize
int getSize() const
Returns the number of vectors we contain.
Definition: FlatIndex.cu:40

faiss::gpu::Tensor::copyTo
__host__ void copyTo(Tensor< T, Dim, Contig, IndexT, PtrTraits > &t, cudaStream_t stream)
Copies ourselves into a tensor; sizes must match.
Definition: Tensor-inl.cuh:139

faiss::gpu::FlatIndex::add
void add(const float *data, int numVecs, cudaStream_t stream)
Definition: FlatIndex.cu:177

faiss::gpu::Tensor
Our tensor type.
Definition: Tensor.cuh:31

faiss::gpu::Tensor::getSize
__host__ __device__ IndexT getSize(int i) const
Definition: Tensor.cuh:210

faiss::gpu::FlatIndex::getVectorsFloat32Ref
Tensor< float, 2, true > & getVectorsFloat32Ref()
Returns a reference to our vectors currently in use.
Definition: FlatIndex.cu:61

faiss::gpu::FlatIndex::reset
void reset()
Free all storage.
Definition: FlatIndex.cu:235

faiss::gpu::DeviceTensor< float, 2, true >