faiss/gpu/GpuIndexIVFScalarQuantizer.cu

/**
 * Copyright (c) Facebook, Inc. and its affiliates.
 *
 * This source code is licensed under the MIT license found in the
 * LICENSE file in the root directory of this source tree.
 */
#include <faiss/gpu/GpuIndexIVFScalarQuantizer.h>
#include <faiss/gpu/GpuIndexFlat.h>
#include <faiss/gpu/GpuResources.h>
#include <faiss/gpu/impl/GpuScalarQuantizer.cuh>
#include <faiss/gpu/impl/IVFFlat.cuh>
#include <faiss/gpu/utils/CopyUtils.cuh>
#include <faiss/gpu/utils/DeviceUtils.h>
#include <limits>

namespace faiss { namespace gpu {

GpuIndexIVFScalarQuantizer::GpuIndexIVFScalarQuantizer(
    GpuResources* resources,
    const faiss::IndexIVFScalarQuantizer* index,
    GpuIndexIVFScalarQuantizerConfig config) :
    GpuIndexIVF(resources,
                index->d,
                index->metric_type,
                index->metric_arg,
                index->nlist,
                config),
    ivfSQConfig_(config),
    sq(index->sq),
    by_residual(index->by_residual),
    reserveMemoryVecs_(0),
    index_(nullptr) {
  copyFrom(index);

  FAISS_THROW_IF_NOT_MSG(isSQSupported(sq.qtype),
                         "Unsupported QuantizerType on GPU");
}

GpuIndexIVFScalarQuantizer::GpuIndexIVFScalarQuantizer(
    GpuResources* resources,
    int dims,
    int nlist,
    faiss::ScalarQuantizer::QuantizerType qtype,
    faiss::MetricType metric,
    bool encodeResidual,
    GpuIndexIVFScalarQuantizerConfig config) :
    GpuIndexIVF(resources, dims, metric, 0, nlist, config),
    ivfSQConfig_(config),
    sq(dims, qtype),
    by_residual(encodeResidual),
    reserveMemoryVecs_(0),
    index_(nullptr) {
  // faiss::Index params
  this->is_trained = false;

  // We haven't trained ourselves, so don't construct the IVFFlat
  // index yet
  FAISS_THROW_IF_NOT_MSG(isSQSupported(sq.qtype),
                         "Unsupported QuantizerType on GPU");
}

GpuIndexIVFScalarQuantizer::~GpuIndexIVFScalarQuantizer() {
  delete index_;
}

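// Reserve GPU memory in our inverted lists for this number of vectors, to
// avoid incremental reallocation as vectors are added. If the IVF structure
// already exists the reservation is applied immediately; otherwise it is
// deferred until train() constructs it.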
void
GpuIndexIVFScalarQuantizer::reserveMemory(size_t numVecs) {
  reserveMemoryVecs_ = numVecs;

  if (index_) {
    DeviceScope scope(device_);
    index_->reserveMemory(numVecs);
  }
}

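// Initialize ourselves from the given CPU index; this will overwrite all
// data currently held in this GPU index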
void
GpuIndexIVFScalarQuantizer::copyFrom(
    const faiss::IndexIVFScalarQuantizer* index) {
  DeviceScope scope(device_);

  // Clear out our old data
  delete index_;
  index_ = nullptr;

  // Copy what we need from the CPU index
  GpuIndexIVF::copyFrom(index);
  sq = index->sq;
  by_residual = index->by_residual;

  // The other index might not be trained, in which case we don't need to copy
  // over the lists
  if (!index->is_trained) {
    return;
  }

  // Otherwise, we can populate ourselves from the other index
  this->is_trained = true;

  // Copy our lists as well
  index_ = new IVFFlat(resources_,
                       quantizer->getGpuData(),
                       index->metric_type,
                       index->metric_arg,
                       by_residual,
                       &sq,
                       ivfSQConfig_.indicesOptions,
                       memorySpace_);

  InvertedLists* ivf = index->invlists;
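
  // Copy each CPU inverted list (encoded vectors plus ids) over to the GPU,
  // list by list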
  for (size_t i = 0; i < ivf->nlist; ++i) {
    auto numVecs = ivf->list_size(i);

    // GPU index can only support max int entries per list
    FAISS_THROW_IF_NOT_FMT(numVecs <=
                           (size_t) std::numeric_limits<int>::max(),
                           "GPU inverted list can only support "
                           "%zu entries; %zu found",
                           (size_t) std::numeric_limits<int>::max(),
                           numVecs);

    index_->addCodeVectorsFromCpu(
      i,
      (const unsigned char*) ivf->get_codes(i),
      ivf->get_ids(i),
      numVecs);
  }
}

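// Copy ourselves to the given CPU index; this will overwrite all data in
// the CPU index instance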
void
GpuIndexIVFScalarQuantizer::copyTo(
    faiss::IndexIVFScalarQuantizer* index) const {
  DeviceScope scope(device_);

  // We must have the indices in order to copy to ourselves
  FAISS_THROW_IF_NOT_MSG(
    ivfSQConfig_.indicesOptions != INDICES_IVF,
    "Cannot copy to CPU as GPU index doesn't retain "
    "indices (INDICES_IVF)");

  GpuIndexIVF::copyTo(index);
  index->sq = sq;
  index->code_size = sq.code_size;
  index->by_residual = by_residual;

  InvertedLists* ivf = new ArrayInvertedLists(nlist, index->code_size);
  index->replace_invlists(ivf, true);

  // Copy the inverted lists
  if (index_) {
    for (int i = 0; i < nlist; ++i) {
      auto listIndices = index_->getListIndices(i);
      auto listData = index_->getListVectors(i);

      ivf->add_entries(i,
                       listIndices.size(),
                       listIndices.data(),
                       (const uint8_t*) listData.data());
    }
  }
}

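// After adding vectors, one can call this to reclaim device memory to
// exactly the amount needed; returns the space reclaimed in bytes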
size_t
GpuIndexIVFScalarQuantizer::reclaimMemory() {
  if (index_) {
    DeviceScope scope(device_);

    return index_->reclaimMemory();
  }

  return 0;
}

void
GpuIndexIVFScalarQuantizer::reset() {
  if (index_) {
    DeviceScope scope(device_);

    index_->reset();
    this->ntotal = 0;
  } else {
    FAISS_ASSERT(this->ntotal == 0);
  }
}

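// Called from train() below to train the scalar quantizer, on residuals
// relative to the coarse centroids if by_residual is set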
void
GpuIndexIVFScalarQuantizer::trainResiduals_(Index::idx_t n, const float* x) {
  // The input is already guaranteed to be on the CPU
  sq.train_residual(n, x, quantizer, by_residual, verbose);
}

void
GpuIndexIVFScalarQuantizer::train(Index::idx_t n, const float* x) {
  DeviceScope scope(device_);

  if (this->is_trained) {
    FAISS_ASSERT(quantizer->is_trained);
    FAISS_ASSERT(quantizer->ntotal == nlist);
    FAISS_ASSERT(index_);
    return;
  }

  FAISS_ASSERT(!index_);

  // FIXME: GPUize more of this
  // First, make sure that the data is resident on the CPU (copying it there
  // if needed), as we depend upon parts of the CPU code
  auto hostData = toHost<float, 2>((float*) x,
                                   resources_->getDefaultStream(device_),
                                   {(int) n, (int) this->d});

  trainQuantizer_(n, hostData.data());
  trainResiduals_(n, hostData.data());

  // The quantizer is now trained; construct the IVF index
  index_ = new IVFFlat(resources_,
                       quantizer->getGpuData(),
                       this->metric_type,
                       this->metric_arg,
                       by_residual,
                       &sq,
                       ivfSQConfig_.indicesOptions,
                       memorySpace_);

  if (reserveMemoryVecs_) {
    index_->reserveMemory(reserveMemoryVecs_);
  }

  this->is_trained = true;
}

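// Called from GpuIndex for add/add_with_ids, with the vector data already
// copied to the device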
void
GpuIndexIVFScalarQuantizer::addImpl_(int n,
                                     const float* x,
                                     const Index::idx_t* xids) {
  // Device is already set in GpuIndex::add
  FAISS_ASSERT(index_);
  FAISS_ASSERT(n > 0);

  // Data is already resident on the GPU
  Tensor<float, 2, true> data(const_cast<float*>(x), {n, (int) this->d});

  static_assert(sizeof(long) == sizeof(Index::idx_t), "size mismatch");
  Tensor<long, 1, true> labels(const_cast<long*>(xids), {n});

  // Not all vectors may be able to be added (some may contain NaNs etc)
  index_->classifyAndAddVectors(data, labels);

  // but keep the ntotal based on the total number of vectors that we attempted
  // to add
  ntotal += n;
}

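// Called from GpuIndex for search, with the queries and the distance/label
// output buffers already resident on the device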
void
GpuIndexIVFScalarQuantizer::searchImpl_(int n,
                                        const float* x,
                                        int k,
                                        float* distances,
                                        Index::idx_t* labels) const {
  // Device is already set in GpuIndex::search
  FAISS_ASSERT(index_);
  FAISS_ASSERT(n > 0);

  // Data is already resident on the GPU
  Tensor<float, 2, true> queries(const_cast<float*>(x), {n, (int) this->d});
  Tensor<float, 2, true> outDistances(distances, {n, k});

  static_assert(sizeof(long) == sizeof(Index::idx_t), "size mismatch");
  Tensor<long, 2, true> outLabels(const_cast<long*>(labels), {n, k});

  index_->query(queries, nprobe, k, outDistances, outLabels);
}

} } // namespace