docs/html/IndexScalarQuantizer_8h_source.html

 /**

  * Copyright (c) 2015-present, Facebook, Inc.

  * All rights reserved.

  *

  * This source code is licensed under the BSD+Patents license found in the

  * LICENSE file in the root directory of this source tree.

  */


 // -*- c++ -*-


 #ifndef FAISS_INDEX_SCALAR_QUANTIZER_H

 #define FAISS_INDEX_SCALAR_QUANTIZER_H


 #include <stdint.h>


 #include <vector>


 #include "IndexIVF.h"


 namespace faiss {


 /**

  * The uniform quantizer has a range [vmin, vmax]. The range can be

  * the same for all dimensions (uniform) or specific per dimension

  * (default).

  */


 struct ScalarQuantizer {

     /// How each vector component is encoded.

     enum QuantizerType {

         QT_8bit,             ///< 8 bits per component

         QT_4bit,             ///< 4 bits per component

         QT_8bit_uniform,     ///< 8 bits per component, shared range for all dimensions

         QT_4bit_uniform,     ///< NOTE(review): presumably 4 bits per component, shared range for all dimensions -- confirm

         QT_fp16,             ///< NOTE(review): presumably one 16-bit float per component -- confirm

     };


     /// encoding selected for this quantizer

     QuantizerType qtype;


     /** The uniform encoder can estimate the range of representable
      * values using different statistics of the training data. In the
      * formulas below, rs = rangestat_arg. */

     enum RangeStat {

         RS_minmax,           ///< [min - rs*(max-min), max + rs*(max-min)]

         RS_meanstd,          ///< [mean - std * rs, mean + std * rs]

         RS_quantiles,        ///< [Q(rs), Q(1-rs)]

         RS_optim,            ///< alternate optimization of reconstruction error

     };


     /// statistic used to estimate the range (see RangeStat)

     RangeStat rangestat;

     /// argument "rs" of the selected range statistic

     float rangestat_arg;


     /// dimension of input vectors

     size_t d;


     /// bytes per vector

     size_t code_size;


     /// trained values (including the range)

     std::vector<float> trained;


     /// Build a quantizer for d-dimensional vectors encoded as qtype.

     ScalarQuantizer (size_t d, QuantizerType qtype);

     /// Default constructor.
     /// NOTE(review): member values after default construction are set in
     /// the implementation file, which is not visible here.

     ScalarQuantizer ();


     /// Train the quantizer on n vectors stored in x.
     /// NOTE(review): presumably x holds n * d floats and the result is
     /// stored in `trained` -- confirm against the implementation.

     void train (size_t n, const float *x);


     /// Encode n vectors from x into codes.
     /// NOTE(review): presumably codes must provide n * code_size bytes --
     /// confirm against the implementation.

     void compute_codes (const float * x,

                         uint8_t * codes,

                         size_t n) const ;


     /// Decode n vectors from their codes into x (n is mandatory; pass 1
     /// to decode a single vector).

     void decode (const uint8_t *code, float *x, size_t n) const;


     // fast, non thread-safe way of computing vector-to-code and

     // code-to-code distances.

     struct DistanceComputer {


         /// vector-to-code distance computation

         virtual float compute_distance (const float *x,

                                         const uint8_t *code) const = 0;


         /// code-to-code distance computation

         virtual float compute_code_distance (const uint8_t *code1,

                                              const uint8_t *code2) const = 0;

         /// virtual destructor so implementations can be deleted through
         /// a DistanceComputer pointer

         virtual ~DistanceComputer () {}

     };


     /// Get a distance computer for the given metric (L2 by default).
     /// NOTE(review): a raw pointer is returned; ownership presumably
     /// passes to the caller, who must delete it -- confirm.

     DistanceComputer *get_distance_computer (MetricType metric = METRIC_L2)

         const;


 };


 /// Index whose vectors are stored as scalar-quantized codes (see `sq`).

 struct IndexScalarQuantizer: Index {

     /// Used to encode the vectors

     ScalarQuantizer sq;


     /// Codes. Size ntotal * sq.code_size

     std::vector<uint8_t> codes;


     /// NOTE(review): presumably a copy of sq.code_size (bytes per encoded
     /// vector) -- confirm against the constructor implementation.

     size_t code_size;


     /** Constructor.

      *

      * @param d      dimensionality of the input vectors

      * @param qtype  how components are encoded
      *               (see ScalarQuantizer::QuantizerType)

      * @param metric metric type used by the index (METRIC_L2 by default)

      */

     IndexScalarQuantizer (int d,

                           ScalarQuantizer::QuantizerType qtype,

                           MetricType metric = METRIC_L2);


     /// Default constructor.

     IndexScalarQuantizer ();


     /// Overrides Index::train; takes n training vectors in x.

     void train(idx_t n, const float* x) override;


     /// Overrides Index::add; takes n vectors in x to add to the index.

     void add(idx_t n, const float* x) override;


     /// Overrides Index::search; n query vectors in x, k results per
     /// query written to distances and labels.
     /// NOTE(review): output buffers presumably hold n * k entries each --
     /// confirm against Index::search.

     void search(

         idx_t n,

         const float* x,

         idx_t k,

         float* distances,

         idx_t* labels) const override;


     /// removes all elements from the database.

     void reset() override;


     /// Overrides Index::reconstruct_n; reconstructs ni vectors starting
     /// at index i0 into recons.

     void reconstruct_n(idx_t i0, idx_t ni, float* recons) const override;


     /// Overrides Index::reconstruct; reconstructs the vector with the
     /// given key into recons.

     void reconstruct(idx_t key, float* recons) const override;


 };


  /** An IVF implementation where the components of the residuals are

  * encoded with a scalar uniform quantizer. All distance computations

  * are asymmetric, so the encoded vectors are decoded and approximate

  * distances are computed.

  */


 struct IndexIVFScalarQuantizer: IndexIVF {

     /// scalar quantizer used to encode the vector components

     ScalarQuantizer sq;


     /** Constructor.
      *
      * @param quantizer  quantizer that maps vectors to inverted lists
      * @param d          dimensionality of the input vectors
      * @param nlist      number of inverted lists (possible key values)
      * @param qtype      how components are encoded
      *                   (see ScalarQuantizer::QuantizerType)
      * @param metric     metric type used by the index (METRIC_L2 by default)
      */

     IndexIVFScalarQuantizer(Index *quantizer, size_t d, size_t nlist,

                             ScalarQuantizer::QuantizerType qtype,

                             MetricType metric = METRIC_L2);


     /// Default constructor.

     IndexIVFScalarQuantizer();


     /// Overrides IndexIVF::train_residual; takes n training vectors in x.
     /// NOTE(review): presumably trains `sq` -- confirm against the
     /// implementation.

     void train_residual(idx_t n, const float* x) override;


     /// Overrides IndexIVF::encode_vectors; encodes n vectors from x into
     /// codes, with list_nos giving one inverted-list number per vector.
     /// NOTE(review): layout and size of `codes` are defined by the base
     /// class contract -- confirm against IndexIVF.

     void encode_vectors(idx_t n, const float* x,

                         const idx_t *list_nos,

                         uint8_t * codes) const override;


     /// Overrides IndexIVF::add_with_ids; adds n vectors from x with the
     /// ids given in xids.

     void add_with_ids(idx_t n, const float* x, const long* xids) override;


     /// get a scanner for this index (store_pairs means ignore labels)
     /// NOTE(review): a raw pointer is returned; ownership presumably
     /// passes to the caller -- confirm.

     InvertedListScanner *get_InvertedListScanner (bool store_pairs)

         const override;


     /// Overrides IndexIVF::reconstruct_from_offset; reconstructs into
     /// recons the vector stored at position `offset` of inverted list
     /// `list_no`.

     void reconstruct_from_offset (long list_no, long offset,

                                   float* recons) const override;


 };


 }


 #endif

faiss::IndexIVF
Definition: IndexIVF.h:91

faiss::IndexIVFScalarQuantizer::encode_vectors
void encode_vectors(idx_t n, const float *x, const idx_t *list_nos, uint8_t *codes) const override
Definition: IndexScalarQuantizer.cpp:1155

faiss::ScalarQuantizer::code_size
size_t code_size
bytes per vector
Definition: IndexScalarQuantizer.h:63

faiss::ScalarQuantizer::QuantizerType
QuantizerType
Definition: IndexScalarQuantizer.h:34

faiss::IndexScalarQuantizer::search
void search(idx_t n, const float *x, idx_t k, float *distances, idx_t *labels) const override
Definition: IndexScalarQuantizer.cpp:1072

faiss::IndexIVFScalarQuantizer::train_residual
void train_residual(idx_t n, const float *x) override
Definition: IndexScalarQuantizer.cpp:1129

faiss::ScalarQuantizer::RS_optim
alternate optimization of reconstruction error
Definition: IndexScalarQuantizer.h:53

faiss::IndexScalarQuantizer
Definition: IndexScalarQuantizer.h:102

faiss::ScalarQuantizer::QT_8bit_uniform
same, shared range for all dimensions
Definition: IndexScalarQuantizer.h:37

faiss::IndexIVFScalarQuantizer::reconstruct_from_offset
void reconstruct_from_offset(long list_no, long offset, float *recons) const override
Definition: IndexScalarQuantizer.cpp:1418

faiss::IndexScalarQuantizer::add
void add(idx_t n, const float *x) override
Definition: IndexScalarQuantizer.cpp:1017

faiss::ScalarQuantizer::QT_4bit
4 bits per component
Definition: IndexScalarQuantizer.h:36

faiss::ScalarQuantizer::DistanceComputer::compute_distance
virtual float compute_distance(const float *x, const uint8_t *code) const =0
vector-to-code distance computation

faiss::IndexScalarQuantizer::reset
void reset() override
removes all elements from the database.
Definition: IndexScalarQuantizer.cpp:1087

faiss::ScalarQuantizer
Definition: IndexScalarQuantizer.h:32

faiss::IndexIVFScalarQuantizer::add_with_ids
void add_with_ids(idx_t n, const float *x, const long *xids) override
Definition: IndexScalarQuantizer.cpp:1188

faiss::Index::d
int d
vector dimension
Definition: Index.h:66

faiss::IndexScalarQuantizer::codes
std::vector< uint8_t > codes
Codes. Size ntotal * sq.code_size.
Definition: IndexScalarQuantizer.h:107

faiss::ScalarQuantizer::DistanceComputer
Definition: IndexScalarQuantizer.h:84

faiss::IndexScalarQuantizer::sq
ScalarQuantizer sq
Used to encode the vectors.
Definition: IndexScalarQuantizer.h:104

faiss::Index::idx_t
long idx_t
all indices are this type
Definition: Index.h:64

faiss::ScalarQuantizer::RangeStat
RangeStat
Definition: IndexScalarQuantizer.h:49

faiss::IndexIVFScalarQuantizer
Definition: IndexScalarQuantizer.h:149

faiss::ScalarQuantizer::RS_quantiles
[Q(rs), Q(1-rs)]
Definition: IndexScalarQuantizer.h:52

faiss::ScalarQuantizer::RS_meanstd
[mean - std * rs, mean + std * rs]
Definition: IndexScalarQuantizer.h:51

faiss::InvertedListScanner
Definition: IndexIVF.h:261

faiss::ScalarQuantizer::decode
void decode(const uint8_t *code, float *x, size_t n) const
decode a vector from a given code (or n vectors if third argument)
Definition: IndexScalarQuantizer.cpp:955

faiss::IndexIVFScalarQuantizer::get_InvertedListScanner
InvertedListScanner * get_InvertedListScanner(bool store_pairs) const override
get a scanner for this index (store_pairs means ignore labels)
Definition: IndexScalarQuantizer.cpp:1404

faiss::ScalarQuantizer::compute_codes
void compute_codes(const float *x, uint8_t *codes, size_t n) const
same as compute_code for several vectors
Definition: IndexScalarQuantizer.cpp:943

faiss::ScalarQuantizer::DistanceComputer::compute_code_distance
virtual float compute_code_distance(const uint8_t *code1, const uint8_t *code2) const =0
code-to-code distance computation

faiss::ScalarQuantizer::QT_8bit
8 bits per component
Definition: IndexScalarQuantizer.h:35

faiss::Index
Definition: Index.h:62

faiss::IndexScalarQuantizer::reconstruct_n
void reconstruct_n(idx_t i0, idx_t ni, float *recons) const override
Definition: IndexScalarQuantizer.cpp:1093

faiss::IndexScalarQuantizer::reconstruct
void reconstruct(idx_t key, float *recons) const override
Definition: IndexScalarQuantizer.cpp:1103

faiss::ScalarQuantizer::RS_minmax
[min - rs*(max-min), max + rs*(max-min)]
Definition: IndexScalarQuantizer.h:50

faiss::ScalarQuantizer::trained
std::vector< float > trained
trained values (including the range)
Definition: IndexScalarQuantizer.h:66

faiss::Level1Quantizer::quantizer
Index * quantizer
quantizer that maps vectors to inverted lists
Definition: IndexIVF.h:33

faiss::IndexScalarQuantizer::train
void train(idx_t n, const float *x) override
Definition: IndexScalarQuantizer.cpp:1011

faiss::ScalarQuantizer::d
size_t d
dimension of input vectors
Definition: IndexScalarQuantizer.h:60

faiss::Level1Quantizer::nlist
size_t nlist
number of possible key values
Definition: IndexIVF.h:34

faiss::MetricType
MetricType
Some algorithms support both an inner product version and an L2 search version.
Definition: Index.h:45