faiss/IndexScalarQuantizer.h

/**
 * Copyright (c) 2015-present, Facebook, Inc.
 * All rights reserved.
 *
 * This source code is licensed under the BSD+Patents license found in the
 * LICENSE file in the root directory of this source tree.
 */

// -*- c++ -*-

#ifndef FAISS_INDEX_SCALAR_QUANTIZER_H
#define FAISS_INDEX_SCALAR_QUANTIZER_H

#include <stdint.h>


#include <vector>


#include "IndexIVF.h"


namespace faiss {

/**
 * The uniform quantizer has a range [vmin, vmax]. The range can be
 * the same for all dimensions (uniform) or specific per dimension
 * (default).
 */

struct SQDistanceComputer;

/** Scalar quantizer: holds the encoding type, the range-estimation
 * settings and the trained parameters, and declares the train /
 * encode / decode entry points (all defined outside this header).
 */
struct ScalarQuantizer {

    /// Encoding applied to the vector components.
    enum QuantizerType {
        QT_8bit,             ///< 8 bits per component
        QT_4bit,             ///< 4 bits per component
        QT_8bit_uniform,     ///< same, shared range for all dimensions
        /// presumably the 4-bit counterpart of QT_8bit_uniform -- TODO confirm
        QT_4bit_uniform,
        /// presumably a 16-bit floating-point encoding -- TODO confirm
        QT_fp16,
        QT_8bit_direct,      ///< fast indexing of uint8s
    };

    /// encoding selected for this quantizer
    QuantizerType qtype;

    /** The uniform encoder can estimate the range of representable
     * values using different statistics. In the formulas below,
     * rs = rangestat_arg. */
    enum RangeStat {
        RS_minmax,           ///< [min - rs*(max-min), max + rs*(max-min)]
        RS_meanstd,          ///< [mean - std * rs, mean + std * rs]
        RS_quantiles,        ///< [Q(rs), Q(1-rs)]
        RS_optim,            ///< alternate optimization of reconstruction error
    };

    /// statistic used to estimate the range
    RangeStat rangestat;
    /// argument of the range statistic (rs in the RangeStat formulas)
    float rangestat_arg;

    /// dimension of input vectors
    size_t d;

    /// bytes per vector
    size_t code_size;

    /// trained values (including the range)
    std::vector<float> trained;

    /// Build a quantizer for vectors of dimension d encoded with qtype.
    ScalarQuantizer (size_t d, QuantizerType qtype);
    /// Default constructor; the values it assigns are set in the
    /// implementation file, not visible from this header.
    ScalarQuantizer ();

    /// Train the quantizer on n vectors stored in x
    /// (presumably n * d floats, stored contiguously -- TODO confirm).
    void train (size_t n, const float *x);


    /// Encode the n vectors in x into codes
    /// (presumably code_size bytes per vector -- TODO confirm).
    void compute_codes (const float * x,
                        uint8_t * codes,
                        size_t n) const ;

    /// Decode n vectors from code into x. n is a mandatory argument
    /// (there is no default value).
    void decode (const uint8_t *code, float *x, size_t n) const;


    /// Return a distance computer for the given metric (METRIC_L2 by
    /// default). NOTE(review): a raw pointer is returned and this header
    /// does not state who owns it -- confirm against the implementation.
    SQDistanceComputer *get_distance_computer (MetricType metric = METRIC_L2)
        const;

};

struct DistanceComputer;

/** Index whose vectors are encoded with a ScalarQuantizer and kept in
 * a single array of codes.
 */
struct IndexScalarQuantizer: Index {
    /// Used to encode the vectors
    ScalarQuantizer sq;

    /// Codes. Size ntotal * sq.code_size
    std::vector<uint8_t> codes;

    /// NOTE(review): presumably a copy of sq.code_size -- confirm in the
    /// implementation file.
    size_t code_size;

    /** Constructor.
     *
     * @param d      dimensionality of the input vectors
     * @param qtype  type of scalar quantizer used to encode the vectors
     * @param metric metric type, METRIC_L2 by default
     */
    IndexScalarQuantizer (int d,
                          ScalarQuantizer::QuantizerType qtype,
                          MetricType metric = METRIC_L2);

    /// Default constructor; the values it assigns are set in the
    /// implementation file, not visible from this header.
    IndexScalarQuantizer ();

    /// Train on the n vectors in x (overrides the base-class method).
    void train(idx_t n, const float* x) override;

    /// Add the n vectors in x to the index (overrides the base-class method).
    void add(idx_t n, const float* x) override;

    /// Search the k nearest neighbors of the n query vectors in x; the
    /// results are written to distances and labels (presumably n * k
    /// entries each -- confirm against the base-class documentation).
    void search(
        idx_t n,
        const float* x,
        idx_t k,
        float* distances,
        idx_t* labels) const override;

    /// Overrides the base-class reset (presumably empties the stored
    /// codes -- TODO confirm).
    void reset() override;

    /// Reconstruct ni vectors, starting at index i0, into recons
    /// (overrides the base-class method).
    void reconstruct_n(idx_t i0, idx_t ni, float* recons) const override;

    /// Reconstruct the vector identified by key into recons
    /// (overrides the base-class method).
    void reconstruct(idx_t key, float* recons) const override;

    /// Return a distance computer for this index. Not declared as an
    /// override here. NOTE(review): a raw pointer is returned and this
    /// header does not state who owns it -- confirm.
    DistanceComputer *get_distance_computer () const;

};


 /** An IVF implementation where the components of the residuals are
 * encoded with a scalar uniform quantizer. All distance computations
 * are asymmetric, so the encoded vectors are decoded and approximate
 * distances are computed.
 */

struct IndexIVFScalarQuantizer: IndexIVF {
    /// scalar quantizer used to encode the vectors
    ScalarQuantizer sq;
    /// presumably selects whether the residual, rather than the raw
    /// vector, is encoded -- TODO confirm in the implementation file
    bool by_residual;

    /** Constructor.
     *
     * @param quantizer index object handed to the constructor
     *                  (presumably the coarse quantizer of the IVF
     *                  structure -- TODO confirm)
     * @param d         dimensionality of the input vectors
     * @param nlist     presumably the number of inverted lists -- TODO confirm
     * @param qtype     type of scalar quantizer used to encode the vectors
     * @param metric    metric type, METRIC_L2 by default
     */
    IndexIVFScalarQuantizer(Index *quantizer, size_t d, size_t nlist,
                            ScalarQuantizer::QuantizerType qtype,
                            MetricType metric = METRIC_L2);

    /// Default constructor; the values it assigns are set in the
    /// implementation file, not visible from this header.
    IndexIVFScalarQuantizer();

    /// Overrides the base-class training hook; takes n vectors in x.
    void train_residual(idx_t n, const float* x) override;

    /// Encode the n vectors in x into codes; list_nos presumably holds
    /// one inverted-list number per vector -- TODO confirm.
    void encode_vectors(idx_t n, const float* x,
                        const idx_t *list_nos,
                        uint8_t * codes) const override;

    /// Add the n vectors in x with the ids in xids.
    /// NOTE(review): xids is declared as const long* whereas the other
    /// methods use idx_t; because of the override specifier this must
    /// match the base-class signature, so change both together or not
    /// at all.
    void add_with_ids(idx_t n, const float* x, const long* xids) override;

    /// Return a scanner for the inverted lists (overrides the
    /// base-class method). NOTE(review): a raw pointer is returned and
    /// this header does not state who owns it -- confirm.
    InvertedListScanner *get_InvertedListScanner (bool store_pairs)
        const override;


    /// Reconstruct into recons the vector stored at position offset of
    /// inverted list list_no (overrides the base-class method).
    void reconstruct_from_offset (long list_no, long offset,
                                  float* recons) const override;

};


}


#endif
forgotten sources 2017-07-18 17:52:23 +08:00			`/**`
			`* Copyright (c) 2015-present, Facebook, Inc.`
			`* All rights reserved.`
			`*`
changed license 2017-07-30 15:18:45 +08:00			`* This source code is licensed under the BSD+Patents license found in the`
forgotten sources 2017-07-18 17:52:23 +08:00			`* LICENSE file in the root directory of this source tree.`
			`*/`

Facebook sync (#504) * Facebook sync * Update swig wrappers. * Fix comment. 2018-07-06 20:12:11 +08:00			`// -*- c++ -*-`

forgotten sources 2017-07-18 17:52:23 +08:00			`#ifndef FAISS_INDEX_SCALAR_QUANTIZER_H`
			`#define FAISS_INDEX_SCALAR_QUANTIZER_H`

			`#include <stdint.h>`


			`#include <vector>`


			`#include "IndexIVF.h"`


			`namespace faiss {`

			`/**`
			`* The uniform quantizer has a range [vmin, vmax]. The range can be`
			`* the same for all dimensions (uniform) or specific per dimension`
			`* (default).`
			`*/`

Facebook sync (Mar 2019) (#756) Facebook sync (Mar 2019) - MatrixStats object - option to round coordinates during k-means optimization - alternative option for search in HNSW - moved stats and imbalance_factor of IndexIVF to InvertedLists object - range search for IVFScalarQuantizer - direct unit8 codec in ScalarQuantizer - renamed IndexProxy to IndexReplicas and moved to main Faiss - better support for PQ code assignment with external index - support for IMI2x16 (4B virtual centroids!) - support for k = 2048 search on GPU (instead of 1024) - most CUDA mem alloc failures throw exceptions instead of terminating on an assertion - support for renaming an ondisk invertedlists - interrupt computations with ctrl-C in python 2019-03-29 23:32:28 +08:00			`struct SQDistanceComputer;`
forgotten sources 2017-07-18 17:52:23 +08:00
			`struct ScalarQuantizer {`

			`enum QuantizerType {`
			`QT_8bit, ///< 8 bits per component`
			`QT_4bit, ///< 4 bits per component`
			`QT_8bit_uniform, ///< same, shared range for all dimensions`
			`QT_4bit_uniform,`
Facebook sync (#504) * Facebook sync * Update swig wrappers. * Fix comment. 2018-07-06 20:12:11 +08:00			`QT_fp16,`
Facebook sync (Mar 2019) (#756) Facebook sync (Mar 2019) - MatrixStats object - option to round coordinates during k-means optimization - alternative option for search in HNSW - moved stats and imbalance_factor of IndexIVF to InvertedLists object - range search for IVFScalarQuantizer - direct unit8 codec in ScalarQuantizer - renamed IndexProxy to IndexReplicas and moved to main Faiss - better support for PQ code assignment with external index - support for IMI2x16 (4B virtual centroids!) - support for k = 2048 search on GPU (instead of 1024) - most CUDA mem alloc failures throw exceptions instead of terminating on an assertion - support for renaming an ondisk invertedlists - interrupt computations with ctrl-C in python 2019-03-29 23:32:28 +08:00			`QT_8bit_direct, /// fast indexing of uint8s`
forgotten sources 2017-07-18 17:52:23 +08:00			`};`

			`QuantizerType qtype;`

			`/** The uniform encoder can estimate the range of representable`
			`* values of the unform encoder using different statistics. Here`
			`* rs = rangestat_arg */`

			`// rangestat_arg.`
			`enum RangeStat {`
			`RS_minmax, ///< [min - rs*(max-min), max + rs*(max-min)]`
			`RS_meanstd, ///< [mean - std * rs, mean + std * rs]`
			`RS_quantiles, ///< [Q(rs), Q(1-rs)]`
			`RS_optim, ///< alternate optimization of reconstruction error`
			`};`

			`RangeStat rangestat;`
			`float rangestat_arg;`

			`/// dimension of input vectors`
			`size_t d;`

			`/// bytes per vector`
			`size_t code_size;`

			`/// trained values (including the range)`
			`std::vector<float> trained;`

			`ScalarQuantizer (size_t d, QuantizerType qtype);`
			`ScalarQuantizer ();`

			`void train (size_t n, const float *x);`


			`/// same as compute_code for several vectors`
			`void compute_codes (const float * x,`
			`uint8_t * codes,`
			`size_t n) const ;`

			`/// decode a vector from a given code (or n vectors if third argument)`
sync with FB version 2017-01-09 - adding HNSW indexing method - simultaneous search and reconstruction for IndexIVFPQ 2018-01-09 22:42:06 +08:00			`void decode (const uint8_t *code, float *x, size_t n) const;`


Facebook sync (Mar 2019) (#756) Facebook sync (Mar 2019) - MatrixStats object - option to round coordinates during k-means optimization - alternative option for search in HNSW - moved stats and imbalance_factor of IndexIVF to InvertedLists object - range search for IVFScalarQuantizer - direct unit8 codec in ScalarQuantizer - renamed IndexProxy to IndexReplicas and moved to main Faiss - better support for PQ code assignment with external index - support for IMI2x16 (4B virtual centroids!) - support for k = 2048 search on GPU (instead of 1024) - most CUDA mem alloc failures throw exceptions instead of terminating on an assertion - support for renaming an ondisk invertedlists - interrupt computations with ctrl-C in python 2019-03-29 23:32:28 +08:00			`SQDistanceComputer *get_distance_computer (MetricType metric = METRIC_L2)`
sync with FB version 2017-01-09 - adding HNSW indexing method - simultaneous search and reconstruction for IndexIVFPQ 2018-01-09 22:42:06 +08:00			`const;`
forgotten sources 2017-07-18 17:52:23 +08:00
			`};`

Facebook sync (Mar 2019) (#756) Facebook sync (Mar 2019) - MatrixStats object - option to round coordinates during k-means optimization - alternative option for search in HNSW - moved stats and imbalance_factor of IndexIVF to InvertedLists object - range search for IVFScalarQuantizer - direct unit8 codec in ScalarQuantizer - renamed IndexProxy to IndexReplicas and moved to main Faiss - better support for PQ code assignment with external index - support for IMI2x16 (4B virtual centroids!) - support for k = 2048 search on GPU (instead of 1024) - most CUDA mem alloc failures throw exceptions instead of terminating on an assertion - support for renaming an ondisk invertedlists - interrupt computations with ctrl-C in python 2019-03-29 23:32:28 +08:00			`struct DistanceComputer;`
forgotten sources 2017-07-18 17:52:23 +08:00
			`struct IndexScalarQuantizer: Index {`
			`/// Used to encode the vectors`
			`ScalarQuantizer sq;`

			`/// Codes. Size ntotal * pq.code_size`
			`std::vector<uint8_t> codes;`

			`size_t code_size;`

			`/** Constructor.`
			`*`
			`* @param d dimensionality of the input vectors`
			`* @param M number of subquantizers`
			`* @param nbits number of bit per subvector index`
			`*/`
			`IndexScalarQuantizer (int d,`
			`ScalarQuantizer::QuantizerType qtype,`
			`MetricType metric = METRIC_L2);`

			`IndexScalarQuantizer ();`

			`void train(idx_t n, const float* x) override;`

			`void add(idx_t n, const float* x) override;`

			`void search(`
			`idx_t n,`
			`const float* x,`
			`idx_t k,`
			`float* distances,`
			`idx_t* labels) const override;`

			`void reset() override;`

			`void reconstruct_n(idx_t i0, idx_t ni, float* recons) const override;`

			`void reconstruct(idx_t key, float* recons) const override;`

Facebook sync (Mar 2019) (#756) Facebook sync (Mar 2019) - MatrixStats object - option to round coordinates during k-means optimization - alternative option for search in HNSW - moved stats and imbalance_factor of IndexIVF to InvertedLists object - range search for IVFScalarQuantizer - direct unit8 codec in ScalarQuantizer - renamed IndexProxy to IndexReplicas and moved to main Faiss - better support for PQ code assignment with external index - support for IMI2x16 (4B virtual centroids!) - support for k = 2048 search on GPU (instead of 1024) - most CUDA mem alloc failures throw exceptions instead of terminating on an assertion - support for renaming an ondisk invertedlists - interrupt computations with ctrl-C in python 2019-03-29 23:32:28 +08:00			`DistanceComputer *get_distance_computer () const;`

forgotten sources 2017-07-18 17:52:23 +08:00			`};`


			`/** An IVF implementation where the components of the residuals are`
			`* encoded with a scalar uniform quantizer. All distance computations`
			`* are asymmetric, so the encoded vectors are decoded and approximate`
			`* distances are computed.`
			`*/`

sync with FB version 2017-01-09 - adding HNSW indexing method - simultaneous search and reconstruction for IndexIVFPQ 2018-01-09 22:42:06 +08:00			`struct IndexIVFScalarQuantizer: IndexIVF {`
forgotten sources 2017-07-18 17:52:23 +08:00			`ScalarQuantizer sq;`
Facebook sync (Mar 2019) (#756) Facebook sync (Mar 2019) - MatrixStats object - option to round coordinates during k-means optimization - alternative option for search in HNSW - moved stats and imbalance_factor of IndexIVF to InvertedLists object - range search for IVFScalarQuantizer - direct unit8 codec in ScalarQuantizer - renamed IndexProxy to IndexReplicas and moved to main Faiss - better support for PQ code assignment with external index - support for IMI2x16 (4B virtual centroids!) - support for k = 2048 search on GPU (instead of 1024) - most CUDA mem alloc failures throw exceptions instead of terminating on an assertion - support for renaming an ondisk invertedlists - interrupt computations with ctrl-C in python 2019-03-29 23:32:28 +08:00			`bool by_residual;`
forgotten sources 2017-07-18 17:52:23 +08:00
			`IndexIVFScalarQuantizer(Index *quantizer, size_t d, size_t nlist,`
			`ScalarQuantizer::QuantizerType qtype,`
			`MetricType metric = METRIC_L2);`

			`IndexIVFScalarQuantizer();`

			`void train_residual(idx_t n, const float* x) override;`

Facebook sync (Dec 2018). (#660) * Add GpuIndexBinaryFlat * Add IndexBinaryHNSW 2018-12-20 00:48:35 +08:00			`void encode_vectors(idx_t n, const float* x,`
			`const idx_t *list_nos,`
			`uint8_t * codes) const override;`

forgotten sources 2017-07-18 17:52:23 +08:00			`void add_with_ids(idx_t n, const float* x, const long* xids) override;`

Facebook sync (Dec 2018). (#660) * Add GpuIndexBinaryFlat * Add IndexBinaryHNSW 2018-12-20 00:48:35 +08:00			`InvertedListScanner *get_InvertedListScanner (bool store_pairs)`
			`const override;`

forgotten sources 2017-07-18 17:52:23 +08:00
sync with FB version 2017-01-09 - adding HNSW indexing method - simultaneous search and reconstruction for IndexIVFPQ 2018-01-09 22:42:06 +08:00			`void reconstruct_from_offset (long list_no, long offset,`
			`float* recons) const override;`

forgotten sources 2017-07-18 17:52:23 +08:00			`};`


			`}`


			`#endif`