docs/html/VectorTransform_8h_source.html

 /**

  * Copyright (c) 2015-present, Facebook, Inc.

  * All rights reserved.

  *

  * This source code is licensed under the CC-by-NC license found in the

  * LICENSE file in the root directory of this source tree.

  */


 // Copyright 2004-present Facebook. All Rights Reserved.

 // -*- c++ -*-


 #ifndef FAISS_VECTOR_TRANSFORM_H

 #define FAISS_VECTOR_TRANSFORM_H


 /** Defines a few objects that apply transformations to a set of

  * vectors. Often these are pre-processing steps.

  */


 #include <vector>


 #include "Index.h"


 namespace faiss {


 /** Any transformation applied on a set of vectors */

 struct VectorTransform {

     using idx_t = Index::idx_t;

     int d_in;        ///< input dimension
     int d_out;       ///< output dimension

     /// set if the transform does not require training, or if
     /// training is done already
     bool is_trained;

     /// Records the input/output dimensions; a freshly constructed
     /// transform is flagged as trained.
     explicit VectorTransform (int d_in = 0, int d_out = 0):
         d_in(d_in), d_out(d_out), is_trained(true)
     {}

     /** Perform training on a representative set of vectors. Does
      * nothing by default.
      *
      * @param n      nb of training vectors
      * @param x      training vectors, size n * d (presumably d = d_in)
      */
     virtual void train (idx_t n, const float *x);

     /** apply the transformation, return a newly allocated matrix
      *
      * NOTE(review): the matching deallocation for the returned buffer
      * is decided by the out-of-line definition -- confirm there.
      *
      * @param     x size n * d_in
      * @return    size n * d_out
      */
     float *apply (idx_t n, const float * x) const;

     /// same as apply, but the result buffer xt is pre-allocated by the
     /// caller; every concrete transform has to implement this
     virtual void apply_noalloc (idx_t n, const float * x,
                                 float *xt) const = 0;

     /// reverse transformation. May not be implemented or may return
     /// approximate result
     virtual void reverse_transform (idx_t n, const float * xt,
                                     float *x) const;

     virtual ~VectorTransform () = default;

 };


 /** Generic linear transformation, with bias term applied on output

  * y = A * x + b

  */

 struct LinearTransform: VectorTransform {


     bool have_bias; ///! whether to use the bias term


     /// Transformation matrix, size d_out * d_in

     std::vector<float> A;


      /// bias vector, size d_out

     std::vector<float> b;


     /// both d_in > d_out and d_out < d_in are supported

     explicit LinearTransform (int d_in = 0, int d_out = 0,

                               bool have_bias = false);


     /// same as apply, but result is pre-allocated

     virtual void apply_noalloc (idx_t n, const float * x,

                                 float *xt) const;


     /// compute x = A^T * (x - b)

     /// is reverse transform if A has orthonormal lines

     void transform_transpose (idx_t n, const float * y,

                               float *x) const;


     // ratio between # training vectors and dimension

     size_t max_points_per_d;

     bool verbose;


     // subsamples training set if there are too many vectors

     const float *maybe_subsample_train_set (Index::idx_t *n, const float *x);


     virtual ~LinearTransform () {}


 };


 /// Randomly rotate a set of vectors

 struct RandomRotationMatrix: LinearTransform {


      /// both d_in > d_out and d_out < d_in are supported

      RandomRotationMatrix (int d_in, int d_out):

          LinearTransform(d_in, d_out, false) {}


      /// must be called before the transform is used

      void init(int seed);


      virtual void reverse_transform (idx_t n, const float * xt,

                                      float *x) const override;


      RandomRotationMatrix () {}

 };


 /** Applies a principal component analysis on a set of vectors,

  *  with optionally whitening and random rotation. */

 struct PCAMatrix: LinearTransform {


     /** after transformation the components are multiplied by

      * eigenvalues^eigen_power

      *

      * =0: no whitening

      * =-2: full whitening

      */

     float eigen_power;


     /// random rotation after PCA

     bool random_rotation;


     /// try to distribute output eigenvectors in this many bins

     int balanced_bins;


     /// Mean, size d_in

     std::vector<float> mean;


     /// eigenvalues of covariance matrix (= squared singular values)

     std::vector<float> eigenvalues;


     /// PCA matrix, size d_in * d_in

     std::vector<float> PCAMat;


     // the final matrix is computed after random rotation and/or whitening

     explicit PCAMatrix (int d_in = 0, int d_out = 0,

                         float eigen_power = 0, bool random_rotation = false);


     virtual void train (Index::idx_t n, const float *x) override;


     virtual void reverse_transform (idx_t n, const float * xt,

                                     float *x) const override;


     /// copy pre-trained PCA matrix

     void copy_from (const PCAMatrix & other);


     /// called after mean, PCAMat and eigenvalues are computed

     void prepare_Ab();


 };


 /** Applies a rotation to align the dimensions with a PQ to minimize

  *  the reconstruction error. Can be used before an IndexPQ or an

  *  IndexIVFPQ. The method is the non-parametric version described in:

  *

  * "Optimized Product Quantization for Approximate Nearest Neighbor Search"

  * Tiezheng Ge, Kaiming He, Qifa Ke, Jian Sun, CVPR'13

  *

  */

 struct OPQMatrix: LinearTransform {


     int M;          ///< nb of subquantizers

     int niter;      ///< Number of outer training iterations

     int niter_pq;   ///< Number of training iterations for the PQ

     int niter_pq_0; ///< same, for the first outer iteration

     /// if there are too many training points, resample

     int max_points_per_d;

     bool verbose;


     /// if d2 != -1, output vectors of this dimension

     explicit OPQMatrix (int d = 0, int M = 1, int d2 = -1);


     virtual void train (Index::idx_t n, const float *x) override;


     virtual void reverse_transform (idx_t n, const float * xt,

                                     float *x) const override;

 };


 /** remap dimensions for input vectors, possibly inserting 0s

  * strictly speaking this is also a linear transform but we don't want

  * to compute it with matrix multiplies */

 struct RemapDimensionsTransform: VectorTransform {


     /// map from output dimension to input, size d_out

     /// -1 -> set output to 0

     std::vector<int> map;


     RemapDimensionsTransform (int d_in, int d_out, const int *map);


     /// remap input to output, skipping or inserting dimensions as needed

     /// if uniform: distribute dimensions uniformly

     /// otherwise just take the d_out first ones.

     RemapDimensionsTransform (int d_in, int d_out, bool uniform = true);


     virtual void apply_noalloc (idx_t n, const float * x,

                                 float *xt) const override;


     /// reverse transform correct only when the mapping is a permuation

     virtual void reverse_transform (idx_t n, const float * xt,

                                     float *x) const override;


     RemapDimensionsTransform () {}

 };


 /** Index that applies a chain of VectorTransform objects to vectors

  *  before handing them over to a sub-index */

 struct IndexPreTransform: Index {


     std::vector<VectorTransform *> chain;  ///! chain of tranforms

     Index * index;            ///! the sub-index


     bool own_fields;          ///! whether pointers are deleted in destructor


     explicit IndexPreTransform (Index *index);


     IndexPreTransform ();


     /// ltrans is the last transform before the index

     IndexPreTransform (VectorTransform * ltrans, Index * index);


     void prepend_transform (VectorTransform * ltrans);


     virtual void set_typename () override;


     virtual void train (idx_t n, const float *x) override;


     virtual void add (idx_t n, const float *x) override;


     virtual void add_with_ids (idx_t n, const float * x, const long *xids)

         override;


     virtual void reset () override;


     /** removes IDs from the index. Not supported by all indexes.

      */

     virtual long remove_ids (const IDSelector & sel) override;


     virtual void search (

             idx_t n, const float *x, idx_t k,

             float *distances, idx_t *labels) const override;


     void reconstruct_n (idx_t i0, idx_t ni, float *recons)

         const override;


     /// apply the transforms in the chain. The returned float * may be

     /// equal to x, otherwise it should be deallocated.

     const float * apply_chain (idx_t n, const float *x) const;


     virtual ~IndexPreTransform ();


 };


 } // namespace faiss


 #endif

faiss::LinearTransform::transform_transpose
void transform_transpose(idx_t n, const float *y, float *x) const
Definition: VectorTransform.cpp:130

faiss::IndexPreTransform::index
Index * index
the sub-index
Definition: VectorTransform.h:241

faiss::RandomRotationMatrix
Randomly rotate a set of vectors.
Definition: VectorTransform.h:118

faiss::OPQMatrix::niter
int niter
Number of outer training iterations.
Definition: VectorTransform.h:191

faiss::RandomRotationMatrix::RandomRotationMatrix
RandomRotationMatrix(int d_in, int d_out)
both d_in &gt; d_out and d_in &lt; d_out are supported
Definition: VectorTransform.h:121

faiss::RandomRotationMatrix::init
void init(int seed)
must be called before the transform is used
Definition: VectorTransform.cpp:181

faiss::IndexPreTransform::reset
virtual void reset() override
removes all elements from the database.
Definition: VectorTransform.cpp:769

faiss::OPQMatrix::niter_pq
int niter_pq
Number of training iterations for the PQ.
Definition: VectorTransform.h:192

faiss::LinearTransform::A
std::vector< float > A
Transformation matrix, size d_out * d_in
Definition: VectorTransform.h:84

faiss::PCAMatrix::eigen_power
float eigen_power
Definition: VectorTransform.h:144

faiss::IDSelector
Definition: AuxIndexStructures.h:58

faiss::LinearTransform::LinearTransform
LinearTransform(int d_in=0, int d_out=0, bool have_bias=false)
both d_in &gt; d_out and d_in &lt; d_out are supported
Definition: VectorTransform.cpp:95

faiss::PCAMatrix
Definition: VectorTransform.h:136

faiss::VectorTransform::VectorTransform
VectorTransform(int d_in=0, int d_out=0)
stores d_in and d_out and sets is_trained to true
Definition: VectorTransform.h:36

faiss::OPQMatrix
Definition: VectorTransform.h:188

faiss::PCAMatrix::train
virtual void train(Index::idx_t n, const float *x) override
Definition: VectorTransform.cpp:227

faiss::IndexPreTransform
Definition: VectorTransform.h:238

faiss::PCAMatrix::mean
std::vector< float > mean
Mean, size d_in.
Definition: VectorTransform.h:153

faiss::RemapDimensionsTransform::map
std::vector< int > map
Definition: VectorTransform.h:216

faiss::IndexPreTransform::apply_chain
const float * apply_chain(idx_t n, const float *x) const
Definition: VectorTransform.cpp:726

faiss::PCAMatrix::PCAMat
std::vector< float > PCAMat
PCA matrix, size d_in * d_in.
Definition: VectorTransform.h:159

faiss::IndexPreTransform::train
virtual void train(idx_t n, const float *x) override
Definition: VectorTransform.cpp:698

faiss::LinearTransform::b
std::vector< float > b
bias vector, size d_out
Definition: VectorTransform.h:87

faiss::OPQMatrix::max_points_per_d
int max_points_per_d
if there are too many training points, resample
Definition: VectorTransform.h:195

faiss::LinearTransform
Definition: VectorTransform.h:78

faiss::OPQMatrix::train
virtual void train(Index::idx_t n, const float *x) override
Definition: VectorTransform.cpp:469

faiss::PCAMatrix::balanced_bins
int balanced_bins
try to distribute output eigenvectors in this many bins
Definition: VectorTransform.h:150

faiss::VectorTransform::is_trained
bool is_trained
Definition: VectorTransform.h:43

faiss::Index::idx_t
long idx_t
all indices are this type
Definition: Index.h:64

faiss::IndexPreTransform::reconstruct_n
void reconstruct_n(idx_t i0, idx_t ni, float *recons) const override
Definition: VectorTransform.cpp:781

faiss::LinearTransform::apply_noalloc
virtual void apply_noalloc(idx_t n, const float *x, float *xt) const
same as apply, but result is pre-allocated
Definition: VectorTransform.cpp:101

faiss::VectorTransform
Definition: VectorTransform.h:29

faiss::IndexPreTransform::own_fields
bool own_fields
whether pointers are deleted in destructor
Definition: VectorTransform.h:243

faiss::OPQMatrix::niter_pq_0
int niter_pq_0
Definition: VectorTransform.h:193

faiss::OPQMatrix::reverse_transform
virtual void reverse_transform(idx_t n, const float *xt, float *x) const override
Definition: VectorTransform.cpp:630

faiss::VectorTransform::train
virtual void train(idx_t n, const float *x)
Definition: VectorTransform.cpp:76

faiss::RandomRotationMatrix::reverse_transform
virtual void reverse_transform(idx_t n, const float *xt, float *x) const override
Definition: VectorTransform.cpp:206

faiss::VectorTransform::reverse_transform
virtual void reverse_transform(idx_t n, const float *xt, float *x) const
Definition: VectorTransform.cpp:81

faiss::RemapDimensionsTransform::reverse_transform
virtual void reverse_transform(idx_t n, const float *xt, float *x) const override
reverse transform correct only when the mapping is a permutation
Definition: VectorTransform.cpp:848

faiss::RemapDimensionsTransform
Definition: VectorTransform.h:211

faiss::PCAMatrix::reverse_transform
virtual void reverse_transform(idx_t n, const float *xt, float *x) const override
Definition: VectorTransform.cpp:444

faiss::PCAMatrix::copy_from
void copy_from(const PCAMatrix &other)
copy pre-trained PCA matrix
Definition: VectorTransform.cpp:339

faiss::VectorTransform::d_out
int d_out
output dimension
Definition: VectorTransform.h:34

faiss::OPQMatrix::OPQMatrix
OPQMatrix(int d=0, int M=1, int d2=-1)
if d2 != -1, output vectors of this dimension
Definition: VectorTransform.cpp:457

faiss::Index
Definition: Index.h:61

faiss::PCAMatrix::prepare_Ab
void prepare_Ab()
called after mean, PCAMat and eigenvalues are computed
Definition: VectorTransform.cpp:349

faiss::IndexPreTransform::add
virtual void add(idx_t n, const float *x) override
Definition: VectorTransform.cpp:737

faiss::RemapDimensionsTransform::apply_noalloc
virtual void apply_noalloc(idx_t n, const float *x, float *xt) const override
same as apply, but result is pre-allocated
Definition: VectorTransform.cpp:836

faiss::PCAMatrix::eigenvalues
std::vector< float > eigenvalues
eigenvalues of covariance matrix (= squared singular values)
Definition: VectorTransform.h:156

faiss::IndexPreTransform::search
virtual void search(idx_t n, const float *x, idx_t k, float *distances, idx_t *labels) const override
Definition: VectorTransform.cpp:759

faiss::IndexPreTransform::add_with_ids
virtual void add_with_ids(idx_t n, const float *x, const long *xids) override
Definition: VectorTransform.cpp:746

faiss::PCAMatrix::random_rotation
bool random_rotation
random rotation after PCA
Definition: VectorTransform.h:147

faiss::VectorTransform::apply
float * apply(idx_t n, const float *x) const
Definition: VectorTransform.cpp:68

faiss::IndexPreTransform::remove_ids
virtual long remove_ids(const IDSelector &sel) override
Definition: VectorTransform.cpp:774

faiss::VectorTransform::apply_noalloc
virtual void apply_noalloc(idx_t n, const float *x, float *xt) const =0
same as apply, but result is pre-allocated

faiss::OPQMatrix::M
int M
nb of subquantizers
Definition: VectorTransform.h:190