docs/html/StandardGpuResources_8h_source.html

 /**

  * Copyright (c) 2015-present, Facebook, Inc.

  * All rights reserved.

  *

  * This source code is licensed under the BSD+Patents license found in the

  * LICENSE file in the root directory of this source tree.

  */


 #pragma once


 #include "GpuResources.h"
 #include "utils/StackDeviceMemory.h"
 #include "utils/DeviceUtils.h"
 #include <memory>
 #include <unordered_map>
 #include <utility>
 #include <vector>


 namespace faiss { namespace gpu {


 /// Default implementation of GpuResources that allocates a cuBLAS
 /// stream and 2 streams for use, as well as temporary memory
 ///
 /// Instances cannot be copied; see the deleted copy operations below.
 class StandardGpuResources : public GpuResources {
  public:
   StandardGpuResources();

   ~StandardGpuResources() override;

   /// Copying is explicitly disabled. A memberwise copy could never
   /// compile anyway (memory_ stores std::unique_ptr values), so
   /// deleting the operations here turns accidental copies into a clear
   /// error at the call site and makes type traits report the truth.
   /// NOTE(review): the destructor is defined in the .cpp; presumably it
   /// releases the per-device handles and the pinned buffer, which would
   /// make a copy unsafe as well -- confirm.
   StandardGpuResources(const StandardGpuResources&) = delete;
   StandardGpuResources& operator=(const StandardGpuResources&) = delete;

   /// Disable allocation of temporary memory; all temporary memory
   /// requests will call cudaMalloc / cudaFree at the point of use
   void noTempMemory();

   /// Specify that we wish to use a certain fixed size of memory on
   /// all devices as temporary memory
   /// @param size  amount of temporary memory to use on each device
   ///              (presumably in bytes -- confirm against the .cpp)
   void setTempMemory(size_t size);

   /// Specify that we wish to use a certain fraction of memory on
   /// all devices as temporary memory
   /// @param fraction  fraction of device memory to use as temporary
   ///                  memory (valid range is not visible here)
   void setTempMemoryFraction(float fraction);

   /// Set amount of pinned memory to allocate, for async GPU <-> CPU
   /// transfers
   /// @param size  amount of pinned memory to allocate
   void setPinnedMemory(size_t size);

   /// Called to change the stream for work ordering
   /// @param device  device whose work-ordering stream is changed
   /// @param stream  stream to order work on for that device
   void setDefaultStream(int device, cudaStream_t stream);

   /// Called to change the work ordering streams to the null stream
   /// for all devices
   void setDefaultNullStreamAllDevices();

   /// Enable or disable the warning about not having enough temporary memory
   /// when cudaMalloc gets called
   /// @param b  true to enable the warning, false to disable it
   void setCudaMallocWarning(bool b);

  public:
   /// Internal system calls

   /// Sets up this object's resources for the given device.
   /// NOTE(review): the exact work done is defined in the .cpp.
   void initializeForDevice(int device) override;

   /// Returns the cuBLAS handle that we use for the given device
   cublasHandle_t getBlasHandle(int device) override;

   /// Returns the stream that work is ordered on for the given device.
   /// NOTE(review): presumably a stream set via setDefaultStream takes
   /// precedence over our own default stream -- confirm in the .cpp.
   cudaStream_t getDefaultStream(int device) override;

   /// Returns the set of alternative streams that we use for the given
   /// device
   std::vector<cudaStream_t> getAlternateStreams(int device) override;

   /// Returns the temporary memory manager for the given device
   DeviceMemory& getMemoryManager(int device) override;

   /// Returns the available CPU pinned memory buffer, as a
   /// (pointer, size) pair
   std::pair<void*, size_t> getPinnedMemory() override;

   /// Returns the stream on which we perform async CPU <-> GPU copies
   cudaStream_t getAsyncCopyStream(int device) override;

  private:
   /// Our default stream that work is ordered on, one per each device
   std::unordered_map<int, cudaStream_t> defaultStreams_;

   /// This contains particular streams as set by the user for
   /// ordering, if any
   std::unordered_map<int, cudaStream_t> userDefaultStreams_;

   /// Other streams we can use, per each device
   std::unordered_map<int, std::vector<cudaStream_t>> alternateStreams_;

   /// Async copy stream to use for GPU <-> CPU pinned memory copies
   std::unordered_map<int, cudaStream_t> asyncCopyStreams_;

   /// cuBLAS handle for each device
   std::unordered_map<int, cublasHandle_t> blasHandles_;

   /// Temporary memory provider, per each device
   std::unordered_map<int, std::unique_ptr<StackDeviceMemory>> memory_;

   /// Pinned memory allocation for use with this GPU
   void* pinnedMemAlloc_;

   /// Size of the allocation that pinnedMemAlloc_ points to
   /// (presumably in bytes -- confirm against the .cpp)
   size_t pinnedMemAllocSize_;

   /// By default, we reserve this fraction of memory on all devices
   float tempMemFraction_;

   /// Another option is to use a specified amount of memory on all
   /// devices
   size_t tempMemSize_;

   /// Whether we look at tempMemFraction_ or tempMemSize_
   bool useFraction_;

   /// Amount of pinned memory we should allocate
   size_t pinnedMemSize_;

   /// Whether or not a warning upon cudaMalloc is generated
   bool cudaMallocWarning_;
 };


 } } // namespace

faiss::gpu::StandardGpuResources::setDefaultStream
void setDefaultStream(int device, cudaStream_t stream)
Called to change the stream for work ordering.
Definition: StandardGpuResources.cpp:104

faiss::gpu::StandardGpuResources::getBlasHandle
cublasHandle_t getBlasHandle(int device) override
Returns the cuBLAS handle that we use for the given device.
Definition: StandardGpuResources.cpp:218

faiss::gpu::StandardGpuResources::setTempMemoryFraction
void setTempMemoryFraction(float fraction)
Definition: StandardGpuResources.cpp:88

faiss::gpu::StandardGpuResources::noTempMemory
void noTempMemory()
Definition: StandardGpuResources.cpp:76

faiss::gpu::StandardGpuResources::initializeForDevice
void initializeForDevice(int device) override
Internal system calls.
Definition: StandardGpuResources.cpp:132

faiss::gpu::StandardGpuResources::getAsyncCopyStream
cudaStream_t getAsyncCopyStream(int device) override
Returns the stream on which we perform async CPU <-> GPU copies.
Definition: StandardGpuResources.cpp:246

faiss::gpu::StandardGpuResources::getMemoryManager
DeviceMemory & getMemoryManager(int device) override
Returns the temporary memory manager for the given device.
Definition: StandardGpuResources.cpp:235

faiss::gpu::GpuResources
Definition: GpuResources.h:22

faiss::gpu::StandardGpuResources::setCudaMallocWarning
void setCudaMallocWarning(bool b)
Definition: StandardGpuResources.cpp:123

faiss::gpu::StandardGpuResources::setTempMemory
void setTempMemory(size_t size)
Definition: StandardGpuResources.cpp:82

faiss::gpu::StandardGpuResources
Definition: StandardGpuResources.h:22

faiss::gpu::StandardGpuResources::setPinnedMemory
void setPinnedMemory(size_t size)
Definition: StandardGpuResources.cpp:95

faiss::gpu::StandardGpuResources::getDefaultStream
cudaStream_t getDefaultStream(int device) override
Definition: StandardGpuResources.cpp:224

faiss::gpu::StandardGpuResources::setDefaultNullStreamAllDevices
void setDefaultNullStreamAllDevices()
Definition: StandardGpuResources.cpp:116

faiss::gpu::DeviceMemory
Manages temporary memory allocations on a GPU device.
Definition: DeviceMemory.h:45

faiss::gpu::StandardGpuResources::getPinnedMemory
std::pair< void *, size_t > getPinnedMemory() override
Returns the available CPU pinned memory buffer.
Definition: StandardGpuResources.cpp:241

faiss::gpu::StandardGpuResources::getAlternateStreams
std::vector< cudaStream_t > getAlternateStreams(int device) override
Returns the set of alternative streams that we use for the given device.
Definition: StandardGpuResources.cpp:230