mirror of
https://github.com/facebookresearch/faiss.git
synced 2025-06-03 21:54:02 +08:00
various bugfixes from github issues kmean with some frozen centroids GPU better tiling for large flat datasets default AVX for vector ops
353 lines
45 KiB
HTML
353 lines
45 KiB
HTML
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
|
|
<html xmlns="http://www.w3.org/1999/xhtml">
|
|
<head>
|
|
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
|
|
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
|
|
<meta name="generator" content="Doxygen 1.8.5"/>
|
|
<title>Faiss: /data/users/matthijs/github_faiss/faiss/gpu/StandardGpuResources.cpp Source File</title>
|
|
<link href="tabs.css" rel="stylesheet" type="text/css"/>
|
|
<script type="text/javascript" src="jquery.js"></script>
|
|
<script type="text/javascript" src="dynsections.js"></script>
|
|
<link href="search/search.css" rel="stylesheet" type="text/css"/>
|
|
<script type="text/javascript" src="search/search.js"></script>
|
|
<script type="text/javascript">
|
|
$(document).ready(function() { searchBox.OnSelectItem(0); });
|
|
</script>
|
|
<link href="doxygen.css" rel="stylesheet" type="text/css" />
|
|
</head>
|
|
<body>
|
|
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
|
|
<div id="titlearea">
|
|
<table cellspacing="0" cellpadding="0">
|
|
<tbody>
|
|
<tr style="height: 56px;">
|
|
<td style="padding-left: 0.5em;">
|
|
<div id="projectname">Faiss
|
|
</div>
|
|
</td>
|
|
</tr>
|
|
</tbody>
|
|
</table>
|
|
</div>
|
|
<!-- end header part -->
|
|
<!-- Generated by Doxygen 1.8.5 -->
|
|
<script type="text/javascript">
|
|
var searchBox = new SearchBox("searchBox", "search",false,'Search');
|
|
</script>
|
|
<div id="navrow1" class="tabs">
|
|
<ul class="tablist">
|
|
<li><a href="index.html"><span>Main Page</span></a></li>
|
|
<li><a href="namespaces.html"><span>Namespaces</span></a></li>
|
|
<li><a href="annotated.html"><span>Classes</span></a></li>
|
|
<li class="current"><a href="files.html"><span>Files</span></a></li>
|
|
<li>
|
|
<div id="MSearchBox" class="MSearchBoxInactive">
|
|
<span class="left">
|
|
<img id="MSearchSelect" src="search/mag_sel.png"
|
|
onmouseover="return searchBox.OnSearchSelectShow()"
|
|
onmouseout="return searchBox.OnSearchSelectHide()"
|
|
alt=""/>
|
|
<input type="text" id="MSearchField" value="Search" accesskey="S"
|
|
onfocus="searchBox.OnSearchFieldFocus(true)"
|
|
onblur="searchBox.OnSearchFieldFocus(false)"
|
|
onkeyup="searchBox.OnSearchFieldChange(event)"/>
|
|
</span><span class="right">
|
|
<a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt=""/></a>
|
|
</span>
|
|
</div>
|
|
</li>
|
|
</ul>
|
|
</div>
|
|
<div id="navrow2" class="tabs2">
|
|
<ul class="tablist">
|
|
<li><a href="files.html"><span>File List</span></a></li>
|
|
</ul>
|
|
</div>
|
|
<!-- window showing the filter options -->
|
|
<div id="MSearchSelectWindow"
|
|
onmouseover="return searchBox.OnSearchSelectShow()"
|
|
onmouseout="return searchBox.OnSearchSelectHide()"
|
|
onkeydown="return searchBox.OnSearchSelectKey(event)">
|
|
<a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(0)"><span class="SelectionMark"> </span>All</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(1)"><span class="SelectionMark"> </span>Classes</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(2)"><span class="SelectionMark"> </span>Namespaces</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(3)"><span class="SelectionMark"> </span>Functions</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(4)"><span class="SelectionMark"> </span>Variables</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(5)"><span class="SelectionMark"> </span>Typedefs</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(6)"><span class="SelectionMark"> </span>Enumerations</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(7)"><span class="SelectionMark"> </span>Enumerator</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(8)"><span class="SelectionMark"> </span>Friends</a></div>
|
|
|
|
<!-- iframe showing the search results (closed by default) -->
|
|
<div id="MSearchResultsWindow">
|
|
<iframe src="javascript:void(0)" frameborder="0"
|
|
name="MSearchResults" id="MSearchResults">
|
|
</iframe>
|
|
</div>
|
|
|
|
<div id="nav-path" class="navpath">
|
|
<ul>
|
|
<li class="navelem"><a class="el" href="dir_6b3ae6988449b0834e9596fad5d75199.html">gpu</a></li> </ul>
|
|
</div>
|
|
</div><!-- top -->
|
|
<div class="header">
|
|
<div class="headertitle">
|
|
<div class="title">StandardGpuResources.cpp</div> </div>
|
|
</div><!--header-->
|
|
<div class="contents">
|
|
<div class="fragment"><div class="line"><a name="l00001"></a><span class="lineno"> 1</span> <span class="comment">/**</span></div>
|
|
<div class="line"><a name="l00002"></a><span class="lineno"> 2</span> <span class="comment"> * Copyright (c) 2015-present, Facebook, Inc.</span></div>
|
|
<div class="line"><a name="l00003"></a><span class="lineno"> 3</span> <span class="comment"> * All rights reserved.</span></div>
|
|
<div class="line"><a name="l00004"></a><span class="lineno"> 4</span> <span class="comment"> *</span></div>
|
|
<div class="line"><a name="l00005"></a><span class="lineno"> 5</span> <span class="comment"> * This source code is licensed under the BSD+Patents license found in the</span></div>
|
|
<div class="line"><a name="l00006"></a><span class="lineno"> 6</span> <span class="comment"> * LICENSE file in the root directory of this source tree.</span></div>
|
|
<div class="line"><a name="l00007"></a><span class="lineno"> 7</span> <span class="comment"> */</span></div>
|
|
<div class="line"><a name="l00008"></a><span class="lineno"> 8</span> </div>
|
|
<div class="line"><a name="l00009"></a><span class="lineno"> 9</span> <span class="comment">// Copyright 2004-present Facebook. All Rights Reserved.</span></div>
|
|
<div class="line"><a name="l00010"></a><span class="lineno"> 10</span> </div>
|
|
<div class="line"><a name="l00011"></a><span class="lineno"> 11</span> <span class="preprocessor">#include "StandardGpuResources.h"</span></div>
|
|
<div class="line"><a name="l00012"></a><span class="lineno"> 12</span> <span class="preprocessor">#include "../FaissAssert.h"</span></div>
|
|
<div class="line"><a name="l00013"></a><span class="lineno"> 13</span> </div>
|
|
<div class="line"><a name="l00014"></a><span class="lineno"> 14</span> <span class="keyword">namespace </span>faiss { <span class="keyword">namespace </span>gpu {</div>
|
|
<div class="line"><a name="l00015"></a><span class="lineno"> 15</span> </div>
|
|
<div class="line"><a name="l00016"></a><span class="lineno"> 16</span> <span class="keyword">namespace </span>{</div>
|
|
<div class="line"><a name="l00017"></a><span class="lineno"> 17</span> </div>
|
|
<div class="line"><a name="l00018"></a><span class="lineno"> 18</span> constexpr <span class="keywordtype">int</span> kNumStreams = 2;</div>
|
|
<div class="line"><a name="l00019"></a><span class="lineno"> 19</span> <span class="comment"></span></div>
|
|
<div class="line"><a name="l00020"></a><span class="lineno"> 20</span> <span class="comment">/// Use 18% of GPU memory for temporary space by default</span></div>
|
|
<div class="line"><a name="l00021"></a><span class="lineno"> 21</span> <span class="comment"></span>constexpr <span class="keywordtype">float</span> kDefaultTempMemFraction = 0.18f;</div>
|
|
<div class="line"><a name="l00022"></a><span class="lineno"> 22</span> <span class="comment"></span></div>
|
|
<div class="line"><a name="l00023"></a><span class="lineno"> 23</span> <span class="comment">/// Default pinned memory allocation size</span></div>
|
|
<div class="line"><a name="l00024"></a><span class="lineno"> 24</span> <span class="comment"></span>constexpr <span class="keywordtype">size_t</span> kDefaultPinnedMemoryAllocation = (size_t) 256 * 1024 * 1024;</div>
|
|
<div class="line"><a name="l00025"></a><span class="lineno"> 25</span> </div>
|
|
<div class="line"><a name="l00026"></a><span class="lineno"> 26</span> }</div>
|
|
<div class="line"><a name="l00027"></a><span class="lineno"> 27</span> </div>
|
|
<div class="line"><a name="l00028"></a><span class="lineno"> 28</span> StandardGpuResources::StandardGpuResources() :</div>
|
|
<div class="line"><a name="l00029"></a><span class="lineno"> 29</span>  pinnedMemAlloc_(nullptr),</div>
|
|
<div class="line"><a name="l00030"></a><span class="lineno"> 30</span>  pinnedMemAllocSize_(0),</div>
|
|
<div class="line"><a name="l00031"></a><span class="lineno"> 31</span>  tempMemFraction_(kDefaultTempMemFraction),</div>
|
|
<div class="line"><a name="l00032"></a><span class="lineno"> 32</span>  tempMemSize_(0),</div>
|
|
<div class="line"><a name="l00033"></a><span class="lineno"> 33</span>  useFraction_(true),</div>
|
|
<div class="line"><a name="l00034"></a><span class="lineno"> 34</span>  pinnedMemSize_(kDefaultPinnedMemoryAllocation) {</div>
|
|
<div class="line"><a name="l00035"></a><span class="lineno"> 35</span> }</div>
|
|
<div class="line"><a name="l00036"></a><span class="lineno"> 36</span> </div>
|
|
<div class="line"><a name="l00037"></a><span class="lineno"> 37</span> StandardGpuResources::~StandardGpuResources() {</div>
|
|
<div class="line"><a name="l00038"></a><span class="lineno"> 38</span>  <span class="keywordflow">for</span> (<span class="keyword">auto</span>& entry : defaultStreams_) {</div>
|
|
<div class="line"><a name="l00039"></a><span class="lineno"> 39</span>  DeviceScope scope(entry.first);</div>
|
|
<div class="line"><a name="l00040"></a><span class="lineno"> 40</span> </div>
|
|
<div class="line"><a name="l00041"></a><span class="lineno"> 41</span>  <span class="keyword">auto</span> it = userDefaultStreams_.find(entry.first);</div>
|
|
<div class="line"><a name="l00042"></a><span class="lineno"> 42</span>  <span class="keywordflow">if</span> (it == userDefaultStreams_.end()) {</div>
|
|
<div class="line"><a name="l00043"></a><span class="lineno"> 43</span>  <span class="comment">// The user did not specify this stream, thus we are the ones</span></div>
|
|
<div class="line"><a name="l00044"></a><span class="lineno"> 44</span>  <span class="comment">// who have created it</span></div>
|
|
<div class="line"><a name="l00045"></a><span class="lineno"> 45</span>  CUDA_VERIFY(cudaStreamDestroy(entry.second));</div>
|
|
<div class="line"><a name="l00046"></a><span class="lineno"> 46</span>  }</div>
|
|
<div class="line"><a name="l00047"></a><span class="lineno"> 47</span>  }</div>
|
|
<div class="line"><a name="l00048"></a><span class="lineno"> 48</span> </div>
|
|
<div class="line"><a name="l00049"></a><span class="lineno"> 49</span>  <span class="keywordflow">for</span> (<span class="keyword">auto</span>& entry : alternateStreams_) {</div>
|
|
<div class="line"><a name="l00050"></a><span class="lineno"> 50</span>  DeviceScope scope(entry.first);</div>
|
|
<div class="line"><a name="l00051"></a><span class="lineno"> 51</span> </div>
|
|
<div class="line"><a name="l00052"></a><span class="lineno"> 52</span>  <span class="keywordflow">for</span> (<span class="keyword">auto</span> stream : entry.second) {</div>
|
|
<div class="line"><a name="l00053"></a><span class="lineno"> 53</span>  CUDA_VERIFY(cudaStreamDestroy(stream));</div>
|
|
<div class="line"><a name="l00054"></a><span class="lineno"> 54</span>  }</div>
|
|
<div class="line"><a name="l00055"></a><span class="lineno"> 55</span>  }</div>
|
|
<div class="line"><a name="l00056"></a><span class="lineno"> 56</span> </div>
|
|
<div class="line"><a name="l00057"></a><span class="lineno"> 57</span>  <span class="keywordflow">for</span> (<span class="keyword">auto</span>& entry : asyncCopyStreams_) {</div>
|
|
<div class="line"><a name="l00058"></a><span class="lineno"> 58</span>  DeviceScope scope(entry.first);</div>
|
|
<div class="line"><a name="l00059"></a><span class="lineno"> 59</span> </div>
|
|
<div class="line"><a name="l00060"></a><span class="lineno"> 60</span>  CUDA_VERIFY(cudaStreamDestroy(entry.second));</div>
|
|
<div class="line"><a name="l00061"></a><span class="lineno"> 61</span>  }</div>
|
|
<div class="line"><a name="l00062"></a><span class="lineno"> 62</span> </div>
|
|
<div class="line"><a name="l00063"></a><span class="lineno"> 63</span>  <span class="keywordflow">for</span> (<span class="keyword">auto</span>& entry : blasHandles_) {</div>
|
|
<div class="line"><a name="l00064"></a><span class="lineno"> 64</span>  DeviceScope scope(entry.first);</div>
|
|
<div class="line"><a name="l00065"></a><span class="lineno"> 65</span> </div>
|
|
<div class="line"><a name="l00066"></a><span class="lineno"> 66</span>  <span class="keyword">auto</span> blasStatus = cublasDestroy(entry.second);</div>
|
|
<div class="line"><a name="l00067"></a><span class="lineno"> 67</span>  FAISS_ASSERT(blasStatus == CUBLAS_STATUS_SUCCESS);</div>
|
|
<div class="line"><a name="l00068"></a><span class="lineno"> 68</span>  }</div>
|
|
<div class="line"><a name="l00069"></a><span class="lineno"> 69</span> </div>
|
|
<div class="line"><a name="l00070"></a><span class="lineno"> 70</span>  <span class="keywordflow">if</span> (pinnedMemAlloc_) {</div>
|
|
<div class="line"><a name="l00071"></a><span class="lineno"> 71</span>  CUDA_VERIFY(cudaFreeHost(pinnedMemAlloc_));</div>
|
|
<div class="line"><a name="l00072"></a><span class="lineno"> 72</span>  }</div>
|
|
<div class="line"><a name="l00073"></a><span class="lineno"> 73</span> }</div>
|
|
<div class="line"><a name="l00074"></a><span class="lineno"> 74</span> </div>
|
|
<div class="line"><a name="l00075"></a><span class="lineno"> 75</span> <span class="keywordtype">void</span></div>
|
|
<div class="line"><a name="l00076"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a6431477a7328ac147797b3b4e3fcf651"> 76</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a6431477a7328ac147797b3b4e3fcf651">StandardGpuResources::noTempMemory</a>() {</div>
|
|
<div class="line"><a name="l00077"></a><span class="lineno"> 77</span>  <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a367102e65b16bfdc7a32770a4f5854a6">setTempMemory</a>(0);</div>
|
|
<div class="line"><a name="l00078"></a><span class="lineno"> 78</span> }</div>
|
|
<div class="line"><a name="l00079"></a><span class="lineno"> 79</span> </div>
|
|
<div class="line"><a name="l00080"></a><span class="lineno"> 80</span> <span class="keywordtype">void</span></div>
|
|
<div class="line"><a name="l00081"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a367102e65b16bfdc7a32770a4f5854a6"> 81</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a367102e65b16bfdc7a32770a4f5854a6">StandardGpuResources::setTempMemory</a>(<span class="keywordtype">size_t</span> size) {</div>
|
|
<div class="line"><a name="l00082"></a><span class="lineno"> 82</span>  useFraction_ = <span class="keyword">false</span>;</div>
|
|
<div class="line"><a name="l00083"></a><span class="lineno"> 83</span>  tempMemSize_ = size;</div>
|
|
<div class="line"><a name="l00084"></a><span class="lineno"> 84</span> }</div>
|
|
<div class="line"><a name="l00085"></a><span class="lineno"> 85</span> </div>
|
|
<div class="line"><a name="l00086"></a><span class="lineno"> 86</span> <span class="keywordtype">void</span></div>
|
|
<div class="line"><a name="l00087"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a99ee4e66cb497873de804b9bd9042705"> 87</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a99ee4e66cb497873de804b9bd9042705">StandardGpuResources::setTempMemoryFraction</a>(<span class="keywordtype">float</span> fraction) {</div>
|
|
<div class="line"><a name="l00088"></a><span class="lineno"> 88</span>  FAISS_ASSERT(fraction >= 0.0f && fraction <= 0.5f);</div>
|
|
<div class="line"><a name="l00089"></a><span class="lineno"> 89</span>  useFraction_ = <span class="keyword">true</span>;</div>
|
|
<div class="line"><a name="l00090"></a><span class="lineno"> 90</span>  tempMemFraction_ = fraction;</div>
|
|
<div class="line"><a name="l00091"></a><span class="lineno"> 91</span> }</div>
|
|
<div class="line"><a name="l00092"></a><span class="lineno"> 92</span> </div>
|
|
<div class="line"><a name="l00093"></a><span class="lineno"> 93</span> <span class="keywordtype">void</span></div>
|
|
<div class="line"><a name="l00094"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#af9acb23ac323f85fa5dab4ed968ccd51"> 94</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#af9acb23ac323f85fa5dab4ed968ccd51">StandardGpuResources::setPinnedMemory</a>(<span class="keywordtype">size_t</span> size) {</div>
|
|
<div class="line"><a name="l00095"></a><span class="lineno"> 95</span>  <span class="comment">// Should not call this after devices have been initialized</span></div>
|
|
<div class="line"><a name="l00096"></a><span class="lineno"> 96</span>  FAISS_ASSERT(defaultStreams_.size() == 0);</div>
|
|
<div class="line"><a name="l00097"></a><span class="lineno"> 97</span>  FAISS_ASSERT(!pinnedMemAlloc_);</div>
|
|
<div class="line"><a name="l00098"></a><span class="lineno"> 98</span> </div>
|
|
<div class="line"><a name="l00099"></a><span class="lineno"> 99</span>  pinnedMemSize_ = size;</div>
|
|
<div class="line"><a name="l00100"></a><span class="lineno"> 100</span> }</div>
|
|
<div class="line"><a name="l00101"></a><span class="lineno"> 101</span> </div>
|
|
<div class="line"><a name="l00102"></a><span class="lineno"> 102</span> <span class="keywordtype">void</span></div>
|
|
<div class="line"><a name="l00103"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a5924b424c36dba8300866f1b98c438cb"> 103</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a5924b424c36dba8300866f1b98c438cb">StandardGpuResources::setDefaultStream</a>(<span class="keywordtype">int</span> device, cudaStream_t stream) {</div>
|
|
<div class="line"><a name="l00104"></a><span class="lineno"> 104</span>  <span class="keyword">auto</span> it = defaultStreams_.find(device);</div>
|
|
<div class="line"><a name="l00105"></a><span class="lineno"> 105</span>  <span class="keywordflow">if</span> (it != defaultStreams_.end()) {</div>
|
|
<div class="line"><a name="l00106"></a><span class="lineno"> 106</span>  <span class="comment">// Replace this stream with the user stream</span></div>
|
|
<div class="line"><a name="l00107"></a><span class="lineno"> 107</span>  CUDA_VERIFY(cudaStreamDestroy(it->second));</div>
|
|
<div class="line"><a name="l00108"></a><span class="lineno"> 108</span>  it->second = stream;</div>
|
|
<div class="line"><a name="l00109"></a><span class="lineno"> 109</span>  }</div>
|
|
<div class="line"><a name="l00110"></a><span class="lineno"> 110</span> </div>
|
|
<div class="line"><a name="l00111"></a><span class="lineno"> 111</span>  userDefaultStreams_[device] = stream;</div>
|
|
<div class="line"><a name="l00112"></a><span class="lineno"> 112</span> }</div>
|
|
<div class="line"><a name="l00113"></a><span class="lineno"> 113</span> </div>
|
|
<div class="line"><a name="l00114"></a><span class="lineno"> 114</span> <span class="keywordtype">void</span></div>
|
|
<div class="line"><a name="l00115"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a5374f336f1957c266d7a5c185eb962a1"> 115</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a5374f336f1957c266d7a5c185eb962a1">StandardGpuResources::setDefaultNullStreamAllDevices</a>() {</div>
|
|
<div class="line"><a name="l00116"></a><span class="lineno"> 116</span>  <span class="keywordflow">for</span> (<span class="keywordtype">int</span> dev = 0; dev < getNumDevices(); ++dev) {</div>
|
|
<div class="line"><a name="l00117"></a><span class="lineno"> 117</span>  <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a5924b424c36dba8300866f1b98c438cb">setDefaultStream</a>(dev, <span class="keyword">nullptr</span>);</div>
|
|
<div class="line"><a name="l00118"></a><span class="lineno"> 118</span>  }</div>
|
|
<div class="line"><a name="l00119"></a><span class="lineno"> 119</span> }</div>
|
|
<div class="line"><a name="l00120"></a><span class="lineno"> 120</span> </div>
|
|
<div class="line"><a name="l00121"></a><span class="lineno"> 121</span> <span class="keywordtype">void</span></div>
|
|
<div class="line"><a name="l00122"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adb2729678638ed89f7b8b38470f96056"> 122</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adb2729678638ed89f7b8b38470f96056">StandardGpuResources::initializeForDevice</a>(<span class="keywordtype">int</span> device) {</div>
|
|
<div class="line"><a name="l00123"></a><span class="lineno"> 123</span>  <span class="comment">// Use default streams as a marker for whether or not a certain</span></div>
|
|
<div class="line"><a name="l00124"></a><span class="lineno"> 124</span>  <span class="comment">// device has been initialized</span></div>
|
|
<div class="line"><a name="l00125"></a><span class="lineno"> 125</span>  <span class="keywordflow">if</span> (defaultStreams_.count(device) != 0) {</div>
|
|
<div class="line"><a name="l00126"></a><span class="lineno"> 126</span>  <span class="keywordflow">return</span>;</div>
|
|
<div class="line"><a name="l00127"></a><span class="lineno"> 127</span>  }</div>
|
|
<div class="line"><a name="l00128"></a><span class="lineno"> 128</span> </div>
|
|
<div class="line"><a name="l00129"></a><span class="lineno"> 129</span>  <span class="comment">// If this is the first device that we're initializing, create our</span></div>
|
|
<div class="line"><a name="l00130"></a><span class="lineno"> 130</span>  <span class="comment">// pinned memory allocation</span></div>
|
|
<div class="line"><a name="l00131"></a><span class="lineno"> 131</span>  <span class="keywordflow">if</span> (defaultStreams_.empty() && pinnedMemSize_ > 0) {</div>
|
|
<div class="line"><a name="l00132"></a><span class="lineno"> 132</span>  CUDA_VERIFY(cudaHostAlloc(&pinnedMemAlloc_,</div>
|
|
<div class="line"><a name="l00133"></a><span class="lineno"> 133</span>  pinnedMemSize_,</div>
|
|
<div class="line"><a name="l00134"></a><span class="lineno"> 134</span>  cudaHostAllocDefault));</div>
|
|
<div class="line"><a name="l00135"></a><span class="lineno"> 135</span>  pinnedMemAllocSize_ = pinnedMemSize_;</div>
|
|
<div class="line"><a name="l00136"></a><span class="lineno"> 136</span>  }</div>
|
|
<div class="line"><a name="l00137"></a><span class="lineno"> 137</span> </div>
|
|
<div class="line"><a name="l00138"></a><span class="lineno"> 138</span>  FAISS_ASSERT(device < getNumDevices());</div>
|
|
<div class="line"><a name="l00139"></a><span class="lineno"> 139</span>  <a class="code" href="classfaiss_1_1gpu_1_1DeviceScope.html">DeviceScope</a> scope(device);</div>
|
|
<div class="line"><a name="l00140"></a><span class="lineno"> 140</span> </div>
|
|
<div class="line"><a name="l00141"></a><span class="lineno"> 141</span>  <span class="comment">// Make sure that device properties for all devices are cached</span></div>
|
|
<div class="line"><a name="l00142"></a><span class="lineno"> 142</span>  <span class="keyword">auto</span>& prop = getDeviceProperties(device);</div>
|
|
<div class="line"><a name="l00143"></a><span class="lineno"> 143</span> </div>
|
|
<div class="line"><a name="l00144"></a><span class="lineno"> 144</span>  <span class="comment">// Also check to make sure we meet our minimum compute capability (3.0)</span></div>
|
|
<div class="line"><a name="l00145"></a><span class="lineno"> 145</span>  FAISS_ASSERT_FMT(prop.major >= 3,</div>
|
|
<div class="line"><a name="l00146"></a><span class="lineno"> 146</span>  <span class="stringliteral">"Device id %d with CC %d.%d not supported, "</span></div>
|
|
<div class="line"><a name="l00147"></a><span class="lineno"> 147</span>  <span class="stringliteral">"need 3.0+ compute capability"</span>,</div>
|
|
<div class="line"><a name="l00148"></a><span class="lineno"> 148</span>  device, prop.major, prop.minor);</div>
|
|
<div class="line"><a name="l00149"></a><span class="lineno"> 149</span> </div>
|
|
<div class="line"><a name="l00150"></a><span class="lineno"> 150</span>  <span class="comment">// Create streams</span></div>
|
|
<div class="line"><a name="l00151"></a><span class="lineno"> 151</span>  cudaStream_t defaultStream = 0;</div>
|
|
<div class="line"><a name="l00152"></a><span class="lineno"> 152</span>  <span class="keyword">auto</span> it = userDefaultStreams_.find(device);</div>
|
|
<div class="line"><a name="l00153"></a><span class="lineno"> 153</span>  <span class="keywordflow">if</span> (it != userDefaultStreams_.end()) {</div>
|
|
<div class="line"><a name="l00154"></a><span class="lineno"> 154</span>  <span class="comment">// We already have a stream provided by the user</span></div>
|
|
<div class="line"><a name="l00155"></a><span class="lineno"> 155</span>  defaultStream = it->second;</div>
|
|
<div class="line"><a name="l00156"></a><span class="lineno"> 156</span>  } <span class="keywordflow">else</span> {</div>
|
|
<div class="line"><a name="l00157"></a><span class="lineno"> 157</span>  CUDA_VERIFY(cudaStreamCreateWithFlags(&defaultStream,</div>
|
|
<div class="line"><a name="l00158"></a><span class="lineno"> 158</span>  cudaStreamNonBlocking));</div>
|
|
<div class="line"><a name="l00159"></a><span class="lineno"> 159</span>  }</div>
|
|
<div class="line"><a name="l00160"></a><span class="lineno"> 160</span> </div>
|
|
<div class="line"><a name="l00161"></a><span class="lineno"> 161</span>  defaultStreams_[device] = defaultStream;</div>
|
|
<div class="line"><a name="l00162"></a><span class="lineno"> 162</span> </div>
|
|
<div class="line"><a name="l00163"></a><span class="lineno"> 163</span>  cudaStream_t asyncCopyStream = 0;</div>
|
|
<div class="line"><a name="l00164"></a><span class="lineno"> 164</span>  CUDA_VERIFY(cudaStreamCreateWithFlags(&asyncCopyStream,</div>
|
|
<div class="line"><a name="l00165"></a><span class="lineno"> 165</span>  cudaStreamNonBlocking));</div>
|
|
<div class="line"><a name="l00166"></a><span class="lineno"> 166</span> </div>
|
|
<div class="line"><a name="l00167"></a><span class="lineno"> 167</span>  asyncCopyStreams_[device] = asyncCopyStream;</div>
|
|
<div class="line"><a name="l00168"></a><span class="lineno"> 168</span> </div>
|
|
<div class="line"><a name="l00169"></a><span class="lineno"> 169</span>  std::vector<cudaStream_t> deviceStreams;</div>
|
|
<div class="line"><a name="l00170"></a><span class="lineno"> 170</span>  <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j < kNumStreams; ++j) {</div>
|
|
<div class="line"><a name="l00171"></a><span class="lineno"> 171</span>  cudaStream_t stream = 0;</div>
|
|
<div class="line"><a name="l00172"></a><span class="lineno"> 172</span>  CUDA_VERIFY(cudaStreamCreateWithFlags(&stream,</div>
|
|
<div class="line"><a name="l00173"></a><span class="lineno"> 173</span>  cudaStreamNonBlocking));</div>
|
|
<div class="line"><a name="l00174"></a><span class="lineno"> 174</span> </div>
|
|
<div class="line"><a name="l00175"></a><span class="lineno"> 175</span>  deviceStreams.push_back(stream);</div>
|
|
<div class="line"><a name="l00176"></a><span class="lineno"> 176</span>  }</div>
|
|
<div class="line"><a name="l00177"></a><span class="lineno"> 177</span> </div>
|
|
<div class="line"><a name="l00178"></a><span class="lineno"> 178</span>  alternateStreams_[device] = std::move(deviceStreams);</div>
|
|
<div class="line"><a name="l00179"></a><span class="lineno"> 179</span> </div>
|
|
<div class="line"><a name="l00180"></a><span class="lineno"> 180</span>  <span class="comment">// Create cuBLAS handle</span></div>
|
|
<div class="line"><a name="l00181"></a><span class="lineno"> 181</span>  cublasHandle_t blasHandle = 0;</div>
|
|
<div class="line"><a name="l00182"></a><span class="lineno"> 182</span>  <span class="keyword">auto</span> blasStatus = cublasCreate(&blasHandle);</div>
|
|
<div class="line"><a name="l00183"></a><span class="lineno"> 183</span>  FAISS_ASSERT(blasStatus == CUBLAS_STATUS_SUCCESS);</div>
|
|
<div class="line"><a name="l00184"></a><span class="lineno"> 184</span>  blasHandles_[device] = blasHandle;</div>
|
|
<div class="line"><a name="l00185"></a><span class="lineno"> 185</span> </div>
|
|
<div class="line"><a name="l00186"></a><span class="lineno"> 186</span>  <span class="keywordtype">size_t</span> toAlloc = 0;</div>
|
|
<div class="line"><a name="l00187"></a><span class="lineno"> 187</span>  <span class="keywordflow">if</span> (useFraction_) {</div>
|
|
<div class="line"><a name="l00188"></a><span class="lineno"> 188</span>  <span class="keywordtype">size_t</span> devFree = 0;</div>
|
|
<div class="line"><a name="l00189"></a><span class="lineno"> 189</span>  <span class="keywordtype">size_t</span> devTotal = 0;</div>
|
|
<div class="line"><a name="l00190"></a><span class="lineno"> 190</span> </div>
|
|
<div class="line"><a name="l00191"></a><span class="lineno"> 191</span>  CUDA_VERIFY(cudaMemGetInfo(&devFree, &devTotal));</div>
|
|
<div class="line"><a name="l00192"></a><span class="lineno"> 192</span> </div>
|
|
<div class="line"><a name="l00193"></a><span class="lineno"> 193</span>  toAlloc = (size_t) (tempMemFraction_ * devTotal);</div>
|
|
<div class="line"><a name="l00194"></a><span class="lineno"> 194</span>  } <span class="keywordflow">else</span> {</div>
|
|
<div class="line"><a name="l00195"></a><span class="lineno"> 195</span>  toAlloc = tempMemSize_;</div>
|
|
<div class="line"><a name="l00196"></a><span class="lineno"> 196</span>  }</div>
|
|
<div class="line"><a name="l00197"></a><span class="lineno"> 197</span> </div>
|
|
<div class="line"><a name="l00198"></a><span class="lineno"> 198</span>  FAISS_ASSERT(memory_.count(device) == 0);</div>
|
|
<div class="line"><a name="l00199"></a><span class="lineno"> 199</span>  memory_.emplace(device,</div>
|
|
<div class="line"><a name="l00200"></a><span class="lineno"> 200</span>  std::unique_ptr<StackDeviceMemory>(</div>
|
|
<div class="line"><a name="l00201"></a><span class="lineno"> 201</span>  <span class="keyword">new</span> <a class="code" href="classfaiss_1_1gpu_1_1StackDeviceMemory.html">StackDeviceMemory</a>(device, toAlloc)));</div>
|
|
<div class="line"><a name="l00202"></a><span class="lineno"> 202</span> }</div>
|
|
<div class="line"><a name="l00203"></a><span class="lineno"> 203</span> </div>
|
|
<div class="line"><a name="l00204"></a><span class="lineno"> 204</span> cublasHandle_t</div>
|
|
<div class="line"><a name="l00205"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a7560435c7f45fd59d94ee947330a58da"> 205</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a7560435c7f45fd59d94ee947330a58da">StandardGpuResources::getBlasHandle</a>(<span class="keywordtype">int</span> device) {</div>
|
|
<div class="line"><a name="l00206"></a><span class="lineno"> 206</span>  <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adb2729678638ed89f7b8b38470f96056">initializeForDevice</a>(device);</div>
|
|
<div class="line"><a name="l00207"></a><span class="lineno"> 207</span>  <span class="keywordflow">return</span> blasHandles_[device];</div>
|
|
<div class="line"><a name="l00208"></a><span class="lineno"> 208</span> }</div>
|
|
<div class="line"><a name="l00209"></a><span class="lineno"> 209</span> </div>
|
|
<div class="line"><a name="l00210"></a><span class="lineno"> 210</span> cudaStream_t</div>
|
|
<div class="line"><a name="l00211"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a954f34ef68fd36b8d502ca3a21f7e8a8"> 211</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a954f34ef68fd36b8d502ca3a21f7e8a8">StandardGpuResources::getDefaultStream</a>(<span class="keywordtype">int</span> device) {</div>
|
|
<div class="line"><a name="l00212"></a><span class="lineno"> 212</span>  <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adb2729678638ed89f7b8b38470f96056">initializeForDevice</a>(device);</div>
|
|
<div class="line"><a name="l00213"></a><span class="lineno"> 213</span>  <span class="keywordflow">return</span> defaultStreams_[device];</div>
|
|
<div class="line"><a name="l00214"></a><span class="lineno"> 214</span> }</div>
|
|
<div class="line"><a name="l00215"></a><span class="lineno"> 215</span> </div>
|
|
<div class="line"><a name="l00216"></a><span class="lineno"> 216</span> std::vector<cudaStream_t></div>
|
|
<div class="line"><a name="l00217"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a9ebf68604864cb890a4c2e3d0a6f9952"> 217</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a9ebf68604864cb890a4c2e3d0a6f9952">StandardGpuResources::getAlternateStreams</a>(<span class="keywordtype">int</span> device) {</div>
|
|
<div class="line"><a name="l00218"></a><span class="lineno"> 218</span>  <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adb2729678638ed89f7b8b38470f96056">initializeForDevice</a>(device);</div>
|
|
<div class="line"><a name="l00219"></a><span class="lineno"> 219</span>  <span class="keywordflow">return</span> alternateStreams_[device];</div>
|
|
<div class="line"><a name="l00220"></a><span class="lineno"> 220</span> }</div>
|
|
<div class="line"><a name="l00221"></a><span class="lineno"> 221</span> </div>
|
|
<div class="line"><a name="l00222"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a35da92117dd4b47ee773444af716d634"> 222</a></span> <a class="code" href="classfaiss_1_1gpu_1_1DeviceMemory.html">DeviceMemory</a>& <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a35da92117dd4b47ee773444af716d634">StandardGpuResources::getMemoryManager</a>(<span class="keywordtype">int</span> device) {</div>
|
|
<div class="line"><a name="l00223"></a><span class="lineno"> 223</span>  <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adb2729678638ed89f7b8b38470f96056">initializeForDevice</a>(device);</div>
|
|
<div class="line"><a name="l00224"></a><span class="lineno"> 224</span>  <span class="keywordflow">return</span> *memory_[device];</div>
|
|
<div class="line"><a name="l00225"></a><span class="lineno"> 225</span> }</div>
|
|
<div class="line"><a name="l00226"></a><span class="lineno"> 226</span> </div>
|
|
<div class="line"><a name="l00227"></a><span class="lineno"> 227</span> std::pair<void*, size_t></div>
|
|
<div class="line"><a name="l00228"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#ae7418f127cac2ac663ac0ae2e6f88e8d"> 228</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#ae7418f127cac2ac663ac0ae2e6f88e8d">StandardGpuResources::getPinnedMemory</a>() {</div>
|
|
<div class="line"><a name="l00229"></a><span class="lineno"> 229</span>  <span class="keywordflow">return</span> std::make_pair(pinnedMemAlloc_, pinnedMemAllocSize_);</div>
|
|
<div class="line"><a name="l00230"></a><span class="lineno"> 230</span> }</div>
|
|
<div class="line"><a name="l00231"></a><span class="lineno"> 231</span> </div>
|
|
<div class="line"><a name="l00232"></a><span class="lineno"> 232</span> cudaStream_t</div>
|
|
<div class="line"><a name="l00233"></a><span class="lineno"><a class="line" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adf89d4731c826df889f51fe42287b15d"> 233</a></span> <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adf89d4731c826df889f51fe42287b15d">StandardGpuResources::getAsyncCopyStream</a>(<span class="keywordtype">int</span> device) {</div>
|
|
<div class="line"><a name="l00234"></a><span class="lineno"> 234</span>  <a class="code" href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adb2729678638ed89f7b8b38470f96056">initializeForDevice</a>(device);</div>
|
|
<div class="line"><a name="l00235"></a><span class="lineno"> 235</span>  <span class="keywordflow">return</span> asyncCopyStreams_[device];</div>
|
|
<div class="line"><a name="l00236"></a><span class="lineno"> 236</span> }</div>
|
|
<div class="line"><a name="l00237"></a><span class="lineno"> 237</span> </div>
|
|
<div class="line"><a name="l00238"></a><span class="lineno"> 238</span> } } <span class="comment">// namespace</span></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a5924b424c36dba8300866f1b98c438cb"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a5924b424c36dba8300866f1b98c438cb">faiss::gpu::StandardGpuResources::setDefaultStream</a></div><div class="ttdeci">void setDefaultStream(int device, cudaStream_t stream)</div><div class="ttdoc">Called to change the stream for work ordering. </div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00103">StandardGpuResources.cpp:103</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a7560435c7f45fd59d94ee947330a58da"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a7560435c7f45fd59d94ee947330a58da">faiss::gpu::StandardGpuResources::getBlasHandle</a></div><div class="ttdeci">cublasHandle_t getBlasHandle(int device) override</div><div class="ttdoc">Returns the cuBLAS handle that we use for the given device. </div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00205">StandardGpuResources.cpp:205</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a99ee4e66cb497873de804b9bd9042705"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a99ee4e66cb497873de804b9bd9042705">faiss::gpu::StandardGpuResources::setTempMemoryFraction</a></div><div class="ttdeci">void setTempMemoryFraction(float fraction)</div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00087">StandardGpuResources.cpp:87</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a6431477a7328ac147797b3b4e3fcf651"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a6431477a7328ac147797b3b4e3fcf651">faiss::gpu::StandardGpuResources::noTempMemory</a></div><div class="ttdeci">void noTempMemory()</div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00076">StandardGpuResources.cpp:76</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_adb2729678638ed89f7b8b38470f96056"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adb2729678638ed89f7b8b38470f96056">faiss::gpu::StandardGpuResources::initializeForDevice</a></div><div class="ttdeci">void initializeForDevice(int device) override</div><div class="ttdoc">Internal system calls. </div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00122">StandardGpuResources.cpp:122</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_adf89d4731c826df889f51fe42287b15d"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#adf89d4731c826df889f51fe42287b15d">faiss::gpu::StandardGpuResources::getAsyncCopyStream</a></div><div class="ttdeci">cudaStream_t getAsyncCopyStream(int device) override</div><div class="ttdoc">Returns the stream on which we perform async CPU &lt;-&gt; GPU copies. </div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00233">StandardGpuResources.cpp:233</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a35da92117dd4b47ee773444af716d634"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a35da92117dd4b47ee773444af716d634">faiss::gpu::StandardGpuResources::getMemoryManager</a></div><div class="ttdeci">DeviceMemory & getMemoryManager(int device) override</div><div class="ttdoc">Returns the temporary memory manager for the given device. </div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00222">StandardGpuResources.cpp:222</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a367102e65b16bfdc7a32770a4f5854a6"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a367102e65b16bfdc7a32770a4f5854a6">faiss::gpu::StandardGpuResources::setTempMemory</a></div><div class="ttdeci">void setTempMemory(size_t size)</div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00081">StandardGpuResources.cpp:81</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_af9acb23ac323f85fa5dab4ed968ccd51"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#af9acb23ac323f85fa5dab4ed968ccd51">faiss::gpu::StandardGpuResources::setPinnedMemory</a></div><div class="ttdeci">void setPinnedMemory(size_t size)</div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00094">StandardGpuResources.cpp:94</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a954f34ef68fd36b8d502ca3a21f7e8a8"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a954f34ef68fd36b8d502ca3a21f7e8a8">faiss::gpu::StandardGpuResources::getDefaultStream</a></div><div class="ttdeci">cudaStream_t getDefaultStream(int device) override</div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00211">StandardGpuResources.cpp:211</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a5374f336f1957c266d7a5c185eb962a1"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a5374f336f1957c266d7a5c185eb962a1">faiss::gpu::StandardGpuResources::setDefaultNullStreamAllDevices</a></div><div class="ttdeci">void setDefaultNullStreamAllDevices()</div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00115">StandardGpuResources.cpp:115</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1DeviceScope_html"><div class="ttname"><a href="classfaiss_1_1gpu_1_1DeviceScope.html">faiss::gpu::DeviceScope</a></div><div class="ttdef"><b>Definition:</b> <a href="DeviceUtils_8h_source.html#l00065">DeviceUtils.h:65</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StackDeviceMemory_html"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StackDeviceMemory.html">faiss::gpu::StackDeviceMemory</a></div><div class="ttdef"><b>Definition:</b> <a href="StackDeviceMemory_8h_source.html#l00022">StackDeviceMemory.h:22</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1DeviceMemory_html"><div class="ttname"><a href="classfaiss_1_1gpu_1_1DeviceMemory.html">faiss::gpu::DeviceMemory</a></div><div class="ttdoc">Manages temporary memory allocations on a GPU device. </div><div class="ttdef"><b>Definition:</b> <a href="DeviceMemory_8h_source.html#l00046">DeviceMemory.h:46</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_ae7418f127cac2ac663ac0ae2e6f88e8d"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#ae7418f127cac2ac663ac0ae2e6f88e8d">faiss::gpu::StandardGpuResources::getPinnedMemory</a></div><div class="ttdeci">std::pair< void *, size_t > getPinnedMemory() override</div><div class="ttdoc">Returns the available CPU pinned memory buffer. </div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00228">StandardGpuResources.cpp:228</a></div></div>
|
|
<div class="ttc" id="classfaiss_1_1gpu_1_1StandardGpuResources_html_a9ebf68604864cb890a4c2e3d0a6f9952"><div class="ttname"><a href="classfaiss_1_1gpu_1_1StandardGpuResources.html#a9ebf68604864cb890a4c2e3d0a6f9952">faiss::gpu::StandardGpuResources::getAlternateStreams</a></div><div class="ttdeci">std::vector< cudaStream_t > getAlternateStreams(int device) override</div><div class="ttdoc">Returns the set of alternative streams that we use for the given device. </div><div class="ttdef"><b>Definition:</b> <a href="StandardGpuResources_8cpp_source.html#l00217">StandardGpuResources.cpp:217</a></div></div>
|
|
</div><!-- fragment --></div><!-- contents -->
|
|
<!-- start footer part -->
|
|
<hr class="footer"/><address class="footer"><small>
|
|
Generated by  <a href="http://www.doxygen.org/index.html">
|
|
<img class="footer" src="doxygen.png" alt="doxygen"/>
|
|
</a> 1.8.5
|
|
</small></address>
|
|
</body>
|
|
</html>
|